Spaces:
Runtime error
Runtime error
import re
def preprocessing_text(text):
    """Flatten a chat transcript into concatenated "Speaker:body" chunks.

    The transcript is cut at every speaker header, i.e. the word
    "Comprador", "Mediador" or "Vendedor" followed by a parenthesised
    part such as "Comprador (Ana)". Anything before the first header is
    discarded. Each message runs from its header up to the next header.

    For every message:
      * it is dropped when its first line contains "para Vendedor"
        (text sent to the seller);
      * attachment file names ending in .jpeg/.jpg/.png/.pdf are removed,
        together with whatever precedes them on the same line;
      * the output chunk is the first space-delimited token of the
        message, a colon, and everything after the second newline. The
        first two lines are not copied (the second line is presumably a
        timestamp -- confirm against the export format).

    Args:
        text: Raw transcript as a single string.

    Returns:
        The chunks concatenated with no separator. A message that has
        fewer than three lines contributes only "Speaker:" with an empty
        body. Returns "" when no speaker header is found.
    """
    # NOTE(review): "Comprador*" means "Comprado" plus zero or more "r";
    # ".*?" may have been intended. Alternatives kept as-is so matching
    # does not change. The outer group makes re.split keep the headers.
    header_pattern = (
        r"(Comprador*.?\(.*?\)|Mediador*.?\(.*?\)|Vendedor*.?\(.*?\))"
    )
    attachment_pattern = r".*?\.jpeg|.*?\.jpg|.*?\.png|.*?\.pdf"

    # With one capturing group the split result is
    # [preamble, header1, rest1, header2, rest2, ...].
    pieces = re.split(header_pattern, text)
    messages = [
        header + rest for header, rest in zip(pieces[1::2], pieces[2::2])
    ]

    # Remove text sent to the seller. Build a new list instead of removing
    # while iterating, which skipped the element after each removal.
    kept = [
        message
        for message in messages
        if "para Vendedor" not in message.split("\n", 1)[0]
    ]

    chunks = []
    for message in kept:
        cleaned = re.sub(attachment_pattern, "", message)
        speaker = cleaned.split(" ")[0]
        lines = cleaned.split("\n", 2)
        # Guard against messages with no third line (previously IndexError).
        body = lines[2] if len(lines) > 2 else ""
        chunks.append(speaker + ":" + body)
    return "".join(chunks)