Spaces:
Running
Running
Update app.py
Browse files
app.py
CHANGED
@@ -27,8 +27,11 @@ df3_questions = df3["question"].values
|
|
27 |
df3_links = df3["url"].values
|
28 |
|
29 |
def arabic_word_tokenize(text):
|
|
|
|
|
30 |
return re.findall(r'\w+', text)
|
31 |
|
|
|
32 |
def compute_word_overlap(query, questions):
|
33 |
query_words = set(arabic_word_tokenize(query))
|
34 |
overlaps = []
|
|
|
27 |
df3_links = df3["url"].values
|
28 |
|
29 |
def arabic_word_tokenize(text):
|
30 |
+
if not isinstance(text, str):
|
31 |
+
return []
|
32 |
return re.findall(r'\w+', text)
|
33 |
|
34 |
+
|
35 |
def compute_word_overlap(query, questions):
|
36 |
query_words = set(arabic_word_tokenize(query))
|
37 |
overlaps = []
|