Spaces:
Running
Running
Update app.py
Browse files
app.py
CHANGED
|
@@ -27,8 +27,11 @@ df3_questions = df3["question"].values
|
|
| 27 |
df3_links = df3["url"].values
|
| 28 |
|
| 29 |
def arabic_word_tokenize(text):
|
|
|
|
|
|
|
| 30 |
return re.findall(r'\w+', text)
|
| 31 |
|
|
|
|
| 32 |
def compute_word_overlap(query, questions):
|
| 33 |
query_words = set(arabic_word_tokenize(query))
|
| 34 |
overlaps = []
|
|
|
|
| 27 |
df3_links = df3["url"].values
|
| 28 |
|
| 29 |
def arabic_word_tokenize(text):
    """Split *text* into word tokens.

    Args:
        text: The string to tokenize. Any non-``str`` value is treated as
            containing no words.

    Returns:
        A list of tokens in order of appearance. The list is empty for
        non-string input or when the text contains no word characters.
    """
    # Non-string input yields no tokens instead of raising inside ``re``.
    if not isinstance(text, str):
        return []
    # ``\w`` on its own does not match Arabic tashkeel (the combining marks
    # U+064B-U+065F and U+0670), so a vocalised word would be cut into
    # single letters at every diacritic. Accepting those marks inside a
    # token keeps such words whole; unvocalised text tokenizes as before.
    return re.findall(r'[\w\u064B-\u065F\u0670]+', text)
|
| 33 |
|
| 34 |
+
|
| 35 |
def compute_word_overlap(query, questions):
|
| 36 |
query_words = set(arabic_word_tokenize(query))
|
| 37 |
overlaps = []
|