Spaces:
Sleeping
Sleeping
Commit
·
9919b54
1
Parent(s):
7e6ffb4
update
Browse files
src/application/text/search_detection.py
CHANGED
|
@@ -189,14 +189,16 @@ def find_paragraph_source(text, text_index, sentences_df):
|
|
| 189 |
|
| 190 |
|
| 191 |
print(f"sen: {sentences_df}")
|
| 192 |
-
for
|
| 193 |
-
print(f"{
|
| 194 |
-
if
|
|
|
|
|
|
|
| 195 |
continue
|
| 196 |
|
| 197 |
# find content in new url
|
| 198 |
aligned_sentence = check_paraphrase(
|
| 199 |
-
text[
|
| 200 |
page_text,
|
| 201 |
url,
|
| 202 |
)
|
|
|
|
| 189 |
|
| 190 |
|
| 191 |
print(f"sen: {sentences_df}")
|
| 192 |
+
for idx, _ in enumerate(sentences_df):
|
| 193 |
+
print(f"{idx}")
|
| 194 |
+
if idx > len(sentences_df):
|
| 195 |
+
break
|
| 196 |
+
if sentences_df.loc[idx, "url"] is not None:
|
| 197 |
continue
|
| 198 |
|
| 199 |
# find content in new url
|
| 200 |
aligned_sentence = check_paraphrase(
|
| 201 |
+
text[idx],
|
| 202 |
page_text,
|
| 203 |
url,
|
| 204 |
)
|