Spaces:
Build error
Build error
added tokenization
Browse files
app.py
CHANGED
@@ -84,7 +84,7 @@ def get_documents(document_text, crawl=crawl_urls):
|
|
84 |
|
85 |
if tokenizing == "Don't (use entire body as document)":
|
86 |
document_paragraphs = [body]
|
87 |
-
elif tokenizing == 'Newline (split by
|
88 |
document_paragraphs = [n for n in body.split('\n') if len(n) > 50]
|
89 |
|
90 |
for document_paragraph in document_paragraphs:
|
|
|
84 |
|
85 |
if tokenizing == "Don't (use entire body as document)":
|
86 |
document_paragraphs = [body]
|
87 |
+
elif tokenizing == 'Newline (split by newline character)':
|
88 |
document_paragraphs = [n for n in body.split('\n') if len(n) > 50]
|
89 |
|
90 |
for document_paragraph in document_paragraphs:
|