Spaces:
Sleeping
Sleeping
th8m0z
committed on
Commit
·
562d913
1
Parent(s):
f48c06b
no changes, test commit
Browse files - functions.py +0 -1
functions.py
CHANGED
@@ -37,7 +37,6 @@ def pdf_to_text(path, start_page=1, end_page=None):
|
|
37 |
|
38 |
# converts a text into a list of chunks
|
39 |
def text_to_chunks(texts, word_length=150, start_page=1, file_number=1):
|
40 |
-
|
41 |
filtered_texts = [''.join(char for char in text if ord(char) < 128) for text in texts]
|
42 |
text_toks = [t.split(' ') for t in filtered_texts]
|
43 |
chunks = []
|
|
|
37 |
|
38 |
# converts a text into a list of chunks
|
39 |
def text_to_chunks(texts, word_length=150, start_page=1, file_number=1):
|
|
|
40 |
filtered_texts = [''.join(char for char in text if ord(char) < 128) for text in texts]
|
41 |
text_toks = [t.split(' ') for t in filtered_texts]
|
42 |
chunks = []
|