Spaces:
Running
on
T4
Running
on
T4
Update ppt_chunker.py
Browse files
- ppt_chunker.py +2 -2
ppt_chunker.py
CHANGED
@@ -65,10 +65,10 @@ def ppt_chunk(file_like, model):
|
|
65 |
list_items = list_items - duplicate
|
66 |
|
67 |
current_chunk.append("\n".join(list_items))
|
68 |
-
list_items
|
69 |
|
70 |
chunks.append([elem.id, current_chunk])
|
71 |
-
current_chunk
|
72 |
print(f'NEW CHUNK: {chunks[-1]}')
|
73 |
else:
|
74 |
if elem.text[-1] in NON_ENDING_PUNCT:
|
|
|
65 |
list_items = list_items - duplicate
|
66 |
|
67 |
current_chunk.append("\n".join(list_items))
|
68 |
+
list_items = set()
|
69 |
|
70 |
chunks.append([elem.id, current_chunk])
|
71 |
+
current_chunk = []
|
72 |
print(f'NEW CHUNK: {chunks[-1]}')
|
73 |
else:
|
74 |
if elem.text[-1] in NON_ENDING_PUNCT:
|