Spaces:

bstraehle
/

grady

Running

bstraehle committed on May 6

Commit

193c7ed

verified ·

1 Parent(s): 3d3e0e3

Update util.py

Files changed (1) hide show

util.py CHANGED Viewed

@@ -1,6 +1,7 @@
 import os
 import pandas as pd
 from docx import Document
 def get_questions(file_path, level):
     df = pd.read_json(file_path, lines=True)
@@ -38,4 +39,20 @@ def read_docx(file_path):
     for para in doc.paragraphs:
         text.append(para.text)
-    return "\n".join(text)

 import os
 import pandas as pd
 from docx import Document
+from pptx import Presentation
 def get_questions(file_path, level):
     df = pd.read_json(file_path, lines=True)
     for para in doc.paragraphs:
         text.append(para.text)
+    return "\n".join(text)
+def read_pptx(file_path):  # Return the text of the presentation at file_path as a single string.
+    prs = Presentation(file_path)  # Presentation is the name imported from pptx
+    text = []  # one joined string per slide, in prs.slides iteration order
+    for slide in prs.slides:
+        slide_text = []  # text of each shape found on the current slide
+        for shape in slide.shapes:
+            if hasattr(shape, "text"):  # skip shapes that expose no `text` attribute
+                slide_text.append(shape.text)
+        text.append("\n".join(slide_text))  # shapes within a slide are separated by one newline
+    return "\n\n".join(text)  # slides are separated by a blank line