Resume-EndPoint

Sleeping

Alexvatti committed on Apr 24

Commit

e0e3a7b

verified ·

1 Parent(s): cb07a78

Update main.py

Files changed (1) hide show

main.py CHANGED Viewed

@@ -64,6 +64,15 @@ async def save_file(file: UploadFile) -> str:
         await out_file.write(content)
     return file_path
 # ✅ Extract text from PDF using PyPDF2
 def extract_text_from_pdf(pdf_path: str) -> str:
     text = ""
@@ -86,11 +95,16 @@ async def parse_resume(file: UploadFile = File(...)):
         print(f"✅ File saved at {path}")
         print("📄 Extracting text...")
-        text = extract_text_from_pdf(path)
-        print("✅ Text extracted.")
-        json_result = parse_resume_text(text)
-        print("✅ JSON Created.")
         os.remove(path)
         print("🧹 File removed.")

         await out_file.write(content)
     return file_path
+# ✅ Extract text from DOCX
+def extract_text_from_docx(docx_path: str) -> str:
+    try:
+        doc = Document(docx_path)
+        text = "\n".join([para.text for para in doc.paragraphs])
+        return text.strip()
+    except Exception as e:
+        return f"Error extracting text from DOCX: {str(e)}"
 # ✅ Extract text from PDF using PyPDF2
 def extract_text_from_pdf(pdf_path: str) -> str:
     text = ""
         print(f"✅ File saved at {path}")
         print("📄 Extracting text...")
+        ext = os.path.splitext(path)[-1].lower()
+        if ext == ".pdf":
+            text = extract_text_from_pdf(path)
+        elif ext in [".docx", ".doc"]:
+            text = extract_text_from_docx(path)
+        else:
+            os.remove(path)
+            return JSONResponse(status_code=400, content={"error": "Unsupported file type"})
+        print("✅ Text extracted.")
         os.remove(path)
         print("🧹 File removed.")