Spaces:

Manojajj
/

dbmdz-bert-large-cased-finetuned

Sleeping

App Files Community

Manojajj committed on Nov 19, 2024

Commit

2543fdd

verified ·

1 Parent(s): 4df6b19

Update app.py

Browse files

Files changed (1) hide show

app.py +5 -24

app.py CHANGED Viewed

@@ -17,7 +17,7 @@ def extract_text_from_pdf(pdf_file):
     return text
 def parse_resume(resume_text):
-    """Parse the resume and extract details like name, email, phone, skills, etc."""
     # Define regex for phone and email extraction
     phone_pattern = r'\(?\d{3}\)?[-.\s]?\d{3}[-.\s]?\d{4}'
     email_pattern = r'[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\.[a-zA-Z]{2,}'
@@ -26,34 +26,15 @@ def parse_resume(resume_text):
     phone = re.findall(phone_pattern, resume_text)
     email = re.findall(email_pattern, resume_text)
-    # Extract named entities (e.g., skills, education, and experience)
     entities = nlp(resume_text)
-    # For simplicity, we just list out the entities here
-    skills = []
-    experience = []
-    education = []
-    certifications = []
-    # Iterate through recognized entities and categorize them
-    for entity in entities:
-        if 'ORG' in entity['entity']:
-            experience.append(entity['word'])
-        elif 'MISC' in entity['entity']:
-            skills.append(entity['word'])
-        elif 'LOC' in entity['entity']:
-            education.append(entity['word'])
-        else:
-            certifications.append(entity['word'])
-    # Create a dictionary of parsed data
     parsed_data = {
         "Phone": phone[0] if phone else "Not found",
         "Email": email[0] if email else "Not found",
         "Skills": ", ".join(skills),
-        "Experience": ", ".join(experience),
-        "Education": ", ".join(education),
-        "Certifications": ", ".join(certifications)
     }
     return parsed_data
@@ -83,5 +64,5 @@ gr.Interface(
     inputs=gr.File(file_count="multiple", label="Upload Resumes (PDFs)"),
     outputs=gr.File(label="Download Parsed Data (Excel)"),
     title="AI Resume Parser",
-    description="Upload multiple resumes (PDFs) to extract details like Name, Email, Phone, Skills, Experience, Education, and Certifications. The results will be saved in an Excel file."
 ).launch()

     return text
 def parse_resume(resume_text):
+    """Parse the resume and extract details like name, email, phone, and skills."""
     # Define regex for phone and email extraction
     phone_pattern = r'\(?\d{3}\)?[-.\s]?\d{3}[-.\s]?\d{4}'
     email_pattern = r'[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\.[a-zA-Z]{2,}'
     phone = re.findall(phone_pattern, resume_text)
     email = re.findall(email_pattern, resume_text)
+    # Extract named entities for skills
     entities = nlp(resume_text)
+    skills = [entity['word'] for entity in entities if 'MISC' in entity['entity']]
+    # Create a dictionary of parsed data (exclude Experience, Education, Certifications)
     parsed_data = {
         "Phone": phone[0] if phone else "Not found",
         "Email": email[0] if email else "Not found",
         "Skills": ", ".join(skills),
     }
     return parsed_data
     inputs=gr.File(file_count="multiple", label="Upload Resumes (PDFs)"),
     outputs=gr.File(label="Download Parsed Data (Excel)"),
     title="AI Resume Parser",
+    description="Upload multiple resumes (PDFs) to extract details like Name, Email, Phone, and Skills. The results will be saved in an Excel file."
 ).launch()