Spaces:
Sleeping
Sleeping
import gradio as gr | |
import pdfplumber | |
import spacy | |
from spacy.cli import download | |
from sentence_transformers import SentenceTransformer, util | |
# Function to load the spaCy model, downloading it if necessary | |
def load_spacy_model(): | |
try: | |
nlp = spacy.load('en_core_web_md') | |
except OSError: | |
download('en_core_web_md') # Download the model if it is not found | |
nlp = spacy.load('en_core_web_md') # Load the model after downloading | |
return nlp | |
# Load spaCy model and Sentence Transformer model | |
nlp = load_spacy_model() | |
model = SentenceTransformer('all-MiniLM-L6-v2') | |
def extract_text_from_pdf(pdf_path): | |
text = '' | |
with pdfplumber.open(pdf_path) as pdf: | |
for page in pdf.pages: | |
text += page.extract_text() + "\n" # Add newline for better formatting | |
return text | |
def extract_text_from_txt(txt_path): | |
with open(txt_path, 'r') as file: | |
return file.read() | |
def analyze_resume(resume_file, job_description_file): | |
# Extract text from the PDF resume | |
resume_text = extract_text_from_pdf(resume_file.name) | |
# Extract text from the job description text file | |
job_description = extract_text_from_txt(job_description_file.name) | |
# Process the text with spaCy | |
doc = nlp(resume_text) | |
# Extract named entities from the resume | |
entities = [(ent.text, ent.label_) for ent in doc.ents] | |
# Get embeddings and compute similarity | |
resume_embedding = model.encode(resume_text) | |
job_description_embedding = model.encode(job_description) | |
# Calculate similarity and convert to percentage | |
similarity = util.pytorch_cos_sim(resume_embedding, job_description_embedding).item() * 100 | |
similarity = round(similarity, 2) # Round to two decimal places | |
return entities, f"{similarity}%", job_description | |
# Create a Gradio interface | |
iface = gr.Interface( | |
fn=analyze_resume, | |
inputs=[ | |
gr.File(label="Upload Resume (PDF)"), | |
gr.File(label="Upload Job Description (TXT)") | |
], | |
outputs=[ | |
gr.JSON(label="Extracted Entities"), | |
gr.Textbox(label="Resume and Job Description Similarity"), | |
gr.Textbox(label="Job Description Text", interactive=False) | |
], | |
title="Resume and Job Description Analyzer", | |
description="Upload your PDF resume and a TXT job description to extract entities and calculate similarity." | |
) | |
# Launch the interface | |
iface.launch() | |