resume-roaster

Running

App Files Files Community

resume-roaster / tools /resumescraper.py

Kuberwastaken

Made it look better :)

f7933a5 about 1 month ago

raw

history blame contribute delete

2.22 kB

	from smolagents.tools import Tool

	class ResumeScraperTool(Tool):
	name = "resume_scraper"
	description = (
	"Parses a resume (in plain text) to extract key sections such as Summary, "
	"Experience, Education, and Skills. This tool expects the resume text to include "
	"section headers like 'Summary:', 'Experience:', 'Education:', and 'Skills:'."
	)
	inputs = {
	"resume_text": {
	"type": "string",
	"description": "The plain text of the resume"
	}
	}
	output_type = "object"

	def forward(self, resume_text: str) -> dict:
	# Basic extraction using simple markers; in a real-world case, you might want to use NLP.
	sections = {
	"summary": "Summary not found",
	"experience": "Experience not found",
	"education": "Education not found",
	"skills": "Skills not found"
	}
	lower_text = resume_text.lower()

	if "summary:" in lower_text:
	start = lower_text.index("summary:")
	# Assume the section ends at the next double newline or end of text
	end = lower_text.find("\n\n", start)
	sections["summary"] = resume_text[start + len("summary:"): end].strip() if end != -1 else resume_text[start + len("summary:"):].strip()

	if "experience:" in lower_text:
	start = lower_text.index("experience:")
	end = lower_text.find("\n\n", start)
	sections["experience"] = resume_text[start + len("experience:"): end].strip() if end != -1 else resume_text[start + len("experience:"):].strip()

	if "education:" in lower_text:
	start = lower_text.index("education:")
	end = lower_text.find("\n\n", start)
	sections["education"] = resume_text[start + len("education:"): end].strip() if end != -1 else resume_text[start + len("education:"):].strip()

	if "skills:" in lower_text:
	start = lower_text.index("skills:")
	end = lower_text.find("\n\n", start)
	sections["skills"] = resume_text[start + len("skills:"): end].strip() if end != -1 else resume_text[start + len("skills:"):].strip()

	return sections