Spaces:

ShubhamD95
/

Gemma

Sleeping

App Files Files Community

ShubhamD95 committed on Jun 6

Commit

6e31e76

verified ·

1 Parent(s): 286e0a1

Update app.py

Browse files

Files changed (1) hide show

app.py +31 -37

app.py CHANGED Viewed

@@ -5,24 +5,22 @@ import os
 from huggingface_hub import login
 import spacy
-# ✅ Authenticate using HF token stored in secret
 login(token=os.environ.get("HUGGINGFACEHUB_API_TOKEN"))
-# ✅ Load summarization model (lightweight and CPU-friendly)
 summarizer = pipeline("text2text-generation", model="declare-lab/flan-alpaca-base")
-# ✅ Load SpaCy English model for NLP keyword extraction
 nlp = spacy.load("en_core_web_sm")
-# ✅ Extract keywords (nouns & proper nouns, excluding stopwords)
 def extract_relevant_keywords(text):
     doc = nlp(text.lower())
     return set(
-        token.text for token in doc
         if token.pos_ in {"NOUN", "PROPN"} and not token.is_stop and len(token.text) > 2
     )
-# ✅ Match resume keywords with job description
 def compare_keywords(resume_text, job_desc):
     resume_words = extract_relevant_keywords(resume_text)
     job_words = extract_relevant_keywords(job_desc)
@@ -30,46 +28,45 @@ def compare_keywords(resume_text, job_desc):
     missing = job_words - resume_words
     return matched, missing
-# ✅ Highlight matched keywords in resume text
 def highlight_keywords(resume_text, matched):
     highlighted = resume_text
     for word in sorted(matched, key=len, reverse=True):
         highlighted = re.sub(rf"\b({re.escape(word)})\b", r"**\1**", highlighted, flags=re.IGNORECASE)
     return highlighted
-# ✅ Use LLM to extract contextually missing skills/tools
 def extract_missing_keywords_with_llm(job_desc, resume_text):
     prompt = f"""
 Given the following job description and resume, list the important skills, tools, and concepts from the job description that are missing or weakly represented in the resume.
 Job Description:
 {job_desc}
 Resume:
 {resume_text}
-Only list the missing keywords as bullet points.
 """
-    result = summarizer(prompt, max_new_tokens=300, do_sample=True)[0]
-    return result.get('generated_text', str(result)).strip()
-# ✅ Build LLM prompt to extract resume sections + insights
 def build_dynamic_prompt(job_desc, resume_text, analyze_with_jd):
     prompt = f"""
-You are a professional resume analyst.
-Classify the content of the resume below into logical sections such as:
-- Education
-- Work Experience
 - Technical Skills
 - Soft Skills
 - Certifications
-- Projects
-- Achievements
-Use markdown format with headers (###) for each section.
-If a job description is also provided, add relevant suggestions under each section to improve alignment with the job.
 Job Description:
 {job_desc if analyze_with_jd else '[None provided]'}
@@ -77,29 +74,27 @@ Job Description:
 Resume:
 {resume_text}
-Return your output in structured markdown format.
 """
     return prompt
-# ✅ Generate structured LLM output + keyword analysis
 def analyze_resume(job_desc, resume_text, analyze_with_jd):
     if not resume_text.strip():
         return "⚠️ Please paste your resume text."
-    prompt = build_dynamic_prompt(job_desc, resume_text, analyze_with_jd)
     try:
-        llm_result = summarizer(prompt, max_new_tokens=512, do_sample=True)[0]
-        structured_response = llm_result.get('generated_text', str(llm_result)).strip()
-        # Perform keyword comparison and highlighting
         if analyze_with_jd and job_desc:
             matched, missing = compare_keywords(resume_text, job_desc)
             highlighted_resume = highlight_keywords(resume_text, matched)
             llm_missing_keywords = extract_missing_keywords_with_llm(job_desc, resume_text)
-            return f"""
-### 🔍 Resume with Highlighted Matches
 {highlighted_resume}
@@ -116,14 +111,12 @@ def analyze_resume(job_desc, resume_text, analyze_with_jd):
 ---
-{structured_response}
-"""
-        return structured_response
     except Exception as e:
         return f"❌ Error: {str(e)}"
-# ✅ Gradio UI
 def create_ui():
     with gr.Blocks() as demo:
         with gr.Row():
@@ -141,3 +134,4 @@ def create_ui():
 if __name__ == '__main__':
     create_ui().launch()

 from huggingface_hub import login
 import spacy
+# Authenticate with Hugging Face token
 login(token=os.environ.get("HUGGINGFACEHUB_API_TOKEN"))
+# Load models
 summarizer = pipeline("text2text-generation", model="declare-lab/flan-alpaca-base")
 nlp = spacy.load("en_core_web_sm")
+# Extract contextually relevant keywords using spaCy
 def extract_relevant_keywords(text):
     doc = nlp(text.lower())
     return set(
+        token.lemma_ for token in doc
         if token.pos_ in {"NOUN", "PROPN"} and not token.is_stop and len(token.text) > 2
     )
+# Compare resume and JD for keyword matches
 def compare_keywords(resume_text, job_desc):
     resume_words = extract_relevant_keywords(resume_text)
     job_words = extract_relevant_keywords(job_desc)
     missing = job_words - resume_words
     return matched, missing
+# Highlight matched words in resume text
 def highlight_keywords(resume_text, matched):
     highlighted = resume_text
     for word in sorted(matched, key=len, reverse=True):
         highlighted = re.sub(rf"\b({re.escape(word)})\b", r"**\1**", highlighted, flags=re.IGNORECASE)
     return highlighted
+# LLM-based keyword extraction from JD
 def extract_missing_keywords_with_llm(job_desc, resume_text):
     prompt = f"""
 Given the following job description and resume, list the important skills, tools, and concepts from the job description that are missing or weakly represented in the resume.
+Only list the missing keywords as bullet points.
 Job Description:
 {job_desc}
 Resume:
 {resume_text}
 """
+    result = summarizer(prompt, max_new_tokens=300, do_sample=False)[0]
+    raw_text = result.get('generated_text', result.get('summary_text', str(result))).strip()
+    # Clean and deduplicate
+    lines = re.findall(r"-\s*(.+)", raw_text)
+    cleaned = list({kw.strip().lower() for kw in lines if len(kw.strip()) > 2})
+    return ', '.join(sorted(cleaned)) or "None"
+# Prompt builder for structured LLM resume analysis
 def build_dynamic_prompt(job_desc, resume_text, analyze_with_jd):
     prompt = f"""
+Act as a resume evaluator. Break the following resume into meaningful sections such as:
 - Technical Skills
 - Soft Skills
+- Education
+- Experience
 - Certifications
+- Projects (if present)
+Then, if a job description is provided, highlight what improvements are needed in each section to better align with the job role.
 Job Description:
 {job_desc if analyze_with_jd else '[None provided]'}
 Resume:
 {resume_text}
+Output your response in markdown format with section headings.
 """
     return prompt
+# Core analysis function
 def analyze_resume(job_desc, resume_text, analyze_with_jd):
     if not resume_text.strip():
         return "⚠️ Please paste your resume text."
+    user_prompt = build_dynamic_prompt(job_desc, resume_text, analyze_with_jd)
     try:
+        result = summarizer(user_prompt, max_new_tokens=512, do_sample=False)[0]
+        response_text = result.get('generated_text', result.get('summary_text', str(result))).strip()
         if analyze_with_jd and job_desc:
             matched, missing = compare_keywords(resume_text, job_desc)
             highlighted_resume = highlight_keywords(resume_text, matched)
             llm_missing_keywords = extract_missing_keywords_with_llm(job_desc, resume_text)
+            return f"""### 🔍 Resume with Highlighted Matches
 {highlighted_resume}
 ---
+{response_text}"""
+        return response_text
     except Exception as e:
         return f"❌ Error: {str(e)}"
+# Gradio interface
 def create_ui():
     with gr.Blocks() as demo:
         with gr.Row():
 if __name__ == '__main__':
     create_ui().launch()