Spaces:

cdcvd
/

Evalution_resume

Running

App Files Files Community

cdcvd committed on Sep 1

Commit

24f2b6a

•

1 Parent(s): 38d6941

Update models.py

Browse files

Files changed (1) hide show

models.py +57 -0

models.py CHANGED Viewed

@@ -84,6 +84,63 @@ def evaluate_with_gemma(pdf_file, job_description):
     outputs = gemma_pipe(prompt, max_new_tokens=256)
     return outputs[0]["generated_text"].strip()
 def evaluate_with_bloom(pdf_file, job_description):
     resume_text = extract_text_from_pdf(pdf_file)

     outputs = gemma_pipe(prompt, max_new_tokens=256)
     return outputs[0]["generated_text"].strip()
+from transformers import AutoModelForCausalLM, AutoTokenizer
+import torch
+def evaluate_with_qwen(resume_text, job_description):
+    # بارگذاری مدل و توکنایزر
+    model = AutoModelForCausalLM.from_pretrained(
+        "Qwen/Qwen2-72B-Instruct",
+        torch_dtype="auto",
+        device_map="auto"
+    ).to("cuda" if torch.cuda.is_available() else "cpu")
+    tokenizer = AutoTokenizer.from_pretrained("Qwen/Qwen2-72B-Instruct")
+    # تعریف پرامپت
+    prompt = f"""
+    من یک مسءول استخدام هستم و میخوام درصد تطابق رزومه فرد با شرح شغلی را
+    برای من محاسبه کنی لطفا درصد تطابق بین رزومه و شرح شغلی را بدست بیار. لطفا دقیق این درصد را محاسبه کن.
+    میخوام خودت به عنوان یک مدل زبانی درصد تطابق را برای من محاسبه کنی.
+    شرح شغل: {job_description}
+    رزومه: {resume_text}
+    """
+    # آماده‌سازی پیام برای مدل
+    messages = [
+        {"role": "system", "content": "You are a helpful assistant."},
+        {"role": "user", "content": prompt}
+    ]
+    text = tokenizer.apply_chat_template(
+        messages,
+        tokenize=False,
+        add_generation_prompt=True
+    )
+    model_inputs = tokenizer([text], return_tensors="pt").to("cuda" if torch.cuda.is_available() else "cpu")
+    # تولید پاسخ
+    generated_ids = model.generate(
+        model_inputs.input_ids,
+        max_new_tokens=512
+    )
+    # حذف توکن‌های ورودی از پاسخ تولید شده
+    generated_ids = [
+        output_ids[len(input_ids):] for input_ids, output_ids in zip(model_inputs.input_ids, generated_ids)
+    ]
+    # تبدیل پاسخ به متن
+    response = tokenizer.batch_decode(generated_ids, skip_special_tokens=True)[0]
+    return response
 def evaluate_with_bloom(pdf_file, job_description):
     resume_text = extract_text_from_pdf(pdf_file)