zayanomar5 committed on
Commit
7c86bd0
·
verified ·
1 Parent(s): 93885cf

Update main.py

Browse files
Files changed (1) hide show
  1. main.py +8 -9
main.py CHANGED
@@ -12,40 +12,39 @@ n_gpu_layers = 0
12
  n_batch = 1024
13
 
14
  llm = LlamaCpp(
15
- model_path="Phi-3-mini-4k-instruct-q4.gguf",
16
  temperature=0.1,
17
  n_gpu_layers=n_gpu_layers,
18
  n_batch=n_batch,
19
  verbose=True,
20
  n_ctx=4096
21
  )
 
22
 
23
- # Initializing sentence transformer model
24
  model = SentenceTransformer('sentence-transformers/paraphrase-TinyBERT-L6-v2')
25
 
26
  file_size = os.stat('Phi-3-mini-4k-instruct-q4.gguf')
27
- print("Model size: ", file_size.st_size, "bytes")
28
 
29
 
30
  @app.route('/cv', methods=['POST'])
31
  def get_skills():
32
  cv_body = request.json.get('cv_body')
33
 
 
34
  output = llm(
35
- f"\n{cv_body}\nCan you list the skills mentioned in the CV?",
36
- max_tokens=256,
37
- stop=[""],
38
- echo=True,
39
  )
40
 
41
  return jsonify({'skills': output})
42
 
43
-
44
  @app.get('/')
45
  def health():
46
  return jsonify({'status': 'Worked'})
47
 
48
-
49
  @app.route('/compare', methods=['POST'])
50
  def compare():
51
  employee_skills = request.json.get('employee_skills')
 
12
  n_batch = 1024
13
 
14
  llm = LlamaCpp(
15
+ model_path="Phi-3-mini-4k-instruct-q4.gguf", # path to GGUF file
16
  temperature=0.1,
17
  n_gpu_layers=n_gpu_layers,
18
  n_batch=n_batch,
19
  verbose=True,
20
  n_ctx=4096
21
  )
22
+ model0 = AutoModel.from_pretrained('sentence-transformers/paraphrase-TinyBERT-L6-v2')
23
 
 
24
  model = SentenceTransformer('sentence-transformers/paraphrase-TinyBERT-L6-v2')
25
 
26
  file_size = os.stat('Phi-3-mini-4k-instruct-q4.gguf')
27
+ print("model size ====> :", file_size.st_size, "bytes")
28
 
29
 
30
  @app.route('/cv', methods=['POST'])
31
  def get_skills():
32
  cv_body = request.json.get('cv_body')
33
 
34
+ # Simple inference example
35
  output = llm(
36
+ f"<|user|>\n{cv_body}<|end|>\n<|assistant|>Can you list the skills mentioned in the CV?<|end|>",
37
+ max_tokens=256, # Generate up to 256 tokens
38
+ stop=["<|end|>"],
39
+ echo=True, # Whether to echo the prompt
40
  )
41
 
42
  return jsonify({'skills': output})
43
 
 
44
  @app.get('/')
45
  def health():
46
  return jsonify({'status': 'Worked'})
47
 
 
48
  @app.route('/compare', methods=['POST'])
49
  def compare():
50
  employee_skills = request.json.get('employee_skills')