Spaces:
Sleeping
Sleeping
Update main.py
Browse files
main.py
CHANGED
@@ -12,40 +12,39 @@ n_gpu_layers = 0
|
|
12 |
n_batch = 1024
|
13 |
|
14 |
llm = LlamaCpp(
|
15 |
-
model_path="Phi-3-mini-4k-instruct-q4.gguf",
|
16 |
temperature=0.1,
|
17 |
n_gpu_layers=n_gpu_layers,
|
18 |
n_batch=n_batch,
|
19 |
verbose=True,
|
20 |
n_ctx=4096
|
21 |
)
|
|
|
22 |
|
23 |
-
# Initializing sentence transformer model
|
24 |
model = SentenceTransformer('sentence-transformers/paraphrase-TinyBERT-L6-v2')
|
25 |
|
26 |
file_size = os.stat('Phi-3-mini-4k-instruct-q4.gguf')
|
27 |
-
print("
|
28 |
|
29 |
|
30 |
@app.route('/cv', methods=['POST'])
|
31 |
def get_skills():
|
32 |
cv_body = request.json.get('cv_body')
|
33 |
|
|
|
34 |
output = llm(
|
35 |
-
f"
|
36 |
-
max_tokens=256,
|
37 |
-
stop=[""],
|
38 |
-
echo=True,
|
39 |
)
|
40 |
|
41 |
return jsonify({'skills': output})
|
42 |
|
43 |
-
|
44 |
@app.get('/')
|
45 |
def health():
|
46 |
return jsonify({'status': 'Worked'})
|
47 |
|
48 |
-
|
49 |
@app.route('/compare', methods=['POST'])
|
50 |
def compare():
|
51 |
employee_skills = request.json.get('employee_skills')
|
|
|
12 |
n_batch = 1024
|
13 |
|
14 |
llm = LlamaCpp(
|
15 |
+
model_path="Phi-3-mini-4k-instruct-q4.gguf", # path to GGUF file
|
16 |
temperature=0.1,
|
17 |
n_gpu_layers=n_gpu_layers,
|
18 |
n_batch=n_batch,
|
19 |
verbose=True,
|
20 |
n_ctx=4096
|
21 |
)
|
22 |
+
model0 = AutoModel.from_pretrained('sentence-transformers/paraphrase-TinyBERT-L6-v2')
|
23 |
|
|
|
24 |
model = SentenceTransformer('sentence-transformers/paraphrase-TinyBERT-L6-v2')
|
25 |
|
26 |
file_size = os.stat('Phi-3-mini-4k-instruct-q4.gguf')
|
27 |
+
print("model size ====> :", file_size.st_size, "bytes")
|
28 |
|
29 |
|
30 |
@app.route('/cv', methods=['POST'])
|
31 |
def get_skills():
|
32 |
cv_body = request.json.get('cv_body')
|
33 |
|
34 |
+
# Simple inference example
|
35 |
output = llm(
|
36 |
+
f"<|user|>\n{cv_body}<|end|>\n<|assistant|>Can you list the skills mentioned in the CV?<|end|>",
|
37 |
+
max_tokens=256, # Generate up to 256 tokens
|
38 |
+
stop=["<|end|>"],
|
39 |
+
echo=True, # Whether to echo the prompt
|
40 |
)
|
41 |
|
42 |
return jsonify({'skills': output})
|
43 |
|
|
|
44 |
@app.get('/')
|
45 |
def health():
|
46 |
return jsonify({'status': 'Worked'})
|
47 |
|
|
|
48 |
@app.route('/compare', methods=['POST'])
|
49 |
def compare():
|
50 |
employee_skills = request.json.get('employee_skills')
|