Ahmed007 committed on
Commit
ce69476
·
verified ·
1 Parent(s): 7ec63cb

Update main.py

Browse files
Files changed (1) hide show
  1. main.py +5 -4
main.py CHANGED
@@ -1,7 +1,6 @@
1
  from flask import Flask, request, jsonify
2
  from langchain_community.llms import LlamaCpp
3
-
4
-
5
  app = Flask(__name__)
6
 
7
  n_gpu_layers = 0
@@ -13,9 +12,11 @@ llm = LlamaCpp(
13
  temperature=0.1,
14
  n_gpu_layers=n_gpu_layers,
15
  n_batch=n_batch,
16
- verbose=True,
17
- n_ctx=2048
18
  )
 
 
 
19
 
20
  @app.route('/', methods=['POST'])
21
  def get_skills():
 
1
  from flask import Flask, request, jsonify
2
  from langchain_community.llms import LlamaCpp
3
+ import os
 
4
  app = Flask(__name__)
5
 
6
  n_gpu_layers = 0
 
12
  temperature=0.1,
13
  n_gpu_layers=n_gpu_layers,
14
  n_batch=n_batch,
15
+ n_ctx=4096
 
16
  )
17
+ file_size = os.stat('Phi-3-mini-4k-instruct-q4.gguf')
18
+ print("model size ====> :", file_size.st_size, "bytes")
19
+
20
 
21
  @app.route('/', methods=['POST'])
22
  def get_skills():