Update app.py
Browse files
app.py
CHANGED
@@ -1,4 +1,13 @@
|
|
1 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
2 |
import argparse
|
3 |
import time
|
4 |
|
|
|
1 |
+
git clone https://huggingface.co/microsoft/Phi-3-mini-4k-instruct-onnx
|
2 |
+
git clone https://huggingface.co/microsoft/Phi-3-mini-128k-instruct-onnx
|
3 |
+
pip install numpy
|
4 |
+
pip install --pre onnxruntime-genai-directml
|
5 |
+
pip install numpy
|
6 |
+
pip install --pre onnxruntime-genai-cuda --index-url=https://aiinfra.pkgs.visualstudio.com/PublicPackages/_packaging/onnxruntime-genai/pypi/simple/
|
7 |
+
curl https://raw.githubusercontent.com/microsoft/onnxruntime-genai/main/examples/python/model-qa.py -o model-qa.py
|
8 |
+
python model-qa.py -m Phi-3-mini-128k-instruct-onnx/directml/directml-int4-awq-block-128 -l 2048
|
9 |
+
|
10 |
+
import onnxruntime_genai as og
|
11 |
import argparse
|
12 |
import time
|
13 |
|