# Build/run configuration. The keys used here (build, run, predict) follow the
# layout of a Cog `cog.yaml` file -- NOTE(review): confirm the consuming tool.
build:
  # Build an image with GPU support.
  gpu: true
  # Versions are quoted so they stay strings ("3.10" would otherwise parse as
  # the float 3.1).
  cuda: "11.7"
  python_version: "3.10"
  # Python dependencies are read from this file.
  python_requirements: requirements.txt

  # Extra shell commands executed as part of the build, in order.
  run:
    # Python packages pinned to exact versions.
    - pip install flash-attn==0.2.8
    - pip install triton==2.0.0.dev20221202
    - pip install tensorizer==1.1.0
    # Register the Google Cloud apt repository. The folded scalar (>-) joins
    # the lines below with single spaces into one command.
    - >-
      echo 'deb [signed-by=/usr/share/keyrings/cloud.google.gpg]
      https://packages.cloud.google.com/apt cloud-sdk main'
      | tee -a /etc/apt/sources.list.d/google-cloud-sdk.list
    # Add the repository signing key to the keyring referenced by signed-by.
    - >-
      curl https://packages.cloud.google.com/apt/doc/apt-key.gpg
      | apt-key --keyring /usr/share/keyrings/cloud.google.gpg add -
    # -y keeps the install from stopping at a confirmation prompt, since the
    # build has no interactive terminal to answer it.
    - apt-get update && apt-get install -y google-cloud-cli

# Entry point, written as "<file>:<class>".
predict: "predict.py:Predictor"