# cog.yaml
# Configuration for Cog ⚙️
# Reference: https://github.com/replicate/cog/blob/main/docs/yaml.md

# Everything that describes the image environment lives under `build`;
# the keys below must stay nested beneath it.
build:
  # set to true if your model requires a GPU
  gpu: true
  # CUDA version for the GPU image; quoted so it stays a string
  cuda: "11.7"

  # python version in the form '3.8' or '3.8.12'
  # (quoted so YAML does not read it as a float)
  python_version: "3.8"

  # a list of packages in the format <package-name>==<version>
  python_packages:
    - "numpy==1.24.2"
    - "torch==2.0.0"
    - "accelerate==0.18.0"
    - "peft==0.2.0"
    - "sentencepiece==0.1.97"
    - "tensorizer==1.0.1"
    - "jinja2==3.1.2"
    - "deepspeed==0.8.3"

  # shell commands run, in order, while the image is being built
  run:
    # transformers is installed from git, pinned to an exact commit
    - "pip install git+https://github.com/huggingface/transformers.git@786092a35e18154cacad62c30fe92bac2c27a1e1"
    # download, unpack and install the Google Cloud CLI under /gc
    # (folded scalar: the lines below are joined with single spaces
    # into one command)
    - >-
      mkdir /gc && cd /gc &&
      curl -O https://dl.google.com/dl/cloudsdk/channels/rapid/downloads/google-cloud-cli-426.0.0-linux-x86_64.tar.gz &&
      tar -xf google-cloud-cli-426.0.0-linux-x86_64.tar.gz &&
      ./google-cloud-sdk/install.sh -q
    # NOTE(review): unlike the packages above, this install is unpinned,
    # so rebuilds may pick up a different version; consider pinning it
    - "pip install google-cloud-storage"

# predict.py defines how predictions are run on your model
predict: "predict.py:Predictor"
# train.py defines how training is run (the `train` object in train.py)
train: "train.py:train"