diff --git a/vllm/inference.py b/vllm/inference.py index 28fa0ea..8cecec2 100644 --- a/vllm/inference.py +++ b/vllm/inference.py @@ -11,7 +11,7 @@ @function( image=Image().add_python_packages(["vllm"]), volumes=[vllm_cache], - gpu="A10G", + gpu="A100-40", memory="8Gi", cpu=1, ) diff --git a/vllm/yicoder.py b/vllm/yicoder.py index 1b7328a..b7d1e9c 100644 --- a/vllm/yicoder.py +++ b/vllm/yicoder.py @@ -25,7 +25,7 @@ @asgi( image=Image().add_python_packages(["vllm"]), volumes=[vllm_cache], - gpu="A10G", + gpu="A100-40", memory="8Gi", cpu=1, keep_warm_seconds=360,