initial commit

This commit is contained in:
Daniel Graña 2024-05-20 21:28:10 -03:00
commit 0066470e85
2 changed files with 29 additions and 0 deletions

25
fly.toml Normal file
View File

@@ -0,0 +1,25 @@
# Fly.io app configuration for the vLLM demo.
app = "vllm-demo"
primary_region = "ord"

# Run the stock vLLM OpenAI server image, pinned to a fixed tag.
[build]
image = "vllm/vllm-openai:v0.4.2"

# Start the container through /start.sh; that path is populated by the
# [[files]] entry below.
[experimental]
entrypoint = "/start.sh"

# Copy the local start.sh into the guest at /start.sh.
[[files]]
local_path = "start.sh"
guest_path = "/start.sh"

# Mount the "models" volume over the Hugging Face cache directory.
# NOTE(review): presumably so downloaded model files survive restarts — confirm.
[[mounts]]
source = "models"
destination = "/root/.cache/huggingface"

# start.sh passes no port flag to the server, so 8000 is assumed to be the
# server's default listening port — TODO confirm.
[http_service]
internal_port = 8000
force_https = true

# One GPU on the "l40s" machine size.
[[vm]]
size = "l40s"
gpus = 1

4
start.sh Normal file
View File

@@ -0,0 +1,4 @@
#!/bin/sh
# Container entrypoint: refresh the dynamic linker cache, then hand the
# process over to the vLLM OpenAI API server module.

# Abort on the first failing command.
set -e
# Echo each command before it runs.
set -x

# Rebuild the shared-library cache.
# NOTE(review): presumably needed so libraries made available at boot
# (e.g. GPU driver libs) can be found — confirm.
ldconfig

# Replace this shell with the server process so the server receives signals
# directly; no arguments are passed, so the server runs with its defaults.
exec python3 -m vllm.entrypoints.openai.api_server