mirror of
https://github.com/informaticker/vllm-fly.git
synced 2024-11-22 01:31:58 +01:00
initial commit
This commit is contained in:
commit
0066470e85
25
fly.toml
Normal file
25
fly.toml
Normal file
@ -0,0 +1,25 @@
|
||||
# Fly.io app configuration (fly.toml) for the "vllm-demo" app.
app = "vllm-demo"
primary_region = "ord"

# Overrides the image's entrypoint with /start.sh, the same path the
# [[files]] entry at the bottom of this file uses as its guest_path.
[experimental]
entrypoint = "/start.sh"

# Runs a prebuilt image rather than building one; the tag is pinned.
[build]
image = "vllm/vllm-openai:v0.4.2"

# Mounts the volume named "models" over the Hugging Face cache directory.
# NOTE(review): presumably so downloaded model weights persist across
# restarts; confirm the volume exists in the primary region.
[[mounts]]
source = "models"
destination = "/root/.cache/huggingface"

# NOTE(review): internal_port must match the port the server started by
# /start.sh listens on; verify against that script.
[http_service]
internal_port = 8000
force_https = true

# One GPU on the "l40s" machine size.
[[vm]]
size = "l40s"
gpus = 1

# Places the repository's start.sh at /start.sh inside the machine.
[[files]]
guest_path = "/start.sh"
local_path = "start.sh"
|
||||
|
Loading…
Reference in New Issue
Block a user