mirror of
https://github.com/informaticker/vllm-fly.git
synced 2024-11-22 01:31:58 +01:00
initial commit
This commit is contained in:
commit
0066470e85
25
fly.toml
Normal file
25
fly.toml
Normal file
@ -0,0 +1,25 @@
|
|||||||
|
# Fly.io app configuration for a vLLM deployment on a GPU machine.

app = "vllm-demo"
primary_region = "ord"

# Run /start.sh as the container entrypoint instead of the image's own.
# The script itself is injected by the [[files]] section at the bottom.
[experimental]
entrypoint = "/start.sh"

# Deploy a prebuilt image (pinned tag) rather than building from a Dockerfile.
[build]
image = "vllm/vllm-openai:v0.4.2"

# Mount the "models" volume at the Hugging Face cache path.
# NOTE(review): presumably this keeps downloaded model weights across
# restarts -- confirm against what start.sh actually downloads.
[[mounts]]
source = "models"
destination = "/root/.cache/huggingface"

# NOTE(review): internal_port must match the port the server launched by
# start.sh listens on -- start.sh is not visible here, so verify.
[http_service]
internal_port = 8000
force_https = true

# One L40S GPU machine.
[[vm]]
size = "l40s"
gpus = 1

# Copy the local start.sh into the machine at /start.sh (used as the
# entrypoint above).
[[files]]
guest_path = "/start.sh"
local_path = "start.sh"
|
||||||
|
|
Loading…
Reference in New Issue
Block a user