From 0073f43af8dbffa1013f4567784c9f034a21d145 Mon Sep 17 00:00:00 2001 From: elia <146715005+informaticker@users.noreply.github.com> Date: Thu, 3 Oct 2024 16:26:09 +0200 Subject: [PATCH] Update README.md --- README.md | 44 +------------------------------------------- 1 file changed, 1 insertion(+), 43 deletions(-) diff --git a/README.md b/README.md index 325f5d7..2c2e345 100644 --- a/README.md +++ b/README.md @@ -1,43 +1 @@ -# [vLLM](https://github.com/vllm-project/vllm) demo app for Fly.io - - -First deploy with: -``` -fly launch -``` - -from there update by running: `fly deploy` - -Once deploy, interact with the API at https://$APPNAME.fly.dev/ - - -``` -❯ curl https://vllm-demo.fly.dev/v1/completions \ - -H "Content-Type: application/json" \ - -d '{ - "model": "facebook/opt-125m", - "prompt": "San Francisco is a", - "max_tokens": 7, - "temperature": 0 - }' -s |jq . -{ - "id": "cmpl-b4b03ec33d794a50ba5cf2801d807025", - "object": "text_completion", - "created": 1716250075, - "model": "facebook/opt-125m", - "choices": [ - { - "index": 0, - "text": " great place to live. I", - "logprobs": null, - "finish_reason": "length", - "stop_reason": null - } - ], - "usage": { - "prompt_tokens": 5, - "total_tokens": 12, - "completion_tokens": 7 - } -} -``` +schmerzen