update vllm0.5.0

66dadd2d · zhuwenwen · cad75589 · 66dadd2d · 66dadd2d · 66dadd2d
Commit 66dadd2d authored Sep 29, 2024 by zhuwenwen
20 changed files
--- a/examples/offline_streaming_inference_chat_demo.py
+++ b/examples/offline_streaming_inference_chat_demo.py
--- a/examples/openai_chat_completion_client.py
+++ b/examples/openai_chat_completion_client.py
--- a/examples/openai_completion_client.py
+++ b/examples/openai_completion_client.py
--- a/examples/openai_embedding_client.py
+++ b/examples/openai_embedding_client.py
--- a/examples/openai_example_batch.jsonl
+++ b/examples/openai_example_batch.jsonl
+{"custom_id": "request-1", "method": "POST", "url": "/v1/chat/completions", "body": {"model": "meta-llama/Meta-Llama-3-8B-Instruct", "messages": [{"role": "system", "content": "You are a helpful assistant."},{"role": "user", "content": "Hello world!"}],"max_tokens": 1000}}
+{"custom_id": "request-2", "method": "POST", "url": "/v1/chat/completions", "body": {"model": "meta-llama/Meta-Llama-3-8B-Instruct", "messages": [{"role": "system", "content": "You are an unhelpful assistant."},{"role": "user", "content": "Hello world!"}],"max_tokens": 1000}}
--- a/examples/production_monitoring/README.md
+++ b/examples/production_monitoring/README.md
--- a/examples/production_monitoring/docker-compose.yaml
+++ b/examples/production_monitoring/docker-compose.yaml
--- a/examples/production_monitoring/grafana.json
+++ b/examples/production_monitoring/grafana.json
--- a/examples/production_monitoring/prometheus.yaml
+++ b/examples/production_monitoring/prometheus.yaml
+# prometheus.yaml
+global:
+  scrape_interval: 5s
+  evaluation_interval: 30s
+
+scrape_configs:
+  - job_name: vllm
+    static_configs:
+      - targets:
+          - 'host.docker.internal:8000'
--- a/examples/save_sharded_state.py
+++ b/examples/save_sharded_state.py
--- a/examples/template_alpaca.jinja
+++ b/examples/template_alpaca.jinja
--- a/examples/template_baichuan.jinja
+++ b/examples/template_baichuan.jinja
--- a/examples/template_chatglm.jinja
+++ b/examples/template_chatglm.jinja
--- a/examples/template_chatglm2.jinja
+++ b/examples/template_chatglm2.jinja
--- a/examples/template_chatml.jinja
+++ b/examples/template_chatml.jinja
--- a/examples/template_falcon.jinja
+++ b/examples/template_falcon.jinja
--- a/examples/template_falcon_180b.jinja
+++ b/examples/template_falcon_180b.jinja
--- a/examples/template_inkbot.jinja
+++ b/examples/template_inkbot.jinja
--- a/examples/template_llama_chat.jinja
+++ b/examples/template_llama_chat.jinja
--- a/examples/template_llava.jinja
+++ b/examples/template_llava.jinja