diff --git a/ChatQnA/docker/xeon/README.md b/ChatQnA/docker/xeon/README.md
index 8be8828a5..b6c1fe3a4 100644
--- a/ChatQnA/docker/xeon/README.md
+++ b/ChatQnA/docker/xeon/README.md
@@ -303,7 +303,7 @@ curl http://${host_ip}:9009/generate \
 
 ```bash
 # vLLM Service
-curl http://${your_ip}:9009/v1/completions \
+curl http://${host_ip}:9009/v1/completions \
   -H "Content-Type: application/json" \
   -d '{"model": "Intel/neural-chat-7b-v3-3", "prompt": "What is Deep Learning?", "max_tokens": 32, "temperature": 0}'
 ```