Change API port 8000 -> 52415 (#915)

* 8000 -> 52415

* don't grab the API port for placement

---------

Co-authored-by: rltakashige <rl.takashige@gmail.com>
This commit is contained in:
Evan Quiney
2025-12-18 18:39:44 +00:00
committed by GitHub
parent 5bd39e84d9
commit 9815283a82
9 changed files with 16 additions and 14 deletions

View File

@@ -7,7 +7,7 @@ import requests
def stream_chat(host: str, query: str) -> None:
url = f"http://{host}:8000/v1/chat/completions"
url = f"http://{host}:52415/v1/chat/completions"
headers = {"Content-Type": "application/json"}
payload = {
"model": "mlx-community/Llama-3.2-1B-Instruct-4bit",

View File

@@ -10,7 +10,7 @@ HOST="$1"
shift
QUERY="$*"
curl -sN -X POST "http://$HOST:8000/v1/chat/completions" \
curl -sN -X POST "http://$HOST:52415/v1/chat/completions" \
-H "Content-Type: application/json" \
-d "{
\"model\": \"mlx-community/Kimi-K2-Thinking\",