File size: 290 Bytes
56b9716
 
 
 
 
3425837
 
56b9716
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
#!/bin/bash

# Launch the vLLM OpenAI-compatible API server for Kimi-Dev-72B.
#
# Usage: this script [extra api_server arguments...]
#
# Every setting below can be overridden through the environment; when a
# variable is unset or empty the original hard-coded value is used:
#   KIMI_PYTHON         Python interpreter to run       (default: python)
#   KIMI_MODEL          value for --model               (default: moonshotai/Kimi-Dev-72B)
#   KIMI_TP_SIZE        value for --tensor-parallel-size (default: 4)
#   KIMI_MAX_NUM_SEQS   value for --max-num-seqs        (default: 4)
#   KIMI_MAX_MODEL_LEN  value for --max-model-len       (default: 65536)
#   KIMI_GPU_MEM_UTIL   value for --gpu-memory-utilization (default: 0.9)
#   KIMI_HOST           value for --host                (default: localhost)
#   KIMI_SERVED_NAME    value for --served-model-name   (default: kimi-dev)
#   KIMI_PORT           value for --port                (default: 8080)
#
# The KIMI_ prefix is deliberate: generic names such as HOST or PORT are often
# already present in the environment and would silently change the defaults.

# Build the argument list as an array so values containing spaces survive
# intact and each flag stays on its own line.
server_args=(
    --model "${KIMI_MODEL:-moonshotai/Kimi-Dev-72B}"
    --tensor-parallel-size "${KIMI_TP_SIZE:-4}"
    --max-num-seqs "${KIMI_MAX_NUM_SEQS:-4}"
    --max-model-len "${KIMI_MAX_MODEL_LEN:-65536}"
    --gpu-memory-utilization "${KIMI_GPU_MEM_UTIL:-0.9}"
    # NOTE(review): "localhost" presumably restricts the listener to the
    # loopback interface; set KIMI_HOST if remote clients must connect.
    --host "${KIMI_HOST:-localhost}"
    --served-model-name "${KIMI_SERVED_NAME:-kimi-dev}"
    --port "${KIMI_PORT:-8080}"
)

# exec replaces this shell with the server process, so signals sent to the
# script's PID (e.g. SIGTERM from a supervisor) reach the server directly and
# the server's exit status becomes the script's exit status.
# Extra arguments given to the script are forwarded after the defaults.
exec "${KIMI_PYTHON:-python}" -m vllm.entrypoints.openai.api_server \
    "${server_args[@]}" "$@"