- Run the controller
python3 -m serve.controller
- Run the model worker (set `MODEL_PATH` to the path of the model to serve first)
python3 -m serve.model_worker --model-path "$MODEL_PATH" --port 21002 --worker-address=http://localhost:21002 --model-name=SelFee-13b
- Run the web server
python3 -m serve.gradio_web_server --share