Skip to content

Commit

Permalink
[README] Update README.md. (#435)
Browse files Browse the repository at this point in the history
  • Loading branch information
Duyi-Wang authored Jun 5, 2024
1 parent 669bd66 commit f2bb303
Show file tree
Hide file tree
Showing 3 changed files with 6 additions and 6 deletions.
4 changes: 2 additions & 2 deletions README.md
Original file line number Diff line number Diff line change
Expand Up @@ -337,8 +337,8 @@ pip install vllm-xft
export $(python -c 'import xfastertransformer as xft; print(xft.get_env())')
python -m vllm.entrypoints.openai.api_server \
- --model ${XFT_MODEL} \
- --tokenizer ${TOKENIZER_DIR} \
+ --model ${MODEL_PATH} \
+ --tokenizer ${TOKEN_PATH} \
--dtype bf16 \
--kv-cache-dtype fp16 \
--served-model-name xft \
Expand Down
4 changes: 2 additions & 2 deletions README_CN.md
Original file line number Diff line number Diff line change
Expand Up @@ -340,8 +340,8 @@ pip install vllm-xft
export $(python -c 'import xfastertransformer as xft; print(xft.get_env())')
python -m vllm.entrypoints.openai.api_server \
- --model ${XFT_MODEL} \
- --tokenizer ${TOKENIZER_DIR} \
+ --model ${MODEL_PATH} \
+ --tokenizer ${TOKEN_PATH} \
--dtype bf16 \
--kv-cache-dtype fp16 \
--served-model-name xft \
Expand Down
4 changes: 2 additions & 2 deletions serving/vllm-xft.md
Original file line number Diff line number Diff line change
Expand Up @@ -15,8 +15,8 @@ pip install vllm-xft
export $(python -c 'import xfastertransformer as xft; print(xft.get_env())')

python -m vllm.entrypoints.openai.api_server \
- --model ${XFT_MODEL} \
- --tokenizer ${TOKENIZER_DIR} \
+ --model ${MODEL_PATH} \
+ --tokenizer ${TOKEN_PATH} \
--dtype bf16 \
--kv-cache-dtype fp16 \
--served-model-name xft \
Expand Down

0 comments on commit f2bb303

Please sign in to comment.