Skip to content

Commit

Permalink
TRTLLM ChatGLM CI
Browse files Browse the repository at this point in the history
  • Loading branch information
ydm-amazon committed Dec 21, 2023
1 parent 4d4d8c1 commit 8169eb8
Show file tree
Hide file tree
Showing 3 changed files with 25 additions and 1 deletion.
11 changes: 11 additions & 0 deletions .github/workflows/llm_integration.yml
Original file line number Diff line number Diff line change
Expand Up @@ -756,6 +756,17 @@ jobs:
python3 llm/client.py trtllm baichuan2-13b
rm -rf docker_env
docker rm -f $(docker ps -aq)
# Integration-test step for the chatglm3-6b model on the trtllm container.
# Runs from tests/integration. The script below, in order:
#   1. Deletes any leftover `models` directory.
#   2. Writes CUDA_VISIBLE_DEVICES=0,1,2,3 into the file `docker_env`
#      (`echo -n` means no trailing newline is written).
#      NOTE(review): presumably launch_container.sh reads docker_env to pass
#      the four GPUs to the container, matching "tp=4" in the name - confirm.
#   3. Runs llm/prepare.py for `trtllm chatglm3-6b`.
#      NOTE(review): presumably this populates ./models - confirm.
#   4. Starts the djl-serving image tagged $DJLSERVING_DOCKER_TAG via
#      launch_container.sh, passing $PWD/models, `trtllm` and `serve`.
#   5. Runs llm/client.py for `trtllm chatglm3-6b` against it.
#   6. Cleans up: removes docker_env and force-removes every container that
#      `docker ps -aq` lists (all containers, running or stopped).
# Steps 5-6 are skipped if an earlier command fails; the separate
# "On fail step" is what runs on failure.
- name: chatglm3-6b HF model with tp=4
working-directory: tests/integration
run: |
rm -rf models
echo -en "CUDA_VISIBLE_DEVICES=0,1,2,3" > docker_env
python3 llm/prepare.py trtllm chatglm3-6b
./launch_container.sh deepjavalibrary/djl-serving:$DJLSERVING_DOCKER_TAG $PWD/models trtllm \
serve
python3 llm/client.py trtllm chatglm3-6b
rm -rf docker_env
docker rm -f $(docker ps -aq)
- name: On fail step
if: ${{ failure() }}
working-directory: tests/integration
Expand Down
8 changes: 7 additions & 1 deletion tests/integration/llm/client.py
Original file line number Diff line number Diff line change
Expand Up @@ -467,7 +467,13 @@ def get_model_name():
"batch_size": [1],
"seq_length": [64, 128, 256],
"stream_output": True,
}
},
"chatglm3-6b": {
"max_memory_per_gpu": [22.0],
"batch_size": [1],
"seq_length": [64, 128, 256],
"stream_output": True,
},
}

deepspeed_rolling_batch_model_spec = {
Expand Down
7 changes: 7 additions & 0 deletions tests/integration/llm/prepare.py
Original file line number Diff line number Diff line change
Expand Up @@ -702,6 +702,13 @@
"option.baichuan_model_version": "v2_13b",
"option.output_formatter": "jsonlines",
"option.trust_remote_code": True
},
"chatglm3-6b": {
"option.model_id": "THUDM/chatglm3-6b",
"option.tensor_parallel_degree": 4,
"option.output_formatter": "jsonlines",
"option.trust_remote_code": True,
"option.chatglm_model_version": "chatglm3_6b"
}
}

Expand Down

0 comments on commit 8169eb8

Please sign in to comment.