Skip to content

Commit

Permalink
Debug
Browse files: browse the repository at this point in the history
  • Loading branch information
zachgk committed Apr 22, 2024
1 parent 071d920 commit 49501d6
Show file tree
Hide file tree
Showing 3 changed files with 13 additions and 12 deletions.
2 changes: 1 addition & 1 deletion .github/workflows/benchmark-nightly.yml
Original file line number Diff line number Diff line change
Expand Up @@ -14,6 +14,6 @@ jobs:
uses: ./.github/workflows/instant_benchmark.yml
secrets: inherit
with:
running_template: tests/benchmark/nightly/g5-2xl.txt
running_template: ./benchmark/nightly/g5-2xl.txt
instance: g5.2xlarge
record: cloudwatch
18 changes: 9 additions & 9 deletions .github/workflows/instant_benchmark.yml
Original file line number Diff line number Diff line change
Expand Up @@ -71,12 +71,12 @@ jobs:
https://api.github.com/repos/deepjavalibrary/djl-serving/actions/runners/registration-token \
--fail \
| jq '.token' | tr -d '"' )
./start_instance.sh action_ib_${{ github.event.inputs.instance }} $token djl-serving
./start_instance.sh action_ib_${{ inputs.instance }} $token djl-serving
outputs:
gpu_instance_id: ${{ steps.create_instance.outputs.action_ib_instance_id }}

environment-setup:
runs-on: [ self-hosted, "${{ github.event.inputs.instance }}" ]
runs-on: [ self-hosted, "${{ inputs.instance }}" ]
timeout-minutes: 15
needs: [ create-runners ]
steps:
Expand All @@ -102,14 +102,14 @@ jobs:
working-directory: tests/integration
id: generate_matrix
run: |
python3 instant_benchmark.py --parse ${{ github.event.inputs.running_template }} \
--container "${{ github.event.inputs.container }}"
python3 instant_benchmark.py --parse ${{ inputs.running_template }} \
--container "${{ inputs.container }}"
outputs:
jobs: ${{ steps.generate_matrix.outputs.jobs }}
template: ${{ steps.generate_matrix.outputs.template }}

benchmark_run:
runs-on: [ self-hosted, "${{ github.event.inputs.instance }}" ]
runs-on: [ self-hosted, "${{ inputs.instance }}" ]
timeout-minutes: 30
needs: [ environment-setup ]
strategy:
Expand All @@ -136,7 +136,7 @@ jobs:
run: |
echo "${{ needs.environment-setup.outputs.template }}" >> template.json
python3 instant_benchmark.py --template template.json \
--job ${{ matrix.job }} --instance ${{ github.event.inputs.instance }}
--job ${{ matrix.job }} --instance ${{ inputs.instance }}
bash instant_benchmark.sh
- name: Configure AWS Credentials
Expand All @@ -145,12 +145,12 @@ jobs:
role-to-assume: arn:aws:iam::185921645874:role/github-actions-djl-serving
aws-region: us-east-1
- name: Record benchmark job
if: ${{ github.event.inputs.record == 'table' || github.event.inputs.record == 'cloudwatch' }}
if: ${{ inputs.record == 'table' || inputs.record == 'cloudwatch' }}
working-directory: tests/integration
run: |
python3 record_benchmark.py --template template.json \
--job ${{ matrix.job }} --instance ${{ github.event.inputs.instance }} \
--model models/test --record ${{ github.event.inputs.record }}
--job ${{ matrix.job }} --instance ${{ inputs.instance }} \
--model models/test --record ${{ inputs.record }}
- name: Get serving logs
if: always()
working-directory: tests/integration
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -7,9 +7,10 @@ CONCURRENCY={1,16,32}
[serving_properties]
engine=Python
option.rolling_batch=vllm
option.model_id=mistralai/Mistral-7B-v0.1
option.model_id=NousResearch/Hermes-2-Pro-Mistral-7B
option.tensor_parallel_degree=max
[aws_curl]
TOKENIZER=mistralai/Mistral-7B-v0.1 ./awscurl -c $CONCURRENCY -N 10 \
TOKENIZER=NousResearch/Hermes-2-Pro-Mistral-7B ./awscurl -c $CONCURRENCY -N 10 \
-X POST http://127.0.0.1:8080/invocations \
--connect-timeout 60 -H "Content-type: application/json" \
-d '{"inputs":"The new movie that got Oscar this year","parameters":{"max_new_tokens":256, "do_sample":true}}' \
Expand Down

0 comments on commit 49501d6

Please sign in to comment.