Skip to content

Commit

Permalink
[ci] Change trtllm correctness testing to llama3-8b
Browse files Browse the repository at this point in the history
  • Loading branch information
xyang16 committed Jul 31, 2024
1 parent 5154298 commit bbbbe49
Show file tree
Hide file tree
Showing 3 changed files with 7 additions and 7 deletions.
2 changes: 1 addition & 1 deletion tests/integration/llm/client.py
Original file line number Diff line number Diff line change
Expand Up @@ -739,7 +739,7 @@ def get_model_name():
"return_full_text": True
}
},
"trtllm-llama3-1-8b": {
"trtllm-llama3-8b": {
"batch_size": [213],
"seq_length": [1],
"num_run": 66,
Expand Down
4 changes: 2 additions & 2 deletions tests/integration/llm/prepare.py
Original file line number Diff line number Diff line change
Expand Up @@ -939,10 +939,10 @@
"option.max_rolling_batch_size": 41,
"option.model_loading_timeout": 1800
},
"trtllm-llama3-1-8b": {
"trtllm-llama3-8b": {
"engine": "Python",
"option.task": "text-generation",
"option.model_id": "s3://djl-llm/llama-3.1-8b-hf/",
"option.model_id": "s3://djl-llm/llama-3-8b-hf/",
"option.rolling_batch": "trtllm",
"option.tensor_parallel_degree": 4,
"option.max_rolling_batch_size": 213
Expand Down
8 changes: 4 additions & 4 deletions tests/integration/tests.py
Original file line number Diff line number Diff line change
Expand Up @@ -849,11 +849,11 @@ def test_codestral_22b(self):
r.launch("CUDA_VISIBLE_DEVICES=0,1,2,3")
client.run("correctness trtllm-codestral-22b".split())

-def test_llama3_1_8b(self):
-with Runner('tensorrt-llm', 'llama3-1-8b') as r:
-prepare.build_correctness_model("trtllm-llama3-1-8b")
+def test_llama3_8b(self):
+with Runner('tensorrt-llm', 'llama3-8b') as r:
+prepare.build_correctness_model("trtllm-llama3-8b")
r.launch("CUDA_VISIBLE_DEVICES=0,1,2,3")
-client.run("correctness trtllm-llama3-1-8b".split())
+client.run("correctness trtllm-llama3-8b".split())


@pytest.mark.correctness
Expand Down

0 comments on commit bbbbe49

Please sign in to comment.