We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 7c01955 commit 2f24a00 · Copy full SHA for 2f24a00
tests/e2e/multicard/test_quantization.py
@@ -27,7 +27,7 @@
27
28
def test_models_distributed_quantized_W8A8():
29
example_prompts = [
30
- "Hello, my name is",
+ "The president of the United States is",
31
]
32
max_tokens = 5
33
with VllmRunner(snapshot_download("neuralmagic/Qwen2.5-3B-quantized.w8a8"),
@@ -38,7 +38,7 @@ def test_models_distributed_quantized_W8A8():
38
vllm_output = vllm_model.generate_greedy(example_prompts, max_tokens)
39
40
golden_results = [
41
- 'Hello, my name is the head of state and',
+ 'The president of the United States is the head of state and',
42
43
44
for i in range(len(vllm_output)):
0 commit comments