Skip to content

Commit

Permalink
Update dynamic_quantize_gpu_test.cpp
Browse files Browse the repository at this point in the history
  • Loading branch information
p-durandin authored Jan 14, 2025
1 parent 9110cb5 commit beee18c
Showing 1 changed file with 1 addition and 1 deletion.
Original file line number Diff line number Diff line change
Expand Up @@ -294,9 +294,9 @@ TEST_F(dynamic_quantization_gpu_tests, simple_quantizing_kv_cache_reordered_asym
// Runs the fixture's test_dynamic_quantization helper with QuantizationType::Asymmetric,
// data_types::i8 for both data-type arguments, OutputStorageType::Planar, and the
// "dynamic_quantize_gpu_kv_cache" string as the last argument.
// NOTE(review): {-1, -1, 4, 64} looks like a dynamic shape and {1, 35, 4, 64} the concrete
// shape fed at run time — confirm against the helper's signature.
// NOTE(review): the meaning of the leading `false` and of UINT64_MAX is defined by the
// helper, which is not visible here — verify before changing either value.
TEST_F(dynamic_quantization_gpu_tests, simple_quantizing_kv_cache_batched_reordered_asym_planar_i8_zp) {
this->test_dynamic_quantization(false, {-1, -1, 4, 64}, {1, 35, 4, 64}, QuantizationType::Asymmetric, UINT64_MAX,
data_types::i8, data_types::i8, OutputStorageType::Planar, "dynamic_quantize_gpu_kv_cache");
}

// Runs the fixture's test_dynamic_quantization helper with QuantizationType::Asymmetric,
// data_types::i8 followed by data_types::f16 as the two data-type arguments,
// OutputStorageType::InterleavedScalesZP, the "dynamic_quantize_gpu_kv_cache" string,
// and an extra trailing `true` argument.
// NOTE(review): {-1, 8, -1, 128} looks like a dynamic shape and {1, 8, 52, 128} the concrete
// shape fed at run time — confirm against the helper's signature.
// NOTE(review): judging by the test name, the trailing `true` presumably requests zero-valued
// input data — confirm against the helper's parameter list.
TEST_F(dynamic_quantization_gpu_tests, simple_quantizing_kv_cache_inner_most_dim_zero_values_asym) {
this->test_dynamic_quantization(false, {-1, 8, -1, 128}, {1, 8, 52, 128}, QuantizationType::Asymmetric, UINT64_MAX,
data_types::i8, data_types::f16, OutputStorageType::InterleavedScalesZP, "dynamic_quantize_gpu_kv_cache", true);

}

0 comments on commit beee18c

Please sign in to comment.