Skip to content

Commit

Permalink
dev with scale factor = 8
Browse files Browse the repository at this point in the history
  • Loading branch information
e-ddykim committed Jan 11, 2025
1 parent ca1cf6f commit 95a301e
Showing 1 changed file with 2 additions and 2 deletions.
4 changes: 2 additions & 2 deletions src/plugins/intel_gpu/src/runtime/execution_config.cpp
Original file line number Diff line number Diff line change
Expand Up @@ -61,7 +61,7 @@ void ExecutionConfig::set_default() {
std::make_tuple(ov::hint::kv_cache_precision, ov::element::undefined),
std::make_tuple(ov::intel_gpu::hint::enable_kernels_reuse, false),
std::make_tuple(ov::weights_path, ""),
std::make_tuple(ov::hint::activations_scale_factor, -1.f),
std::make_tuple(ov::hint::activations_scale_factor, 8.f),

// Legacy API properties
std::make_tuple(ov::intel_gpu::nv12_two_inputs, false),
Expand Down Expand Up @@ -275,8 +275,8 @@ void ExecutionConfig::apply_user_properties(const cldnn::device_info& info) {
// Forwards selected hint properties, together with the supplied rt_info map, to apply_rt_info_property.
// `info` is consulted only for its supports_immad flag, which gates part of the list.
// NOTE(review): this text comes from a rendered commit diff (2 additions / 2 deletions) without +/- markers,
// so the activations_scale_factor call shows up twice below. Presumably the guarded occurrence is the removed
// line and the unguarded one is the added line; confirm against the actual file before relying on either.
void ExecutionConfig::apply_rt_info(const cldnn::device_info& info, const ov::RTMap& rt_info) {
// Properties in this branch are forwarded only when info.supports_immad is false.
if (!info.supports_immad) {
apply_rt_info_property(ov::hint::kv_cache_precision, rt_info);
apply_rt_info_property(ov::hint::activations_scale_factor, rt_info);
}
// The calls below run regardless of info.supports_immad.
apply_rt_info_property(ov::hint::activations_scale_factor, rt_info);
apply_rt_info_property(ov::hint::dynamic_quantization_group_size, rt_info);
}

Expand Down

0 comments on commit 95a301e

Please sign in to comment.