@@ -882,7 +882,8 @@ void ov::npuw::LLMInferRequest::infer_generate(ov::SoPtr<ov::ITensor> input_ids,
882882 uu::fill_tensor_bytes (m_kvcache_request->get_tensor (m_kvcache_in_ports.at (m_input_ids_name)), 0u );
883883 uu::fill_tensor<int64_t >(m_kvcache_request->get_tensor (m_kvcache_in_ports.at (layer_names::attention_mask)),
884884 0 );
885- uu::fill_tensor<int64_t >(m_kvcache_request->get_tensor (m_kvcache_in_ports.at (layer_names::position_ids)), 0 );
885+ uu::fill_tensor<int64_t >(m_kvcache_request->get_tensor (m_kvcache_in_ports.at (layer_names::position_ids)),
886+ 0 );
886887 if (token_type_ids) {
887888 uu::fill_tensor<int64_t >(
888889 m_kvcache_request->get_tensor (m_kvcache_in_ports.at (layer_names::token_type_ids)),
@@ -914,8 +915,7 @@ void ov::npuw::LLMInferRequest::infer_generate(ov::SoPtr<ov::ITensor> input_ids,
914915 input_ids->get_byte_size ());
915916
916917 if (token_type_ids) {
917- auto kv_token_type_ids =
918- m_kvcache_request->get_tensor (m_kvcache_in_ports.at (layer_names::token_type_ids));
918+ auto kv_token_type_ids = m_kvcache_request->get_tensor (m_kvcache_in_ports.at (layer_names::token_type_ids));
919919 util::copy_to_right (token_type_ids, kv_token_type_ids);
920920 }
921921
@@ -928,10 +928,10 @@ void ov::npuw::LLMInferRequest::infer_generate(ov::SoPtr<ov::ITensor> input_ids,
928928 attention_mask->get_size () - input_tokens_len,
929929 kv_attn_mask->data <int64_t >());
930930 if (input_tokens_len < kvcache_desc.max_generation_token_len ) {
931- std::fill_n (kv_attn_mask-> data < int64_t >() + kv_attn_mask-> get_size () -
932- kvcache_desc.max_generation_token_len ,
933- kvcache_desc.max_generation_token_len - input_tokens_len,
934- 0 );
931+ std::fill_n (
932+ kv_attn_mask-> data < int64_t >() + kv_attn_mask-> get_size () - kvcache_desc.max_generation_token_len ,
933+ kvcache_desc.max_generation_token_len - input_tokens_len,
934+ 0 );
935935 }
936936 std::fill_n (kv_attn_mask->data <int64_t >() + kv_attn_mask->get_size () - input_tokens_len, input_tokens_len, 1 );
937937
0 commit comments