@@ -896,7 +896,8 @@ void ov::npuw::LLMInferRequest::infer_generate(ov::SoPtr<ov::ITensor> input_ids,
896896 uu::fill_tensor_bytes (m_kvcache_request->get_tensor (m_kvcache_in_ports.at (m_input_ids_name)), 0u );
897897 uu::fill_tensor<int64_t >(m_kvcache_request->get_tensor (m_kvcache_in_ports.at (layer_names::attention_mask)),
898898 0 );
899- uu::fill_tensor<int64_t >(m_kvcache_request->get_tensor (m_kvcache_in_ports.at (layer_names::position_ids)), 0 );
899+ uu::fill_tensor<int64_t >(m_kvcache_request->get_tensor (m_kvcache_in_ports.at (layer_names::position_ids)),
900+ 0 );
900901 if (token_type_ids) {
901902 uu::fill_tensor<int64_t >(
902903 m_kvcache_request->get_tensor (m_kvcache_in_ports.at (layer_names::token_type_ids)),
@@ -928,8 +929,7 @@ void ov::npuw::LLMInferRequest::infer_generate(ov::SoPtr<ov::ITensor> input_ids,
928929 input_ids->get_byte_size ());
929930
930931 if (token_type_ids) {
931- auto kv_token_type_ids =
932- m_kvcache_request->get_tensor (m_kvcache_in_ports.at (layer_names::token_type_ids));
932+ auto kv_token_type_ids = m_kvcache_request->get_tensor (m_kvcache_in_ports.at (layer_names::token_type_ids));
933933 util::copy_to_right (token_type_ids, kv_token_type_ids);
934934 }
935935
@@ -942,10 +942,10 @@ void ov::npuw::LLMInferRequest::infer_generate(ov::SoPtr<ov::ITensor> input_ids,
942942 attention_mask->get_size () - input_tokens_len,
943943 kv_attn_mask->data <int64_t >());
944944 if (input_tokens_len < kvcache_desc.max_generation_token_len ) {
945- std::fill_n (kv_attn_mask-> data < int64_t >() + kv_attn_mask-> get_size () -
946- kvcache_desc.max_generation_token_len ,
947- kvcache_desc.max_generation_token_len - input_tokens_len,
948- 0 );
945+ std::fill_n (
946+ kv_attn_mask-> data < int64_t >() + kv_attn_mask-> get_size () - kvcache_desc.max_generation_token_len ,
947+ kvcache_desc.max_generation_token_len - input_tokens_len,
948+ 0 );
949949 }
950950 std::fill_n (kv_attn_mask->data <int64_t >() + kv_attn_mask->get_size () - input_tokens_len, input_tokens_len, 1 );
951951
0 commit comments