1717import llm_bench_utils .output_file
1818import llm_bench_utils .gen_output_data as gen_output_data
1919import llm_bench_utils .parse_json_data as parse_json_data
20+ import llm_bench_utils .prompt_utils as pu
2021from pathlib import Path
2122
22-
2323FW_UTILS = {'pt' : llm_bench_utils .pt_utils , 'ov' : llm_bench_utils .ov_utils }
2424
2525DEFAULT_OUTPUT_TOKEN_SIZE = 512
@@ -37,13 +37,20 @@ def run_visual_language_generation_optimum(
3737 prompts = []
3838 inputs = [inputs ] if not isinstance (inputs , (list , tuple )) else inputs
3939 for input_data in inputs :
40- if input_data .get ("media" , None ):
40+ if input_data .get ("video" , None ):
41+ entry = Path (input_data ["video" ])
42+ required_frames = args .get ('video_frames' )
43+ ordered_frames = pu .split_video_into_frames (entry , required_frames )
44+ images .extend (ordered_frames )
45+
46+ elif input_data .get ("media" , None ):
4147 entry = Path (input_data ["media" ])
4248 if entry .is_dir ():
4349 for file in sorted (entry .iterdir ()):
4450 images .append (load_image (str (file )))
45- else :
46- images .append (load_image (input_data ["media" ]))
51+ else : images .append (load_image (input_data ["media" ]))
52+
53+
4754 prompts .append (input_data ["prompt" ])
4855 prefix = '[warm-up]' if num == 0 else '[{}]' .format (num )
4956 log .info (f'{ prefix } [P{ prompt_index } ] Input image nums:{ len (images )} ' )
@@ -365,14 +372,13 @@ def run_visual_language_generation_benchmark(model_path, framework, device, args
365372
366373def get_image_text_prompt (args ):
367374 vlm_file_list = []
368- output_data_list , is_json_data = model_utils .get_param_from_file (args , [' media' , "prompt" ])
375+ output_data_list , is_json_data = model_utils .get_param_from_file (args , [" media" , "prompt" ])
369376 if is_json_data :
370377 vlm_param_list = parse_json_data .parse_vlm_json_data (output_data_list )
371378 if len (vlm_param_list ) > 0 :
372379 for vlm_file in vlm_param_list :
373380 if args ['prompt_file' ] is not None and len (args ['prompt_file' ]) > 0 :
374381 vlm_file ['media' ] = model_utils .resolve_media_file_path (vlm_file .get ("media" ), args ['prompt_file' ][0 ])
375382 vlm_file_list .append (vlm_file )
376- else :
377- vlm_file_list .append (output_data_list )
383+ else : vlm_file_list .append (output_data_list )
378384 return vlm_file_list
0 commit comments