|
385 | 385 | ), |
386 | 386 | "minicpmo_26": VLMTestInfo( |
387 | 387 | models=["openbmb/MiniCPM-o-2_6"], |
388 | | - test_type=(VLMTestType.IMAGE), |
389 | | - prompt_formatter=lambda img_prompt: f"<|begin_of_text|><|start_header_id|>user<|end_header_id|>\n\n{img_prompt}<|eot_id|><|start_header_id|>assistant<|end_header_id|>\n\n", # noqa: E501 |
390 | | - img_idx_to_prompt=lambda idx: "(<image>./</image>)\n", |
391 | | - max_model_len=4096, |
392 | | - max_num_seqs=2, |
393 | | - get_stop_token_ids=lambda tok: tok.convert_tokens_to_ids(['<|im_end|>', '<|endoftext|>']), # noqa: E501 |
394 | | - hf_output_post_proc=model_utils.minicpmv_trunc_hf_output, |
395 | | - patch_hf_runner=model_utils.minicpmo_26_patch_hf_runner, |
396 | | - ), |
397 | | - "minicpmo_26_multi_image": VLMTestInfo( |
398 | | - models=["openbmb/MiniCPM-o-2_6"], |
399 | | - test_type=(VLMTestType.MULTI_IMAGE), |
| 388 | + test_type=(VLMTestType.IMAGE, VLMTestType.MULTI_IMAGE), |
400 | 389 | prompt_formatter=lambda img_prompt: f"<|begin_of_text|><|start_header_id|>user<|end_header_id|>\n\n{img_prompt}<|eot_id|><|start_header_id|>assistant<|end_header_id|>\n\n", # noqa: E501 |
401 | 390 | img_idx_to_prompt=lambda idx: "(<image>./</image>)\n", |
402 | 391 | max_model_len=4096, |
403 | 392 | max_num_seqs=2, |
404 | 393 | get_stop_token_ids=lambda tok: tok.convert_tokens_to_ids(['<|im_end|>', '<|endoftext|>']), # noqa: E501 |
405 | 394 | hf_output_post_proc=model_utils.minicpmv_trunc_hf_output, |
406 | 395 | patch_hf_runner=model_utils.minicpmo_26_patch_hf_runner, |
407 | | - marks=[large_gpu_mark(min_gb=32)], |
408 | 396 | ), |
409 | 397 | "minicpmv_26": VLMTestInfo( |
410 | 398 | models=["openbmb/MiniCPM-V-2_6"], |
411 | | - test_type=(VLMTestType.IMAGE), |
412 | | - prompt_formatter=lambda img_prompt: f"<|begin_of_text|><|start_header_id|>user<|end_header_id|>\n\n{img_prompt}<|eot_id|><|start_header_id|>assistant<|end_header_id|>\n\n", # noqa: E501 |
413 | | - img_idx_to_prompt=lambda idx: "(<image>./</image>)\n", |
414 | | - max_model_len=4096, |
415 | | - max_num_seqs=2, |
416 | | - get_stop_token_ids=lambda tok: tok.convert_tokens_to_ids(['<|im_end|>', '<|endoftext|>']), # noqa: E501 |
417 | | - hf_output_post_proc=model_utils.minicpmv_trunc_hf_output, |
418 | | - patch_hf_runner=model_utils.minicpmv_26_patch_hf_runner, |
419 | | - ), |
420 | | - "minicpmv_26_multi_image": VLMTestInfo( |
421 | | - models=["openbmb/MiniCPM-V-2_6"], |
422 | | - test_type=(VLMTestType.MULTI_IMAGE), |
| 399 | + test_type=(VLMTestType.IMAGE, VLMTestType.MULTI_IMAGE), |
423 | 400 | prompt_formatter=lambda img_prompt: f"<|begin_of_text|><|start_header_id|>user<|end_header_id|>\n\n{img_prompt}<|eot_id|><|start_header_id|>assistant<|end_header_id|>\n\n", # noqa: E501 |
424 | 401 | img_idx_to_prompt=lambda idx: "(<image>./</image>)\n", |
425 | 402 | max_model_len=4096, |
426 | 403 | max_num_seqs=2, |
427 | 404 | get_stop_token_ids=lambda tok: tok.convert_tokens_to_ids(['<|im_end|>', '<|endoftext|>']), # noqa: E501 |
428 | 405 | hf_output_post_proc=model_utils.minicpmv_trunc_hf_output, |
429 | 406 | patch_hf_runner=model_utils.minicpmv_26_patch_hf_runner, |
430 | | - marks=[large_gpu_mark(min_gb=32)], |
431 | 407 | ), |
432 | 408 | "molmo": VLMTestInfo( |
433 | 409 | models=["allenai/Molmo-7B-D-0924"], |
|
0 commit comments