|
79 | 79 | ), |
80 | 80 | "Pixtral-12B": partial(Pixtral, model_path="mistralai/Pixtral-12B-2409"), |
81 | 81 | "Falcon2-VLM-11B": partial(Falcon2VLM, model_path="tiiuae/falcon-11B-vlm"), |
| 82 | + # "ming": partial(MingUniVisionInfer, model_name_or_path="/root/autodl-tmp/home/tongyujun/models/Ming-UniVision-16B-A3B"), |
| 83 | + # "ming_replace_refine_psnr": partial(MingUniVisionInfer_REPLACE, model_name_or_path="/root/autodl-tmp/home/tongyujun/models/Ming-UniVision-16B-A3B"), |
| 84 | + # "ming_concat": partial(MingUniVisionInfer_CONCAT, model_name_or_path="/root/autodl-tmp/home/tongyujun/models/Ming-UniVision-16B-A3B"), |
| 85 | + "bagel": partial(BagelInfer, model_name_or_path="/data/tongyujun/uni-tts/models/BAGEL-7B-MoT"), |
| 86 | + "bagel_ab": partial(BagelInfer, model_name_or_path="/data/tongyujun/uni-tts/models/BAGEL-7B-MoT"), |
| 87 | + "bagel1": partial(BagelInfer, model_name_or_path="/data/tongyujun/uni-tts/models/BAGEL-7B-MoT"), |
| 88 | + "bagel2": partial(BagelInfer, model_name_or_path="/data/tongyujun/uni-tts/models/BAGEL-7B-MoT"), |
| 89 | + |
| 90 | + "bagel_prompt": partial(BagelInfer_concat, model_name_or_path="/data/tongyujun/uni-tts/models/BAGEL-7B-MoT"), |
| 91 | + "bagel_prompt1": partial(BagelInfer_concat, model_name_or_path="/data/tongyujun/uni-tts/models/BAGEL-7B-MoT"), |
| 92 | + |
| 93 | + "bagel_concat": partial(BagelInfer_concat, model_name_or_path="/data/tongyujun/uni-tts/models/BAGEL-7B-MoT"), |
| 94 | + "bagel_zoomin": partial(BagelInfer_zoomin, model_name_or_path="/data/tongyujun/uni-tts/models/BAGEL-7B-MoT"), |
| 95 | + "bagel_zoomin_think": partial(BagelInfer_zoomin, model_name_or_path="/data/tongyujun/uni-tts/models/BAGEL-7B-MoT"), |
| 96 | + "bagel_zoomin_thinkv1": partial(BagelInfer_zoomin, model_name_or_path="/data/tongyujun/uni-tts/models/BAGEL-7B-MoT"), |
| 97 | + "bagel_zoomin_thinkv2": partial(BagelInfer_zoomin, model_name_or_path="/data/tongyujun/uni-tts/models/BAGEL-7B-MoT"), |
| 98 | + "bagel_zoomin_thinkv3": partial(BagelInfer_zoomin, model_name_or_path="/data/tongyujun/uni-tts/models/BAGEL-7B-MoT"), |
| 99 | + "bagel_zoomin_thinkv4": partial(BagelInfer_zoomin, model_name_or_path="/data/tongyujun/uni-tts/models/BAGEL-7B-MoT"), |
| 100 | + "bagel_zoomin_thinkv5": partial(BagelInfer_zoomin, model_name_or_path="/data/tongyujun/uni-tts/models/BAGEL-7B-MoT"), |
| 101 | + "bagel_zoomin_thinkv6": partial(BagelInfer_zoomin, model_name_or_path="/data/tongyujun/uni-tts/models/BAGEL-7B-MoT"), |
| 102 | + "bagel_zoomin_thinkv7": partial(BagelInfer_zoomin, model_name_or_path="/data/tongyujun/uni-tts/models/BAGEL-7B-MoT"), |
| 103 | + "bagel_zoomin_thinkv8": partial(BagelInfer_zoomin, model_name_or_path="/data/tongyujun/uni-tts/models/BAGEL-7B-MoT"), |
| 104 | + "bagel_zoomin_thinkv9": partial(BagelInfer_zoomin, model_name_or_path="/data/tongyujun/uni-tts/models/BAGEL-7B-MoT"), |
| 105 | + "bagel_think": partial(BagelInfer_think, model_name_or_path="/data/tongyujun/uni-tts/models/BAGEL-7B-MoT"), |
| 106 | + |
| 107 | + |
| 108 | + |
| 109 | + "bagel_zoomin_thinkbaseline": partial(BagelInfer_zoomin, model_name_or_path="/data/tongyujun/uni-tts/models/BAGEL-7B-MoT"), |
| 110 | + |
| 111 | + |
| 112 | + "bagel_zoomin_think_onlyimage": partial(BagelInfer_zoomin, model_name_or_path="/data/tongyujun/uni-tts/models/BAGEL-7B-MoT"), |
| 113 | + |
| 114 | + "bagel_gpt": partial(BagelInfer_GPT, model_name_or_path="/data/tongyujun/uni-tts/models/BAGEL-7B-MoT"), |
| 115 | + "bagel_gptv1": partial(BagelInfer_GPT, model_name_or_path="/data/tongyujun/uni-tts/models/BAGEL-7B-MoT"), |
| 116 | + "bagel_gptv2": partial(BagelInfer_GPT, model_name_or_path="/data/tongyujun/uni-tts/models/BAGEL-7B-MoT"), |
| 117 | + "bagel_gptv3": partial(BagelInfer_GPT, model_name_or_path="/data/tongyujun/uni-tts/models/BAGEL-7B-MoT"), |
| 118 | + "bagel_gptv4": partial(BagelInfer_GPT, model_name_or_path="/data/tongyujun/uni-tts/models/BAGEL-7B-MoT"), |
| 119 | + "bagel_gptv5": partial(BagelInfer_GPT, model_name_or_path="/data/tongyujun/uni-tts/models/BAGEL-7B-MoT"), |
| 120 | + "bagel_gptv6": partial(BagelInfer_GPT, model_name_or_path="/data/tongyujun/uni-tts/models/BAGEL-7B-MoT"), |
| 121 | + "bagel_gptv7": partial(BagelInfer_GPT, model_name_or_path="/data/tongyujun/uni-tts/models/BAGEL-7B-MoT"), |
| 122 | + "bagel_gptv8": partial(BagelInfer_GPT, model_name_or_path="/data/tongyujun/uni-tts/models/BAGEL-7B-MoT"), |
| 123 | + |
| 124 | + "bagel_seperate_ab_30": partial(BagelInfer_seperate, model_name_or_path="/data/tongyujun/uni-tts/models/BAGEL-7B-MoT"), |
| 125 | + "bagel_prompt_gen": partial(BagelInfer_prompt_gen, model_name_or_path="/data/tongyujun/uni-tts/models/BAGEL-7B-MoT"), |
| 126 | + "gpt_prompt_gen": partial(BagelInfer_prompt_gen, model_name_or_path="/data/tongyujun/uni-tts/models/BAGEL-7B-MoT"), |
| 127 | + "bagel_prompt_gen1": partial(BagelInfer_prompt_gen, model_name_or_path="/data/tongyujun/uni-tts/models/BAGEL-7B-MoT"), |
| 128 | + "gemini_prompt_gen": partial(BagelInfer_prompt_gen, model_name_or_path="/data/tongyujun/uni-tts/models/BAGEL-7B-MoT"), |
| 129 | + |
| 130 | + |
| 131 | + # "bagel_replace_psnr": partial(BagelInfer_replace, model_name_or_path="/data/tongyujun/uni-tts/models/BAGEL-7B-MoT"), |
| 132 | + |
82 | 133 | } |
83 | 134 |
|
84 | 135 | o1_key = os.environ.get('O1_API_KEY', None)  # None when O1_API_KEY is unset
|
127 | 178 | # GPT |
128 | 179 | "GPT4V": partial( |
129 | 180 | GPT4V, |
130 | | - model="gpt-4-1106-vision-preview", |
| 181 | + model="gpt-4-1106-preview", |
131 | 182 | temperature=0, |
132 | 183 | img_size=512, |
133 | 184 | img_detail="low", |
|
279 | 330 | max_tokens=2**14, |
280 | 331 | timeout=300, |
281 | 332 | ), |
| 333 | + "gpt-5.1": partial( |
| 334 | + GPT4V, |
| 335 | + model="gpt-5.1", |
| 336 | + img_detail="high", |
| 337 | + retry=3, |
| 338 | + verbose=False, |
| 339 | + max_tokens=2**14, |
| 340 | + timeout=300, |
| 341 | + ), |
| 342 | + "gpt-4o": partial( |
| 343 | + GPT4V, |
| 344 | + model="gpt-4o", |
| 345 | + img_detail="high", |
| 346 | + retry=3, |
| 347 | + verbose=False, |
| 348 | + max_tokens=2**14, |
| 349 | + timeout=300, |
| 350 | + ), |
| 351 | + # "Gemini-3-pro": partial( |
| 352 | + # GPT4V, |
| 353 | + # model="gemini-3-pro-preview", |
| 354 | + # img_detail="high", |
| 355 | + # retry=3, |
| 356 | + # verbose=False, |
| 357 | + # max_tokens=2**14, |
| 358 | + # timeout=300, |
| 359 | + # key=os.environ.get('GEMINI_API_KEY'),  # literal key redacted; read it from the environment |
| 360 | + # ), |
| 361 | + |
282 | 362 | # Gemini |
283 | 363 | "GeminiPro1-0": partial( |
284 | 364 | Gemini, model="gemini-1.0-pro", temperature=0, retry=10 |
|
295 | 375 | "GeminiFlash1-5-002": partial( |
296 | 376 | GPT4V, model="gemini-1.5-flash-002", temperature=0, retry=10 |
297 | 377 | ), # Internal Use Only |
| 378 | + "Gemini-3-pro": partial( |
| 379 | + GPT4V, model="gemini-3-pro-all", temperature=0, retry=10 |
| 380 | + ), |
| 381 | + "Gemini-2.5-pro": partial( |
| 382 | + GPT4V, model="gemini-2.5-pro-nothinking", temperature=0, retry=10 |
| 383 | + ), |
298 | 384 | "GeminiFlash2-0": partial( |
299 | 385 | Gemini, model="gemini-2.0-flash", temperature=0, retry=10 |
300 | 386 | ), |
|
307 | 393 | "GeminiPro2-5": partial( |
308 | 394 | Gemini, model="gemini-2.5-pro", temperature=0, retry=10 |
309 | 395 | ), |
| 396 | + |
| 397 | + # DeepSeek |
| 398 | + "DS-vl": partial( |
| 399 | + GPT4V, model="deepseek-vl2", temperature=0, retry=10 |
| 400 | + ), |
310 | 401 |
|
311 | 402 | # Qwen-VL |
312 | 403 | "QwenVLPlus": partial(QwenVLAPI, model="qwen-vl-plus", temperature=0, retry=10), |
313 | 404 | "QwenVLMax": partial(QwenVLAPI, model="qwen-vl-max", temperature=0, retry=10), |
314 | 405 | "QwenVLMax-250408": partial(QwenVLAPI, model="qwen-vl-max-2025-04-08", temperature=0, retry=10), |
| 406 | + "Qwen3VLPlus": partial(QwenVLAPI, model="qwen3-vl-plus", temperature=0, retry=10, key='sk-3a658ecf56284de185b5960e9b059745'), |
| 407 | + "Qwen3VL-A3B-30B": partial(QwenVLAPI, model="qwen3-vl-30b-a3b-instruct", temperature=0, retry=10, key='sk-3a658ecf56284de185b5960e9b059745'), |
| 408 | + "Qwen3vl-235b-a22b": partial(QwenVLAPI, model="qwen3-vl-235b-a22b-instruct", temperature=0, retry=10, key='sk-3a658ecf56284de185b5960e9b059745'), |
| 409 | + "Qwen3vl-8b": partial(QwenVLAPI, model="qwen3-vl-8b-instruct", temperature=0, retry=10, key='sk-3a658ecf56284de185b5960e9b059745'), |
| 410 | + "Qwen2.5vl-7b": partial(QwenVLAPI, model="qwen2.5-vl-7b-instruct", temperature=0, retry=10, key='sk-3a658ecf56284de185b5960e9b059745'), |
| 411 | + "Qwen2.5vl-72b": partial(QwenVLAPI, model="qwen2.5-vl-72b-instruct", temperature=0, retry=10, key='sk-3a658ecf56284de185b5960e9b059745'), |
315 | 412 |
|
316 | 413 | # Reka |
317 | 414 | "RekaEdge": partial(Reka, model="reka-edge-20240208"), |
|
1341 | 1438 | ), |
1342 | 1439 | "Qwen2.5-VL-7B-Instruct": partial( |
1343 | 1440 | Qwen2VLChat, |
1344 | | - model_path="Qwen/Qwen2.5-VL-7B-Instruct", |
| 1441 | + model_path="/root/autodl-tmp/home/tongyujun/models/Qwen2.5-VL-7B-Instruct", |
1345 | 1442 | min_pixels=1280 * 28 * 28, |
1346 | 1443 | max_pixels=16384 * 28 * 28, |
1347 | 1444 | use_custom_prompt=False, |
|
0 commit comments