-
Notifications
You must be signed in to change notification settings - Fork 1
Expand file tree
/
Copy patheval_qwen_generative.sh
More file actions
42 lines (35 loc) · 1.57 KB
/
eval_qwen_generative.sh
File metadata and controls
42 lines (35 loc) · 1.57 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
#!/bin/bash
# Copyright (c) Meta Platforms, Inc. and affiliates.
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
# http://www.apache.org/licenses/LICENSE-2.0
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
# Launches the generative `maestro_ob2` evaluation through
# evals/cli/multimodal_eval.py on a single node / single process, using the
# Qwen2.5-VL-72B-Instruct checkpoint as the model and
# DeepSeek-R1-Distill-Llama-70B as the judge.
#
# Usage: set ROOT_DIR below to the benchmark root, then run this script from
# the repository root (the current directory is prepended to PYTHONPATH and
# the entry point is referenced by a relative path).

# Abort on command failure, unset variables, and failures inside pipelines.
set -euo pipefail

# Prepend the current directory to PYTHONPATH. The ${VAR:+...} form appends
# the previous value only when it is set and non-empty, which avoids a
# trailing ':' and keeps the expansion valid under `set -u`.
export PYTHONPATH="${PWD}${PYTHONPATH:+:${PYTHONPATH}}"

# Root directory holding the ob2 data, the model checkpoints and the run
# output directory. Replace the placeholder before running.
ROOT_DIR=/PATH/TO/BENCHMARK_ROOT

# Fail fast with a clear message when the placeholder was not replaced.
if [[ ! -d "${ROOT_DIR}" ]]; then
  printf 'error: ROOT_DIR does not exist: %s\n' "${ROOT_DIR}" >&2
  exit 1
fi

# Per-task/predictor arguments, passed to the CLI as one JSON string.
# Building it in a heredoc keeps ROOT_DIR inside a single shell word even if
# the path contains whitespace or glob characters.
# NOTE(review): ROOT_DIR is spliced in verbatim; a path containing '"' or '\'
# would yield invalid JSON.
task_args=$(
  cat <<EOF
{
"maestro_ob2-maestro_ob2_qwen": {
"jsonl_dataset_path": "${ROOT_DIR}/ob2/structured_goals.json",
"max_gen_len": 1024,
"digital_key_only": "0",
"longitudinal_positive_only": "0",
"transcription_dataset_path": "${ROOT_DIR}/ob2/ob2_transcriptions_250501.json",
"digital_state_path": "${ROOT_DIR}/ob2/digital_state_v2.4.4.json",
"longitudinal_history_path": "${ROOT_DIR}/ob2/structured_goals_longitudinal_history_v244.json"
}
}
EOF
)

torchrun --nnodes=1 --nproc-per-node=1 --max-restarts=1 \
  evals/cli/multimodal_eval.py \
  --tasks maestro_ob2 \
  --dataset_dir "${ROOT_DIR}/ob2/clipped_videos" \
  --model_path "${ROOT_DIR}/models/Qwen2.5-VL-72B-Instruct/" \
  --predictor_name maestro_ob2_qwen \
  --task_args "${task_args}" \
  --dump_dir "${ROOT_DIR}/evals_runs" \
  --number_of_samples 32 \
  --mode generative \
  --judge_path "${ROOT_DIR}/models/DeepSeek-R1-Distill-Llama-70B" \
  --device_map auto