1010n_frames = 4
1111topk = 5
1212action_representation = 'GT_random_narration'
13- gpt_model = 'gpt-4o-mini-2024-07-18'
14- # gpt_model = 'gpt-4o-2024-08-06'
15- perspective = 'third_person'
13+ #gpt_model = 'gpt-4o-mini-2024-07-18'
14+ gpt_model = 'gpt-4o-2024-08-06'
15+ perspective = 'first_person'
16+ benchmark_testing = True
1617
1718
1819def benchmark_avion_mcq (n_samples ):
@@ -26,6 +27,7 @@ def benchmark_avion_mcq(n_samples):
2627 question_type = 'mc_' ,
2728 action_representation = action_representation ,
2829 perspective = perspective ,
30+ benchmark_testing = benchmark_testing ,
2931 topk = topk )
3032 inferencer .multi_process_run (n_samples )
3133
@@ -40,6 +42,7 @@ def benchmark_tim_mcq(n_samples):
4042 question_type = 'mc_' ,
4143 action_representation = action_representation ,
4244 perspective = perspective ,
45+ benchmark_testing = benchmark_testing ,
4346 topk = topk )
4447 inferencer .multi_process_run (n_samples )
4548
@@ -53,6 +56,7 @@ def benchmark_random_mcq(n_samples):
5356 question_type = 'mc_' ,
5457 action_representation = action_representation ,
5558 perspective = perspective ,
59+ benchmark_testing = benchmark_testing ,
5660 topk = topk )
5761
5862 inferencer .multi_process_run (n_samples )
@@ -61,4 +65,4 @@ def benchmark_random_mcq(n_samples):
6165if __name__ == '__main__' :
6266 benchmark_avion_mcq (100 )
6367 benchmark_tim_mcq (100 )
64- benchmark_random_mcq (100 )
68+ # benchmark_random_mcq(100)
0 commit comments