|
15 | 15 |
|
16 | 16 | from otx.core.types.task import OTXTaskType |
17 | 17 |
|
| 18 | +CLASSIFICATION_BENCHMARK_CRITERIA = [ |
| 19 | + Criterion(name="train/epoch", summary="max", compare="<", margin=0.1), |
| 20 | + Criterion(name="train/e2e_time", summary="max", compare="<", margin=0.1), |
| 21 | + Criterion(name="train/gpu_mem", summary="max", compare="<", margin=0.1), |
| 22 | + Criterion(name="val/accuracy", summary="max", compare=">", margin=0.1), |
| 23 | + Criterion(name="test/accuracy", summary="max", compare=">", margin=0.1), |
| 24 | + Criterion(name="export/accuracy", summary="max", compare=">", margin=0.1), |
| 25 | + Criterion(name="optimize/accuracy", summary="max", compare=">", margin=0.1), |
| 26 | + Criterion(name="train/iter_time", summary="mean", compare="<", margin=0.1), |
| 27 | + Criterion(name="test/iter_time", summary="mean", compare="<", margin=0.1), |
| 28 | + Criterion(name="export/iter_time", summary="mean", compare="<", margin=0.1), |
| 29 | + Criterion(name="optimize/iter_time", summary="mean", compare="<", margin=0.1), |
| 30 | + Criterion(name="optimize/e2e_time", summary="mean", compare="<", margin=0.1), |
| 31 | + Criterion(name="test(torch)/latency", summary="mean", compare="<", margin=0.1), |
| 32 | + Criterion(name="test(export)/latency", summary="mean", compare="<", margin=0.1), |
| 33 | + Criterion(name="test(optimize)/latency", summary="mean", compare="<", margin=0.1), |
| 34 | + Criterion(name="test(train)/e2e_time", summary="max", compare=">", margin=0.1), |
| 35 | + Criterion(name="test(export)/e2e_time", summary="max", compare=">", margin=0.1), |
| 36 | + Criterion(name="test(optimize)/e2e_time", summary="max", compare=">", margin=0.1), |
| 37 | +] |
| 38 | + |
| 39 | + |
18 | 40 | # ============= Multi-class classification ============= |
19 | 41 |
|
20 | 42 | MULTI_CLASS_MODEL_TEST_CASES = [ |
|
51 | 73 | ), |
52 | 74 | ] |
53 | 75 |
|
54 | | -# TODO (someone): Compare with DETECTION CRITERIA and fill in the missing values |
55 | | -MULTI_CLASS_BENCHMARK_CRITERIA = [ |
56 | | - Criterion(name="train/epoch", summary="max", compare="<", margin=0.1), |
57 | | - Criterion(name="train/e2e_time", summary="max", compare="<", margin=0.1), |
58 | | - Criterion(name="val/accuracy", summary="max", compare=">", margin=0.1), |
59 | | - Criterion(name="test/accuracy", summary="max", compare=">", margin=0.1), |
60 | | - Criterion(name="export/accuracy", summary="max", compare=">", margin=0.1), |
61 | | - Criterion(name="optimize/accuracy", summary="max", compare=">", margin=0.1), |
62 | | - Criterion(name="train/iter_time", summary="mean", compare="<", margin=0.1), |
63 | | - Criterion(name="test/iter_time", summary="mean", compare="<", margin=0.1), |
64 | | - Criterion(name="export/iter_time", summary="mean", compare="<", margin=0.1), |
65 | | - Criterion(name="optimize/iter_time", summary="mean", compare="<", margin=0.1), |
66 | | - Criterion(name="test(train)/e2e_time", summary="max", compare=">", margin=0.1), |
67 | | - Criterion(name="test(export)/e2e_time", summary="max", compare=">", margin=0.1), |
68 | | - Criterion(name="test(optimize)/e2e_time", summary="max", compare=">", margin=0.1), |
69 | | -] |
70 | | - |
71 | 76 |
|
72 | 77 | # ============= Multi-label classification ============= |
73 | 78 | MULTI_LABEL_MODEL_TEST_CASES = [ |
|
100 | 105 | ), |
101 | 106 | ] |
102 | 107 |
|
103 | | -# TODO (someone): Compare with DETECTION CRITERIA and fill in the missing values |
104 | | -MULTI_LABEL_BENCHMARK_CRITERIA = [ |
105 | | - Criterion(name="train/epoch", summary="max", compare="<", margin=0.1), |
106 | | - Criterion(name="train/e2e_time", summary="max", compare="<", margin=0.1), |
107 | | - Criterion(name="val/accuracy", summary="max", compare=">", margin=0.1), |
108 | | - Criterion(name="test/accuracy", summary="max", compare=">", margin=0.1), |
109 | | - Criterion(name="export/accuracy", summary="max", compare=">", margin=0.1), |
110 | | - Criterion(name="optimize/accuracy", summary="max", compare=">", margin=0.1), |
111 | | - Criterion(name="train/iter_time", summary="mean", compare="<", margin=0.1), |
112 | | - Criterion(name="test/iter_time", summary="mean", compare="<", margin=0.1), |
113 | | - Criterion(name="export/iter_time", summary="mean", compare="<", margin=0.1), |
114 | | - Criterion(name="optimize/iter_time", summary="mean", compare="<", margin=0.1), |
115 | | - Criterion(name="test(train)/e2e_time", summary="max", compare=">", margin=0.1), |
116 | | - Criterion(name="test(export)/e2e_time", summary="max", compare=">", margin=0.1), |
117 | | - Criterion(name="test(optimize)/e2e_time", summary="max", compare=">", margin=0.1), |
118 | | -] |
119 | | - |
120 | 108 |
|
121 | 109 | # ============= Hierarchical-label classification ============= |
122 | 110 |
|
|
150 | 138 | extra_overrides={}, |
151 | 139 | ), |
152 | 140 | ] |
153 | | - |
154 | | -# TODO (someone): Compare with DETECTION CRITERIA and fill in the missing values |
155 | | -H_LABEL_CLS_BENCHMARK_CRITERIA = [ |
156 | | - Criterion(name="train/epoch", summary="max", compare="<", margin=0.1), |
157 | | - Criterion(name="train/e2e_time", summary="max", compare="<", margin=0.1), |
158 | | - Criterion(name="val/accuracy", summary="max", compare=">", margin=0.1), |
159 | | - Criterion(name="test/accuracy", summary="max", compare=">", margin=0.1), |
160 | | - Criterion(name="export/accuracy", summary="max", compare=">", margin=0.1), |
161 | | - Criterion(name="optimize/accuracy", summary="max", compare=">", margin=0.1), |
162 | | - Criterion(name="train/iter_time", summary="mean", compare="<", margin=0.1), |
163 | | - Criterion(name="test/iter_time", summary="mean", compare="<", margin=0.1), |
164 | | - Criterion(name="export/iter_time", summary="mean", compare="<", margin=0.1), |
165 | | - Criterion(name="optimize/iter_time", summary="mean", compare="<", margin=0.1), |
166 | | - Criterion(name="test(train)/e2e_time", summary="max", compare=">", margin=0.1), |
167 | | - Criterion(name="test(export)/e2e_time", summary="max", compare=">", margin=0.1), |
168 | | - Criterion(name="test(optimize)/e2e_time", summary="max", compare=">", margin=0.1), |
169 | | -] |
0 commit comments