xref: /aosp_15_r20/external/pytorch/benchmarks/dynamo/torchbench.yaml (revision da0073e96a02ea20f0ac840b70461e3646d07c45)
1*da0073e9SAndroid Build Coastguard Worker# Some models have large datasets that don't fit in memory. Lower the batch
2*da0073e9SAndroid Build Coastguard Worker# size to test the accuracy.
3*da0073e9SAndroid Build Coastguard Workerbatch_size:
4*da0073e9SAndroid Build Coastguard Worker  training:
5*da0073e9SAndroid Build Coastguard Worker    demucs: 4
6*da0073e9SAndroid Build Coastguard Worker    dlrm: 1024
7*da0073e9SAndroid Build Coastguard Worker    densenet121: 4
8*da0073e9SAndroid Build Coastguard Worker    hf_Reformer: 4
9*da0073e9SAndroid Build Coastguard Worker    hf_T5_base: 4
10*da0073e9SAndroid Build Coastguard Worker    timm_efficientdet: 1
11*da0073e9SAndroid Build Coastguard Worker    llama_v2_7b_16h: 1
12*da0073e9SAndroid Build Coastguard Worker    # reduced from 16 due to cudagraphs OOM in TorchInductor dashboard
13*da0073e9SAndroid Build Coastguard Worker    yolov3: 8
14*da0073e9SAndroid Build Coastguard Worker
15*da0073e9SAndroid Build Coastguard Worker  inference:
16*da0073e9SAndroid Build Coastguard Worker    timm_efficientdet: 32
17*da0073e9SAndroid Build Coastguard Worker
18*da0073e9SAndroid Build Coastguard Worker
19*da0073e9SAndroid Build Coastguard Workerdont_change_batch_size:
20*da0073e9SAndroid Build Coastguard Worker  - demucs
21*da0073e9SAndroid Build Coastguard Worker  - pytorch_struct
22*da0073e9SAndroid Build Coastguard Worker  - pyhpc_turbulent_kinetic_energy
23*da0073e9SAndroid Build Coastguard Worker  # https://github.com/pytorch/benchmark/pull/1656
24*da0073e9SAndroid Build Coastguard Worker  - vision_maskrcnn
25*da0073e9SAndroid Build Coastguard Worker
26*da0073e9SAndroid Build Coastguard Worker
27*da0073e9SAndroid Build Coastguard Workertolerance:
28*da0073e9SAndroid Build Coastguard Worker  # Need higher tolerance on GPU. GPU kernels are non-deterministic for these models.
29*da0073e9SAndroid Build Coastguard Worker  higher:
30*da0073e9SAndroid Build Coastguard Worker    - alexnet
31*da0073e9SAndroid Build Coastguard Worker    - attention_is_all_you_need_pytorch
32*da0073e9SAndroid Build Coastguard Worker    - densenet121
33*da0073e9SAndroid Build Coastguard Worker    - hf_Albert
34*da0073e9SAndroid Build Coastguard Worker    - vgg16
35*da0073e9SAndroid Build Coastguard Worker    - mobilenet_v3_large
36*da0073e9SAndroid Build Coastguard Worker    - nvidia_deeprecommender
37*da0073e9SAndroid Build Coastguard Worker    - timm_efficientdet
38*da0073e9SAndroid Build Coastguard Worker
39*da0073e9SAndroid Build Coastguard Worker  # These models need >1e-3 tolerance
40*da0073e9SAndroid Build Coastguard Worker  even_higher:
41*da0073e9SAndroid Build Coastguard Worker    - soft_actor_critic
42*da0073e9SAndroid Build Coastguard Worker    - tacotron2
43*da0073e9SAndroid Build Coastguard Worker    - yolov3
44*da0073e9SAndroid Build Coastguard Worker    - timm_efficientdet
45*da0073e9SAndroid Build Coastguard Worker    - squeezenet1_1
46*da0073e9SAndroid Build Coastguard Worker
47*da0073e9SAndroid Build Coastguard Worker  higher_fp16:
48*da0073e9SAndroid Build Coastguard Worker    - doctr_reco_predictor
49*da0073e9SAndroid Build Coastguard Worker    - drq
50*da0073e9SAndroid Build Coastguard Worker    - hf_Whisper
51*da0073e9SAndroid Build Coastguard Worker
52*da0073e9SAndroid Build Coastguard Worker  higher_bf16:
53*da0073e9SAndroid Build Coastguard Worker    - doctr_reco_predictor
54*da0073e9SAndroid Build Coastguard Worker    - drq
55*da0073e9SAndroid Build Coastguard Worker    - hf_Whisper
56*da0073e9SAndroid Build Coastguard Worker
57*da0073e9SAndroid Build Coastguard Worker  cosine: []
58*da0073e9SAndroid Build Coastguard Worker
59*da0073e9SAndroid Build Coastguard Workerrequire_larger_multiplier_for_smaller_tensor:
60*da0073e9SAndroid Build Coastguard Worker  - yolov3
61*da0073e9SAndroid Build Coastguard Worker
62*da0073e9SAndroid Build Coastguard Worker# These benchmarks took >600s on an i9-11900K CPU
63*da0073e9SAndroid Build Coastguard Workervery_slow: &VERY_SLOW_MODELS
64*da0073e9SAndroid Build Coastguard Worker  # 3339s
65*da0073e9SAndroid Build Coastguard Worker  - hf_BigBird
66*da0073e9SAndroid Build Coastguard Worker  # 3062s
67*da0073e9SAndroid Build Coastguard Worker  - hf_Longformer
68*da0073e9SAndroid Build Coastguard Worker  # 930s
69*da0073e9SAndroid Build Coastguard Worker  - hf_T5
70*da0073e9SAndroid Build Coastguard Worker
71*da0073e9SAndroid Build Coastguard Worker
72*da0073e9SAndroid Build Coastguard Worker# These benchmarks took >60s on an i9-11900K CPU
73*da0073e9SAndroid Build Coastguard Workerslow:
74*da0073e9SAndroid Build Coastguard Worker  - *VERY_SLOW_MODELS
75*da0073e9SAndroid Build Coastguard Worker  # 137s
76*da0073e9SAndroid Build Coastguard Worker  - BERT_pytorch
77*da0073e9SAndroid Build Coastguard Worker  # 116s
78*da0073e9SAndroid Build Coastguard Worker  - demucs
79*da0073e9SAndroid Build Coastguard Worker  # 242s
80*da0073e9SAndroid Build Coastguard Worker  - fastNLP_Bert
81*da0073e9SAndroid Build Coastguard Worker  # 221s
82*da0073e9SAndroid Build Coastguard Worker  - hf_Albert
83*da0073e9SAndroid Build Coastguard Worker  # 400s
84*da0073e9SAndroid Build Coastguard Worker  - hf_Bart
85*da0073e9SAndroid Build Coastguard Worker  # 334s
86*da0073e9SAndroid Build Coastguard Worker  - hf_Bert
87*da0073e9SAndroid Build Coastguard Worker  # 187s
88*da0073e9SAndroid Build Coastguard Worker  - hf_DistilBert
89*da0073e9SAndroid Build Coastguard Worker  # 470s
90*da0073e9SAndroid Build Coastguard Worker  - hf_GPT2
91*da0073e9SAndroid Build Coastguard Worker  # 141s
92*da0073e9SAndroid Build Coastguard Worker  - hf_Reformer
93*da0073e9SAndroid Build Coastguard Worker  # 317s
94*da0073e9SAndroid Build Coastguard Worker  - speech_transformer
95*da0073e9SAndroid Build Coastguard Worker  # 99s
96*da0073e9SAndroid Build Coastguard Worker  - vision_maskrcnn
97*da0073e9SAndroid Build Coastguard Worker
98*da0073e9SAndroid Build Coastguard Worker
99*da0073e9SAndroid Build Coastguard Workernon_deterministic:
100*da0073e9SAndroid Build Coastguard Worker  # https://github.com/pytorch/pytorch/issues/98355
101*da0073e9SAndroid Build Coastguard Worker  - mobilenet_v3_large
102*da0073e9SAndroid Build Coastguard Worker  - sam_fast
103*da0073e9SAndroid Build Coastguard Worker
104*da0073e9SAndroid Build Coastguard Worker
105*da0073e9SAndroid Build Coastguard Workerdtype:
106*da0073e9SAndroid Build Coastguard Worker  force_amp_for_fp16_bf16_models:
107*da0073e9SAndroid Build Coastguard Worker    - DALLE2_pytorch
108*da0073e9SAndroid Build Coastguard Worker    - doctr_det_predictor
109*da0073e9SAndroid Build Coastguard Worker    - doctr_reco_predictor
110*da0073e9SAndroid Build Coastguard Worker    - Super_SloMo
111*da0073e9SAndroid Build Coastguard Worker    - tts_angular
112*da0073e9SAndroid Build Coastguard Worker    - pyhpc_turbulent_kinetic_energy
113*da0073e9SAndroid Build Coastguard Worker    - detectron2_fcos_r_50_fpn
114*da0073e9SAndroid Build Coastguard Worker
115*da0073e9SAndroid Build Coastguard Worker  force_fp16_for_bf16_models:
116*da0073e9SAndroid Build Coastguard Worker    - vision_maskrcnn
117*da0073e9SAndroid Build Coastguard Worker
118*da0073e9SAndroid Build Coastguard Worker
119*da0073e9SAndroid Build Coastguard Worker# models in canary_models that we should run anyway
120*da0073e9SAndroid Build Coastguard Workercanary_models:
121*da0073e9SAndroid Build Coastguard Worker  - torchrec_dlrm
122*da0073e9SAndroid Build Coastguard Worker
123*da0073e9SAndroid Build Coastguard Worker
124*da0073e9SAndroid Build Coastguard Workerdetectron2_models: &DETECTRON2_MODELS
125*da0073e9SAndroid Build Coastguard Worker  - detectron2_fasterrcnn_r_101_c4
126*da0073e9SAndroid Build Coastguard Worker  - detectron2_fasterrcnn_r_101_dc5
127*da0073e9SAndroid Build Coastguard Worker  - detectron2_fasterrcnn_r_101_fpn
128*da0073e9SAndroid Build Coastguard Worker  - detectron2_fasterrcnn_r_50_c4
129*da0073e9SAndroid Build Coastguard Worker  - detectron2_fasterrcnn_r_50_dc5
130*da0073e9SAndroid Build Coastguard Worker  - detectron2_fasterrcnn_r_50_fpn
131*da0073e9SAndroid Build Coastguard Worker  - detectron2_maskrcnn_r_101_c4
132*da0073e9SAndroid Build Coastguard Worker  - detectron2_maskrcnn_r_101_fpn
133*da0073e9SAndroid Build Coastguard Worker  - detectron2_maskrcnn_r_50_fpn
134*da0073e9SAndroid Build Coastguard Worker
135*da0073e9SAndroid Build Coastguard Worker
136*da0073e9SAndroid Build Coastguard Worker# These models support only train mode. So accuracy checking can't be done in
137*da0073e9SAndroid Build Coastguard Worker# eval mode.
138*da0073e9SAndroid Build Coastguard Workeronly_training:
139*da0073e9SAndroid Build Coastguard Worker  - *DETECTRON2_MODELS
140*da0073e9SAndroid Build Coastguard Worker  - tts_angular
141*da0073e9SAndroid Build Coastguard Worker  - tacotron2
142*da0073e9SAndroid Build Coastguard Worker  - demucs
143*da0073e9SAndroid Build Coastguard Worker  - hf_Reformer
144*da0073e9SAndroid Build Coastguard Worker  - pytorch_struct
145*da0073e9SAndroid Build Coastguard Worker  - yolov3
146*da0073e9SAndroid Build Coastguard Worker
147*da0073e9SAndroid Build Coastguard Worker
148*da0073e9SAndroid Build Coastguard Workertrt_not_yet_working:
149*da0073e9SAndroid Build Coastguard Worker  - alexnet
150*da0073e9SAndroid Build Coastguard Worker  - resnet18
151*da0073e9SAndroid Build Coastguard Worker  - resnet50
152*da0073e9SAndroid Build Coastguard Worker  - mobilenet_v2
153*da0073e9SAndroid Build Coastguard Worker  - mnasnet1_0
154*da0073e9SAndroid Build Coastguard Worker  - squeezenet1_1
155*da0073e9SAndroid Build Coastguard Worker  - shufflenetv2_x1_0
156*da0073e9SAndroid Build Coastguard Worker  - vgg16
157*da0073e9SAndroid Build Coastguard Worker  - resnext50_32x4d
158*da0073e9SAndroid Build Coastguard Worker
159*da0073e9SAndroid Build Coastguard Worker
160*da0073e9SAndroid Build Coastguard Workerskip:
161*da0073e9SAndroid Build Coastguard Worker  all:
162*da0073e9SAndroid Build Coastguard Worker    # OOMs (A100 40G)
163*da0073e9SAndroid Build Coastguard Worker    - detectron2_maskrcnn
164*da0073e9SAndroid Build Coastguard Worker    # TIMEOUT, https://github.com/pytorch/pytorch/issues/98467
165*da0073e9SAndroid Build Coastguard Worker    - tacotron2
166*da0073e9SAndroid Build Coastguard Worker    # Failing in eager mode
167*da0073e9SAndroid Build Coastguard Worker    - hf_clip
168*da0073e9SAndroid Build Coastguard Worker    # multi gpu not always available in benchmark runners
169*da0073e9SAndroid Build Coastguard Worker    - simple_gpt_tp_manual
170*da0073e9SAndroid Build Coastguard Worker
171*da0073e9SAndroid Build Coastguard Worker  device:
172*da0073e9SAndroid Build Coastguard Worker    cpu:
173*da0073e9SAndroid Build Coastguard Worker      # OOMs
174*da0073e9SAndroid Build Coastguard Worker      - hf_T5_generate
175*da0073e9SAndroid Build Coastguard Worker      # model is CUDA only
176*da0073e9SAndroid Build Coastguard Worker      - cm3leon_generate
177*da0073e9SAndroid Build Coastguard Worker      # timeout
178*da0073e9SAndroid Build Coastguard Worker      - nanogpt
179*da0073e9SAndroid Build Coastguard Worker      # timeout
180*da0073e9SAndroid Build Coastguard Worker      - sam
181*da0073e9SAndroid Build Coastguard Worker      # model is CUDA only
182*da0073e9SAndroid Build Coastguard Worker      - sam_fast
183*da0073e9SAndroid Build Coastguard Worker      # model is CUDA only
184*da0073e9SAndroid Build Coastguard Worker      - llama_v2_7b_16h
185*da0073e9SAndroid Build Coastguard Worker      # flaky
186*da0073e9SAndroid Build Coastguard Worker      - stable_diffusion
187*da0073e9SAndroid Build Coastguard Worker      # requires FBGEMM, CUDA only
188*da0073e9SAndroid Build Coastguard Worker      - torchrec_dlrm
189*da0073e9SAndroid Build Coastguard Worker      - simple_gpt
190*da0073e9SAndroid Build Coastguard Worker      # works on cuda, accuracy failure on cpu
191*da0073e9SAndroid Build Coastguard Worker      - hf_Whisper
192*da0073e9SAndroid Build Coastguard Worker      - stable_diffusion_text_encoder
193*da0073e9SAndroid Build Coastguard Worker      - llava
194*da0073e9SAndroid Build Coastguard Worker      - moco
195*da0073e9SAndroid Build Coastguard Worker
196*da0073e9SAndroid Build Coastguard Worker    cuda: []
197*da0073e9SAndroid Build Coastguard Worker
198*da0073e9SAndroid Build Coastguard Worker  test:
199*da0073e9SAndroid Build Coastguard Worker    training:
200*da0073e9SAndroid Build Coastguard Worker      - *DETECTRON2_MODELS
201*da0073e9SAndroid Build Coastguard Worker      # not designed for training
202*da0073e9SAndroid Build Coastguard Worker      - pyhpc_equation_of_state
203*da0073e9SAndroid Build Coastguard Worker      - pyhpc_isoneutral_mixing
204*da0073e9SAndroid Build Coastguard Worker      - pyhpc_turbulent_kinetic_energy
205*da0073e9SAndroid Build Coastguard Worker      - maml
206*da0073e9SAndroid Build Coastguard Worker      - llama
207*da0073e9SAndroid Build Coastguard Worker      - llama_v2_7b_16h
208*da0073e9SAndroid Build Coastguard Worker      - simple_gpt
209*da0073e9SAndroid Build Coastguard Worker      - sam_fast
210*da0073e9SAndroid Build Coastguard Worker      # Model's DEFAULT_TRAIN_BSIZE is not implemented
211*da0073e9SAndroid Build Coastguard Worker      - cm3leon_generate
212*da0073e9SAndroid Build Coastguard Worker      - hf_T5_generate
213*da0073e9SAndroid Build Coastguard Worker      - doctr_det_predictor
214*da0073e9SAndroid Build Coastguard Worker      - doctr_reco_predictor
215*da0073e9SAndroid Build Coastguard Worker      - moondream
216*da0073e9SAndroid Build Coastguard Worker      # doesn't fit in memory
217*da0073e9SAndroid Build Coastguard Worker      - phi_1_5
218*da0073e9SAndroid Build Coastguard Worker      - detectron2_fcos_r_50_fpn
219*da0073e9SAndroid Build Coastguard Worker
220*da0073e9SAndroid Build Coastguard Worker  control_flow:
221*da0073e9SAndroid Build Coastguard Worker    - cm3leon_generate
222*da0073e9SAndroid Build Coastguard Worker    - detectron2_fcos_r_50_fpn
223*da0073e9SAndroid Build Coastguard Worker    - fastNLP_Bert
224*da0073e9SAndroid Build Coastguard Worker    - hf_Longformer
225*da0073e9SAndroid Build Coastguard Worker    - hf_Reformer
226*da0073e9SAndroid Build Coastguard Worker    - hf_T5_generate
227*da0073e9SAndroid Build Coastguard Worker    - opacus_cifar10
228*da0073e9SAndroid Build Coastguard Worker    - speech_transformer
229*da0073e9SAndroid Build Coastguard Worker
230*da0073e9SAndroid Build Coastguard Worker  # Models that should only run in --multiprocess mode
231*da0073e9SAndroid Build Coastguard Worker  multiprocess:
232*da0073e9SAndroid Build Coastguard Worker    - simple_gpt
233*da0073e9SAndroid Build Coastguard Worker
234*da0073e9SAndroid Build Coastguard Worker  # for these models, conv-batchnorm fusing causes big numerical churn.
235*da0073e9SAndroid Build Coastguard Worker  # Skip them
236*da0073e9SAndroid Build Coastguard Worker  # mnasnet1_0 and shufflenet_v2_x1_0 can pass on cpu, moco cuda only.
237*da0073e9SAndroid Build Coastguard Worker  freezing:
238*da0073e9SAndroid Build Coastguard Worker    cuda:
239*da0073e9SAndroid Build Coastguard Worker      - mnasnet1_0
240*da0073e9SAndroid Build Coastguard Worker      - moco
241*da0073e9SAndroid Build Coastguard Worker      - shufflenet_v2_x1_0
242*da0073e9SAndroid Build Coastguard Worker    cpu: []
243*da0073e9SAndroid Build Coastguard Worker
244*da0073e9SAndroid Build Coastguard Worker
245*da0073e9SAndroid Build Coastguard Worker
246*da0073e9SAndroid Build Coastguard Worker
247*da0073e9SAndroid Build Coastguard Workeraccuracy:
248*da0073e9SAndroid Build Coastguard Worker  skip:
249*da0073e9SAndroid Build Coastguard Worker    large_models:
250*da0073e9SAndroid Build Coastguard Worker      # Models too large to have eager, dynamo and fp64_numbers simultaneously
251*da0073e9SAndroid Build Coastguard Worker      # even on a 40 GB machine. We have tested accuracy for smaller versions of
252*da0073e9SAndroid Build Coastguard Worker      # these models
253*da0073e9SAndroid Build Coastguard Worker      - hf_GPT2_large
254*da0073e9SAndroid Build Coastguard Worker      - hf_T5_large
255*da0073e9SAndroid Build Coastguard Worker      - timm_vision_transformer_large
256*da0073e9SAndroid Build Coastguard Worker      # accuracy https://github.com/pytorch/pytorch/issues/93847
257*da0073e9SAndroid Build Coastguard Worker      - maml
258*da0073e9SAndroid Build Coastguard Worker      - llama_v2_7b_16h
259*da0073e9SAndroid Build Coastguard Worker      - Background_Matting
260*da0073e9SAndroid Build Coastguard Worker      - stable_diffusion_unet
261*da0073e9SAndroid Build Coastguard Worker    eager_not_deterministic:
262*da0073e9SAndroid Build Coastguard Worker      # Models for which deterministic algorithms cannot be turned on in eager mode.
263*da0073e9SAndroid Build Coastguard Worker      - Background_Matting
264*da0073e9SAndroid Build Coastguard Worker      - pytorch_unet
265*da0073e9SAndroid Build Coastguard Worker
266*da0073e9SAndroid Build Coastguard Worker  max_batch_size:
267*da0073e9SAndroid Build Coastguard Worker    hf_GPT2: 2
268*da0073e9SAndroid Build Coastguard Worker    pytorch_unet: 2
269