# xref: /aosp_15_r20/external/pytorch/benchmarks/dynamo/huggingface.yaml (revision da0073e96a02ea20f0ac840b70461e3646d07c45)
skip:
  all:
    # Difficult to set up an accuracy test because .eval() is not supported
    - Reformer
    # Fails deepcopy
    - BlenderbotForConditionalGeneration
    - GPTNeoForCausalLM
    - GPTNeoForSequenceClassification
    # Fails even with batch size = 1
    - GPTJForCausalLM
    - GPTJForQuestionAnswering

  device:
    cpu: []

  control_flow:
    - AllenaiLongformerBase

batch_size:
  # TODO - Fails even after fake tensors
  divisors:
    AlbertForMaskedLM: 2
    AlbertForQuestionAnswering: 2
    AllenaiLongformerBase: 2
    BartForCausalLM: 2
    BartForConditionalGeneration: 2
    BertForMaskedLM: 2
    BertForQuestionAnswering: 2
    BlenderbotForCausalLM: 8
    # BlenderbotForConditionalGeneration : 16
    BlenderbotSmallForCausalLM: 4
    BlenderbotSmallForConditionalGeneration: 2
    CamemBert: 2
    DebertaForMaskedLM: 4
    DebertaForQuestionAnswering: 2
    DebertaV2ForMaskedLM: 4
    DebertaV2ForQuestionAnswering: 8
    DistilBertForMaskedLM: 2
    DistilBertForQuestionAnswering: 2
    DistillGPT2: 2
    ElectraForCausalLM: 2
    ElectraForQuestionAnswering: 2
    GPT2ForSequenceClassification: 2
    # GPTJForCausalLM : 2
    # GPTJForQuestionAnswering : 2
    # GPTNeoForCausalLM : 32
    # GPTNeoForSequenceClassification : 2
    GoogleFnet: 2
    LayoutLMForMaskedLM: 2
    LayoutLMForSequenceClassification: 2
    M2M100ForConditionalGeneration: 4
    MBartForCausalLM: 2
    MBartForConditionalGeneration: 2
    MT5ForConditionalGeneration: 2
    MegatronBertForCausalLM: 4
    MegatronBertForQuestionAnswering: 2
    MobileBertForMaskedLM: 2
    MobileBertForQuestionAnswering: 2
    OPTForCausalLM: 2
    PLBartForCausalLM: 2
    PLBartForConditionalGeneration: 2
    PegasusForCausalLM: 4
    PegasusForConditionalGeneration: 2
    RobertaForCausalLM: 2
    RobertaForQuestionAnswering: 2
    Speech2Text2ForCausalLM: 4
    T5ForConditionalGeneration: 2
    T5Small: 2
    TrOCRForCausalLM: 2
    XGLMForCausalLM: 4
    XLNetLMHeadModel: 2
    YituTechConvBert: 2


tolerance:
  higher_training:
    - MT5ForConditionalGeneration
    # AlbertForQuestionAnswering fails in CI on GCP A100, but the error does not
    # seem harmful.
    - AlbertForQuestionAnswering

  higher_max_autotune_training:
    # DebertaForQuestionAnswering needs higher tolerance in Max-Autotune mode
    - DebertaForQuestionAnswering

  higher_inference:
    - GPT2ForSequenceClassification
    - RobertaForQuestionAnswering

  higher_inference_cpu:
    - LayoutLMForSequenceClassification

  cosine: []


accuracy:
  skip:
    large_models:
      # Models too large to have eager, dynamo and fp64_numbers simultaneously,
      # even on a 40 GB machine.
      - DebertaV2ForMaskedLM
      - BlenderbotForCausalLM

only_inference:
  # Fails with dynamo in train mode
  - M2M100ForConditionalGeneration

only_fp32:
  - GoogleFnet