Commit 779f899

[CI] Reset models list for CI benchmark tests (#2166)
1. Add the full huggingface models list file for nightly runs.
2. Add the full timm models list file for nightly runs.
3. Add the full torchbench models list file for nightly runs.
4. Remove the huggingface CamemBert model, since it was removed upstream in [pytorch/pytorch#164815](https://github.com/pytorch/pytorch/pull/164815/files#diff-004303ad6116d64ab2a8356469ccb11b32d8caca702e1ad65cc0538600a76d2dL170).
5. Add '--disable-cudagraphs' to reduce CUDA-specific impact on the XPU tests (see the invocation sketch further below).
6. Align the models lists with pytorch for the CI tests.

disable_build disable_ut disable_distributed
1 parent 0d2d924 commit 779f899
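The '--disable-cudagraphs' flag from item 5 is passed to the benchmark runner at launch time. Purely as a hedged illustration, the sketch below shows how a CI wrapper might append it when invoking the upstream pytorch dynamo benchmark entry point; the script path, device name, and every flag other than --disable-cudagraphs are assumptions about that CLI, not something shown in this commit.

```python
# Hedged sketch only: launching one model benchmark with cudagraphs disabled.
# The runner path, device, and all flags except --disable-cudagraphs are
# assumed from the upstream pytorch benchmarks/dynamo CLI, not this commit.
import subprocess

def run_benchmark(model: str, device: str = "xpu") -> int:
    cmd = [
        "python", "benchmarks/dynamo/huggingface.py",  # assumed runner entry point
        "--performance", "--inference",                # assumed mode flags
        "--backend=inductor",                          # assumed backend flag
        f"--only={model}",
        f"--devices={device}",
        "--disable-cudagraphs",                        # the flag added by this commit
    ]
    return subprocess.run(cmd, check=False).returncode

if __name__ == "__main__":
    raise SystemExit(run_benchmark("BertForMaskedLM"))
```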

16 files changed (+572 −85 lines)

.ci/benchmarks/huggingface.yaml

Lines changed: 104 additions & 0 deletions
@@ -0,0 +1,104 @@
skip:
  all:
    # Difficult to setup accuracy test because .eval() not supported
    - Reformer
    # Fails deepcopy
    - BlenderbotForConditionalGeneration
    - GPTNeoForCausalLM
    - GPTNeoForSequenceClassification
    # Fails with even batch size = 1
    - GPTJForCausalLM
    - GPTJForQuestionAnswering
    # Model too big
    - google/gemma-3-4b-it
    - openai/gpt-oss-20b
    - mistralai/Mistral-7B-Instruct-v0.3
    # Fails due to pytorch #164815 removed it
    - CamemBert

  device:
    cpu:
      - meta-llama/Llama-3.2-1B
      - google/gemma-2-2b
      - google/gemma-3-4b-it
      - openai/whisper-tiny
      - Qwen/Qwen3-0.6B
      - mistralai/Mistral-7B-Instruct-v0.3
      - openai/gpt-oss-20b

  control_flow:
    - AllenaiLongformerBase

batch_size:
  # TODO - Fails even after fake tensors
  divisors:
    AlbertForMaskedLM: 2
    AllenaiLongformerBase: 2
    BartForCausalLM: 2
    BertForMaskedLM: 2
    BlenderbotForCausalLM: 8
    # BlenderbotForConditionalGeneration : 16
    DebertaV2ForMaskedLM: 4
    DistilBertForMaskedLM: 2
    DistillGPT2: 2
    ElectraForCausalLM: 2
    GPT2ForSequenceClassification: 2
    # GPTJForCausalLM : 2
    # GPTJForQuestionAnswering : 2
    # GPTNeoForCausalLM : 32
    # GPTNeoForSequenceClassification : 2
    GoogleFnet: 2
    LayoutLMForMaskedLM: 2
    M2M100ForConditionalGeneration: 4
    MBartForCausalLM: 2
    MT5ForConditionalGeneration: 2
    MegatronBertForCausalLM: 4
    MobileBertForMaskedLM: 2
    OPTForCausalLM: 2
    PLBartForCausalLM: 2
    PegasusForCausalLM: 4
    RobertaForCausalLM: 2
    T5ForConditionalGeneration: 2
    T5Small: 2
    TrOCRForCausalLM: 2
    XGLMForCausalLM: 4
    XLNetLMHeadModel: 2
    YituTechConvBert: 2
    meta-llama/Llama-3.2-1B: 8
    google/gemma-2-2b: 8
    google/gemma-3-4b-it: 8
    openai/whisper-tiny: 8
    Qwen/Qwen3-0.6B: 8
    mistralai/Mistral-7B-Instruct-v0.3: 8
    openai/gpt-oss-20b: 8


tolerance:
  higher_training:
    - MT5ForConditionalGeneration

  higher_max_autotune_training: []

  higher_inference:
    - GPT2ForSequenceClassification

  higher_inference_cpu:
    - GPT2ForSequenceClassification

  cosine: []


accuracy:
  skip:
    large_models:
      # Models too large to have eager, dynamo and fp64_numbers simultaneously
      # even for 40 GB machine.
      - DebertaV2ForMaskedLM
      - BlenderbotForCausalLM

only_inference:
  # Fails with dynamo for train mode
  - M2M100ForConditionalGeneration

only_fp32:
  - GoogleFnet
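The huggingface.yaml file above is consumed as plain configuration. As a rough sketch, assuming PyYAML and hypothetical helper names, a runner could look up skips and batch-size divisors like this:

```python
# Minimal sketch, assuming PyYAML; helper names and the hard-coded path are
# illustrative, not part of this commit or of the actual runner code.
import yaml

def load_config(path: str = ".ci/benchmarks/huggingface.yaml") -> dict:
    with open(path) as f:
        return yaml.safe_load(f)

def is_skipped(cfg: dict, model: str, device: str = "cpu") -> bool:
    skip = cfg.get("skip", {})
    return model in skip.get("all", []) or model in skip.get("device", {}).get(device, [])

def batch_size_divisor(cfg: dict, model: str, default: int = 1) -> int:
    return cfg.get("batch_size", {}).get("divisors", {}).get(model, default)

cfg = load_config()
print(is_skipped(cfg, "Reformer"))                 # True: listed under skip.all
print(batch_size_divisor(cfg, "BertForMaskedLM"))  # 2, per the divisors table above
```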
Lines changed: 55 additions & 0 deletions
@@ -0,0 +1,55 @@
AlbertForMaskedLM,8
AlbertForQuestionAnswering,8
AllenaiLongformerBase,8
BartForCausalLM,8
BartForConditionalGeneration,4
BertForMaskedLM,32
BertForQuestionAnswering,32
BlenderbotForCausalLM,32
BlenderbotForConditionalGeneration,16
BlenderbotSmallForCausalLM,256
BlenderbotSmallForConditionalGeneration,128
CamemBert,32
DebertaV2ForMaskedLM,8
DebertaV2ForQuestionAnswering,8
DistilBertForMaskedLM,256
DistilBertForQuestionAnswering,512
DistillGPT2,32
ElectraForCausalLM,64
ElectraForQuestionAnswering,128
GPT2ForSequenceClassification,8
GPTJForCausalLM,1
GPTJForQuestionAnswering,1
GPTNeoForCausalLM,32
GPTNeoForSequenceClassification,32
GoogleFnet,32
LayoutLMForMaskedLM,32
LayoutLMForSequenceClassification,32
M2M100ForConditionalGeneration,64
MBartForCausalLM,8
MBartForConditionalGeneration,4
MT5ForConditionalGeneration,32
MegatronBertForCausalLM,16
MegatronBertForQuestionAnswering,16
MobileBertForMaskedLM,256
MobileBertForQuestionAnswering,256
OPTForCausalLM,4
PLBartForCausalLM,16
PLBartForConditionalGeneration,8
PegasusForCausalLM,128
PegasusForConditionalGeneration,64
RobertaForCausalLM,32
RobertaForQuestionAnswering,32
T5ForConditionalGeneration,8
T5Small,8
TrOCRForCausalLM,64
XGLMForCausalLM,32
XLNetLMHeadModel,16
YituTechConvBert,32
meta-llama/Llama-3.2-1B,8
google/gemma-2-2b,8
google/gemma-3-4b-it,8
openai/whisper-tiny,8
Qwen/Qwen3-0.6B,8
mistralai/Mistral-7B-Instruct-v0.3,8
openai/gpt-oss-20b,8
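The list above (its file name is not visible on this page) pairs each huggingface model with the batch size used for nightly runs, one "ModelName,batch_size" entry per line. A small parsing sketch, with a placeholder path:

```python
# Sketch: parse a "ModelName,batch_size" list such as the one above into a dict.
# The path argument is a placeholder; the real file name is not shown on this page.
from pathlib import Path

def parse_models_list(path: str) -> dict[str, int]:
    sizes: dict[str, int] = {}
    for line in Path(path).read_text().splitlines():
        line = line.strip()
        if not line or line.startswith("#"):
            continue
        name, batch = line.rsplit(",", 1)  # rsplit keeps names like "meta-llama/Llama-3.2-1B" intact
        sizes[name] = int(batch)
    return sizes

# With the list above, parse_models_list(...)["GPTJForCausalLM"] would be 1.
```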

.ci/benchmarks/timm_models.yaml

Lines changed: 13 additions & 0 deletions
@@ -0,0 +1,13 @@
# removing this file prevents the TimmRunner from dynamically skipping models
skip:
  all:
    - ~
  device:
    cpu:
      - ~
    # Skip these additional models when running on aarch64
    cpu_aarch64:
      # timeout on aarch64
      - dm_nfnet_f0
      - nfnet_l0
      - visformer_small
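In timm_models.yaml above, the "- ~" entries are YAML nulls: placeholders that keep the skip sections present without skipping any model, matching the header comment about the TimmRunner needing the file to exist. A hedged sketch of how such null placeholders could be filtered out at load time (the function name and the nesting of cpu_aarch64 under device are assumptions):

```python
# Hedged sketch: "~" entries load as None and are dropped, leaving only real
# model names. Function name is illustrative; nesting assumed as shown above.
import yaml

def load_timm_skips(path: str = ".ci/benchmarks/timm_models.yaml",
                    device: str = "cpu_aarch64") -> set[str]:
    with open(path) as f:
        cfg = yaml.safe_load(f)
    entries = cfg["skip"]["all"] + cfg["skip"]["device"].get(device, [])
    return {m for m in entries if m is not None}

print(load_timm_skips())  # {'dm_nfnet_f0', 'nfnet_l0', 'visformer_small'} on aarch64
```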
Lines changed: 61 additions & 0 deletions
@@ -0,0 +1,61 @@
adv_inception_v3 128
beit_base_patch16_224 128
botnet26t_256 128
cait_m36_384 4
coat_lite_mini 128
convit_base 128
convmixer_768_32 64
convnext_base 128
crossvit_9_240 256
cspdarknet53 128
deit_base_distilled_patch16_224 128
dla102 128
dm_nfnet_f0 128
dpn107 64
eca_botnext26ts_256 128
eca_halonext26ts 128
ese_vovnet19b_dw 256
fbnetc_100 512
fbnetv3_b 256
gernet_l 128
ghostnet_100 512
gluon_inception_v3 256
gmixer_24_224 128
gmlp_s16_224 128
hrnet_w18 128
inception_v3 128
jx_nest_base 128
lcnet_050 256
levit_128 1024
mixer_b16_224 128
mixnet_l 128
mnasnet_100 512
mobilenetv2_100 128
mobilenetv3_large_100 512
mobilevit_s 128
nfnet_l0 128
pit_b_224 64
pnasnet5large 32
poolformer_m36 128
regnety_002 1024
repvgg_a2 128
res2net101_26w_4s 128
res2net50_14w_8s 128
res2next50 128
resmlp_12_224 128
resnest101e 128
rexnet_100 256
sebotnet33ts_256 64
selecsls42b 128
spnasnet_100 128
swin_base_patch4_window7_224 128
swsl_resnext101_32x16d 64
tf_efficientnet_b0 128
tf_mixnet_l 128
tinynet_a 128
tnt_s_patch16_224 128
twins_pcpvt_base 128
visformer_small 128
vit_base_patch16_224 128
volo_d1_224 128
xcit_large_24_p8_224 16
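The list above gives one "model batch_size" pair per line for the timm suite. As a rough sketch, it can be combined with a skip set (such as the aarch64 skips from timm_models.yaml) to get the effective nightly model set; the helper name and path argument are placeholders, since the real file name for this list is not shown on this page:

```python
# Sketch: read whitespace-separated "model batch_size" pairs, dropping skipped models.
# Helper name and the path argument are placeholders, not taken from this commit.
def effective_models(list_path: str, skipped: set[str]) -> dict[str, int]:
    models: dict[str, int] = {}
    with open(list_path) as f:
        for line in f:
            parts = line.split()
            if len(parts) != 2:
                continue
            name, batch = parts
            if name not in skipped:
                models[name] = int(batch)
    return models

# With the 61 entries above and skipped = {"dm_nfnet_f0", "nfnet_l0", "visformer_small"},
# this keeps 58 models for the aarch64 CPU nightly run.
```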
