@@ -741,20 +741,18 @@ jobs:
741
741
id-token : write
742
742
contents : read
743
743
secrets : inherit
744
- # Models below selected based on https://huggingface.co/models?pipeline_tag=text-generation&num_parameters=min:0,max:3B&sort=trending.
745
- xnnpack : &xnnpack
746
- - llama3.2-1b|xnnpack|--quantize
747
- - qwen3-0.6b|xnnpack|--quantize
748
- - qwen3-1.7b|xnnpack|--quantize
749
- - gemma3-1b|xnnpack|--quantize
750
- - phi-4-mini|xnnpack|--quantize
751
- - smollm2-135m|xnnpack|--quantize
752
- - smollm3-3b|xnnpack|--quantize
753
744
strategy :
754
745
matrix :
755
- config :
756
- - *xnnpack
757
- - *coreml
746
+ config : [
747
+ # XNNPack.
748
+ llama3.2-1b|xnnpack|--quantize,
749
+ qwen3-0.6b|xnnpack|--quantize,
750
+ qwen3-1.7b|xnnpack|--quantize,
751
+ gemma3-1b|xnnpack|--quantize,
752
+ phi-4-mini|xnnpack|--quantize,
753
+ smollm2-135m|xnnpack|--quantize,
754
+ smollm3-3b|xnnpack|--quantize
755
+ ]
758
756
fail-fast : false
759
757
with :
760
758
secrets-env : EXECUTORCH_HF_TOKEN
@@ -834,28 +832,26 @@ jobs:
834
832
contents : read
835
833
secrets : inherit
836
834
# Models below selected based on https://huggingface.co/models?pipeline_tag=text-generation&num_parameters=min:0,max:3B&sort=trending.
837
- xnnpack : &xnnpack
838
- - llama3.2-1b|xnnpack|--quantize
839
- - qwen3-0.6b|xnnpack|--quantize
840
- - qwen3-1.7b|xnnpack|--quantize
841
- - gemma3-1b|xnnpack|--quantize
842
- - phi-4-mini|xnnpack|--quantize
843
- - smollm2-135m|xnnpack|--quantize
844
- - smollm3-3b|xnnpack|--quantize
845
- coreml : &coreml
846
- - llama3.2-1b|coreml_fp32_gpu|--quantize,
847
- - qwen3-0.6b|coreml_fp32_gpu|--quantize,
848
- - qwen3-0.6b|coreml_fp32_gpu|--quantize,
849
- - smollm2-135m|coreml_fp32_gpu|--quantize,
850
- - olmo-1b|coreml_fp32_gpu|--quantize,
851
- # - roberta|coreml_fp32_gpu|--quantize, roberta requires special HF access
852
- - bert|coreml_fp32_gpu|--quantize,
853
- - distilbert|coreml_fp32_gpu|--quantize,
854
835
strategy :
855
836
matrix :
856
- config :
857
- - *xnnpack
858
- - *coreml
837
+ config : [
838
+ # XNNPack.
839
+ llama3.2-1b|xnnpack|--quantize,
840
+ qwen3-0.6b|xnnpack|--quantize,
841
+ qwen3-1.7b|xnnpack|--quantize,
842
+ gemma3-1b|xnnpack|--quantize,
843
+ phi-4-mini|xnnpack|--quantize,
844
+ smollm2-135m|xnnpack|--quantize,
845
+ smollm3-3b|xnnpack|--quantize,
846
+ # CoreML: every entry in this section uses the coreml_fp32_gpu recipe.
847
+ llama3.2-1b|coreml_fp32_gpu|--quantize,
848
+ qwen3-0.6b|coreml_fp32_gpu|--quantize,
849
+ qwen3-1.7b|coreml_fp32_gpu|--quantize,
850
+ smollm2-135m|coreml_fp32_gpu|--quantize,
851
+ olmo-1b|coreml_fp32_gpu|--quantize,
852
+ bert|coreml_fp32_gpu|--quantize,
853
+ distilbert|coreml_fp32_gpu|--quantize
854
+ ]
859
855
fail-fast : false
860
856
with :
861
857
secrets-env : EXECUTORCH_HF_TOKEN
0 commit comments