-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathunet_1_77_512_512_fp16_stable-diffusion-v1-4_vulkan_rdna3_configs.json
14 lines (14 loc) · 4.64 KB
/
unet_1_77_512_512_fp16_stable-diffusion-v1-4_vulkan_rdna3_configs.json
1
2
3
4
5
6
7
8
9
10
11
12
13
14
{"options": [{"work_group_tile_sizes": [1, 32, 64], "parallel_tile_sizes": [1, 32, 32], "reduction_tile_sizes": [0, 0, 0, 32], "work_group_sizes": [64, 1, 1], "pipeline": "SPIRVCooperativeMatrixVectorize", "subgroup_size": 32, "vector_tile_sizes": [1, 16, 16, 16], "pipeline_depth": 0, "store_stage": 0}], "identifier": "bmm", "b": 36, "m": 128, "n": 640, "k": 960}
{"options": [{"work_group_tile_sizes": [1, 32, 64], "parallel_tile_sizes": [1, 32, 32], "reduction_tile_sizes": [0, 0, 0, 64], "work_group_sizes": [64, 1, 1], "pipeline": "SPIRVCooperativeMatrixVectorize", "subgroup_size": 32, "vector_tile_sizes": [1, 16, 16, 16], "pipeline_depth": 0, "store_stage": 0}], "identifier": "generic", "b": 2, "m": 640, "n": 1024, "k": 960}
{"options": [{"work_group_tile_sizes": [1, 64, 64], "parallel_tile_sizes": [1, 32, 64], "reduction_tile_sizes": [0, 0, 0, 32], "work_group_sizes": [32, 2, 1], "pipeline": "SPIRVCooperativeMatrixVectorize", "subgroup_size": 32, "vector_tile_sizes": [1, 16, 16, 16], "pipeline_depth": 0, "store_stage": 0}], "identifier": "bmm", "b": 36, "m": 512, "n": 640, "k": 640}
{"options": [{"work_group_tile_sizes": [1, 64, 64], "parallel_tile_sizes": [1, 32, 32], "reduction_tile_sizes": [0, 0, 0, 32], "work_group_sizes": [64, 2, 1], "pipeline": "SPIRVCooperativeMatrixVectorize", "subgroup_size": 32, "vector_tile_sizes": [1, 16, 16, 16], "pipeline_depth": 0, "store_stage": 0}], "identifier": "bmm", "b": 36, "m": 512, "n": 320, "k": 960}
{"options": [{"work_group_tile_sizes": [1, 64, 32], "parallel_tile_sizes": [1, 32, 32], "reduction_tile_sizes": [0, 0, 0, 32], "work_group_sizes": [32, 2, 1], "pipeline": "SPIRVCooperativeMatrixVectorize", "subgroup_size": 32, "vector_tile_sizes": [1, 16, 16, 16], "pipeline_depth": 0, "store_stage": 0}], "identifier": "generic", "b": 2, "m": 320, "n": 4096, "k": 960}
{"options": [{"work_group_tile_sizes": [1, 64, 64], "parallel_tile_sizes": [1, 32, 32], "reduction_tile_sizes": [0, 0, 0, 64], "work_group_sizes": [64, 2, 1], "pipeline": "SPIRVCooperativeMatrixVectorize", "subgroup_size": 32, "vector_tile_sizes": [1, 16, 16, 16], "pipeline_depth": 0, "store_stage": 0}], "identifier": "bmm", "b": 36, "m": 512, "n": 320, "k": 640}
{"options": [{"work_group_tile_sizes": [1, 64, 64], "parallel_tile_sizes": [1, 32, 32], "reduction_tile_sizes": [0, 0, 0, 64], "work_group_sizes": [64, 2, 1], "pipeline": "SPIRVCooperativeMatrixVectorize", "subgroup_size": 32, "vector_tile_sizes": [1, 16, 16, 16], "pipeline_depth": 0, "store_stage": 0}], "identifier": "generic", "b": 2, "m": 320, "n": 4096, "k": 640}
{"options": [{"work_group_tile_sizes": [1, 32, 64], "parallel_tile_sizes": [1, 2, 4], "reduction_tile_sizes": [0, 0, 0, 4], "work_group_sizes": [16, 16, 1], "pipeline": "SPIRVMatmulPromoteVectorize", "subgroup_size": 64, "pipeline_depth": 1, "store_stage": 0}], "identifier": "generic", "b": 2, "m": 320, "n": 4096, "k": 36}
{"options": [{"work_group_tile_sizes": [1, 4, 64], "parallel_tile_sizes": [1, 1, 4], "reduction_tile_sizes": [0, 0, 0, 4], "work_group_sizes": [16, 4, 1], "pipeline": "SPIRVMatmulPromoteVectorize", "subgroup_size": 64, "pipeline_depth": 1, "store_stage": 0}], "identifier": "generic", "b": 2, "m": 4, "n": 4096, "k": 2880}
{"options": [null], "identifier": "matmul", "b": 0, "m": 2, "n": 640, "k": 1280}
{"options": [{"work_group_tile_sizes": [32, 64], "parallel_tile_sizes": [32, 32], "reduction_tile_sizes": [0, 0, 64], "work_group_sizes": [64, 1, 1], "pipeline": "SPIRVCooperativeMatrixVectorize", "subgroup_size": 32, "vector_tile_sizes": [16, 16, 16], "pipeline_depth": 0, "store_stage": 0}], "identifier": "matmul", "b": 0, "m": 2048, "n": 640, "k": 640}
{"options": [{"work_group_tile_sizes": [1, 32, 64], "parallel_tile_sizes": [1, 32, 32], "reduction_tile_sizes": [0, 0, 0, 64], "work_group_sizes": [64, 1, 1], "pipeline": "SPIRVCooperativeMatrixVectorize", "subgroup_size": 32, "vector_tile_sizes": [1, 16, 16, 16], "pipeline_depth": 0, "store_stage": 0}], "identifier": "generic", "b": 2, "m": 320, "n": 1024, "k": 2880}
{"options": [{"work_group_tile_sizes": [1, 64, 64], "parallel_tile_sizes": [1, 32, 32], "reduction_tile_sizes": [0, 0, 0, 64], "work_group_sizes": [64, 2, 1], "pipeline": "SPIRVCooperativeMatrixVectorize", "subgroup_size": 32, "vector_tile_sizes": [1, 16, 16, 16], "pipeline_depth": 0, "store_stage": 0}], "identifier": "bmm", "b": 36, "m": 128, "n": 640, "k": 320}
{"options": [{"work_group_tile_sizes": [16, 32], "parallel_tile_sizes": [16, 16], "reduction_tile_sizes": [0, 0, 64], "work_group_sizes": [64, 1, 1], "pipeline": "SPIRVCooperativeMatrixVectorize", "subgroup_size": 32, "vector_tile_sizes": [16, 16, 16], "pipeline_depth": 1, "store_stage": 0}], "identifier": "matmul", "b": 0, "m": 32, "n": 640, "k": 1280}