{
  "Qwen/Qwen2.5-7B-Instruct": [
    {
      "batch_size": 1,
      "sequence_length": 4096,
      "num_cores": 2,
      "auto_cast_type": "bf16"
    },
    {
      "batch_size": 4,
      "sequence_length": 4096,
      "num_cores": 2,
      "auto_cast_type": "bf16"
    },
    {
      "batch_size": 8,
      "sequence_length": 4096,
      "num_cores": 2,
      "auto_cast_type": "bf16"
    },
    {
      "batch_size": 1,
      "sequence_length": 4096,
      "num_cores": 8,
      "auto_cast_type": "bf16"
    },
    {
      "batch_size": 32,
      "sequence_length": 4096,
      "num_cores": 8,
      "auto_cast_type": "bf16"
    }
  ],
  "deepseek-ai/DeepSeek-R1-Distill-Qwen-7B": [
    {
      "batch_size": 1,
      "sequence_length": 4096,
      "num_cores": 2,
      "auto_cast_type": "bf16"
    },
    {
      "batch_size": 4,
      "sequence_length": 4096,
      "num_cores": 2,
      "auto_cast_type": "bf16"
    },
    {
      "batch_size": 8,
      "sequence_length": 4096,
      "num_cores": 2,
      "auto_cast_type": "bf16"
    },
    {
      "batch_size": 1,
      "sequence_length": 4096,
      "num_cores": 8,
      "auto_cast_type": "bf16"
    },
    {
      "batch_size": 32,
      "sequence_length": 4096,
      "num_cores": 8,
      "auto_cast_type": "bf16"
    }
  ],
  "Qwen/Qwen2.5-0.5B": [
    {
      "batch_size": 1,
      "sequence_length": 4096,
      "num_cores": 2,
      "auto_cast_type": "bf16"
    },
    {
      "batch_size": 4,
      "sequence_length": 4096,
      "num_cores": 2,
      "auto_cast_type": "bf16"
    }
  ],
  "Qwen/Qwen2.5-1.5B": [
    {
      "batch_size": 1,
      "sequence_length": 4096,
      "num_cores": 2,
      "auto_cast_type": "bf16"
    },
    {
      "batch_size": 4,
      "sequence_length": 4096,
      "num_cores": 2,
      "auto_cast_type": "bf16"
    }
  ],
  "deepseek-ai/DeepSeek-R1-Distill-Qwen-1.5B": [
    {
      "batch_size": 1,
      "sequence_length": 4096,
      "num_cores": 2,
      "auto_cast_type": "bf16"
    },
    {
      "batch_size": 4,
      "sequence_length": 4096,
      "num_cores": 2,
      "auto_cast_type": "bf16"
    }
  ],
  "Qwen/Qwen2.5-14B": [
    {
      "batch_size": 1,
      "sequence_length": 4096,
      "num_cores": 8,
      "auto_cast_type": "bf16"
    },
    {
      "batch_size": 16,
      "sequence_length": 4096,
      "num_cores": 8,
      "auto_cast_type": "bf16"
    }
  ],
  "deepseek-ai/DeepSeek-R1-Distill-Qwen-14B": [
    {
      "batch_size": 1,
      "sequence_length": 4096,
      "num_cores": 8,
      "auto_cast_type": "bf16"
    },
    {
      "batch_size": 16,
      "sequence_length": 4096,
      "num_cores": 8,
      "auto_cast_type": "bf16"
    }
  ]
}