Directory listing for /agent-env/lib/python3.11/site-packages/vllm/model_executor/layers/fused_moe/configs/
- E=1,N=14336,device_name=NVIDIA_A100-SXM4-80GB,dtype=int8_w8a16.json
- E=1,N=14336,device_name=NVIDIA_A100-SXM4-80GB.json
- E=1,N=1792,device_name=NVIDIA_A100-SXM4-80GB,dtype=int8_w8a16.json
- E=1,N=1792,device_name=NVIDIA_A100-SXM4-80GB.json
- E=1,N=1792,device_name=NVIDIA_H100_80GB_HBM3,dtype=int8_w8a16.json
- E=1,N=3072,device_name=NVIDIA_A100-SXM4-80GB,dtype=int8_w8a16.json
- E=1,N=3072,device_name=NVIDIA_H100_80GB_HBM3,dtype=int8_w8a16.json
- E=1,N=3072,device_name=NVIDIA_H100_80GB_HBM3.json
- E=1,N=3072,device_name=NVIDIA_H200,dtype=int8_w8a16.json
- E=1,N=3584,device_name=NVIDIA_A100-SXM4-80GB,dtype=int8_w8a16.json
- E=1,N=3584,device_name=NVIDIA_A100-SXM4-80GB.json
- E=1,N=3584,device_name=NVIDIA_H100_80GB_HBM3,dtype=int8_w8a16.json
- E=1,N=7168,device_name=NVIDIA_A100-SXM4-80GB,dtype=int8_w8a16.json
- E=1,N=7168,device_name=NVIDIA_A100-SXM4-80GB.json
- E=1,N=7168,device_name=NVIDIA_H100_80GB_HBM3,dtype=int8_w8a16.json
- E=128,N=1024,device_name=AMD_Instinct_MI300X,dtype=fp8_w8a8.json
- E=128,N=1024,device_name=AMD_Instinct_MI300X.json
- E=128,N=1024,device_name=AMD_Instinct_MI325X,dtype=fp8_w8a8.json
- E=128,N=1024,device_name=NVIDIA_H100,dtype=fp8_w8a8.json
- E=128,N=1024,device_name=NVIDIA_H200,dtype=fp8_w8a8.json
- E=128,N=1024,device_name=NVIDIA_H200.json
- E=128,N=1856,device_name=NVIDIA_H100_80GB_HBM3.json
- E=128,N=1856,device_name=NVIDIA_L40S.json
- E=128,N=192,device_name=NVIDIA_A100-SXM4-80GB.json
- E=128,N=192,device_name=NVIDIA_H100_80GB_HBM3.json
- E=128,N=192,device_name=NVIDIA_H20-3e.json
- E=128,N=192,device_name=NVIDIA_H20.json
- E=128,N=192,device_name=NVIDIA_H200.json
- E=128,N=352,device_name=NVIDIA_H100_80GB_HBM3,dtype=fp8_w8a8.json
- E=128,N=384,device_name=AMD_Instinct_MI300X,dtype=fp8_w8a8,block_shape=[128,128].json
- E=128,N=384,device_name=NVIDIA_B200,dtype=fp8_w8a8,block_shape=[128,128].json
- E=128,N=384,device_name=NVIDIA_GB200,dtype=fp8_w8a8,block_shape=[128,128].json
- E=128,N=384,device_name=NVIDIA_H20,dtype=fp8_w8a8,block_shape=[128,128].json
- E=128,N=384,device_name=NVIDIA_H20-3e,dtype=fp8_w8a8,block_shape=[128,128].json
- E=128,N=384,device_name=NVIDIA_H20-3e.json
- E=128,N=384,device_name=NVIDIA_H20.json
- E=128,N=384,device_name=NVIDIA_H200,dtype=fp8_w8a8,block_shape=[128,128].json
- E=128,N=384,device_name=NVIDIA_H200.json
- E=128,N=512,device_name=NVIDIA_B200,dtype=fp8_w8a8,block_shape=[128,128].json
- E=128,N=512,device_name=NVIDIA_H100_80GB_HBM3.json
- E=128,N=512,device_name=NVIDIA_H200,dtype=fp8_w8a8.json
- E=128,N=704,device_name=NVIDIA_B200,dtype=fp8_w8a8.json
- E=128,N=704,device_name=NVIDIA_H100_80GB_HBM3,dtype=fp8_w8a8.json
- E=128,N=704,device_name=NVIDIA_RTX_PRO_6000_Blackwell_Workstation_Edition,dtype=fp8_w8a8.json
- E=128,N=768,device_name=AMD_Instinct_MI300X,dtype=fp8_w8a8,block_shape=[128,128].json
- E=128,N=768,device_name=AMD_Instinct_MI308X.json
- E=128,N=768,device_name=NVIDIA_B200,dtype=fp8_w8a8,block_shape=[128,128].json
- E=128,N=768,device_name=NVIDIA_B200.json
- E=128,N=768,device_name=NVIDIA_GB200,dtype=fp8_w8a8,block_shape=[128,128].json
- E=128,N=768,device_name=NVIDIA_H20,dtype=fp8_w8a8,block_shape=[128,128].json
- E=128,N=768,device_name=NVIDIA_H20-3e,dtype=fp8_w8a8,block_shape=[128,128].json
- E=128,N=768,device_name=NVIDIA_H20.json
- E=128,N=768,device_name=NVIDIA_H200,dtype=fp8_w8a8,block_shape=[128,128].json
- E=128,N=768,device_name=NVIDIA_H200.json
- E=128,N=8960,device_name=NVIDIA_H100_80GB_HBM3,dtype=bf16.json
- E=128,N=8960,device_name=NVIDIA_H100_80GB_HBM3,dtype=fp8_w8a8.json
- E=128,N=928,device_name=NVIDIA_H100_80GB_HBM3.json
- E=128,N=928,device_name=NVIDIA_L40S.json
- E=128,N=96,device_name=NVIDIA_H20.json
- E=129,N=704,device_name=NVIDIA_RTX_PRO_6000_Blackwell_Workstation_Edition,dtype=fp8_w8a8.json
- E=16,N=1024,device_name=AMD_Instinct_MI300X.json
- E=16,N=1024,device_name=NVIDIA_B200,dtype=fp8_w8a8.json
- E=16,N=1024,device_name=NVIDIA_B200.json
- E=16,N=1024,device_name=NVIDIA_H100.json
- E=16,N=1024,device_name=NVIDIA_H200,dtype=fp8_w8a8.json
- E=16,N=1024,device_name=NVIDIA_H200.json
- E=16,N=1344,device_name=NVIDIA_A100-SXM4-40GB.json
- E=16,N=1344,device_name=NVIDIA_A100-SXM4-80GB.json
- E=16,N=1344,device_name=NVIDIA_H100_80GB_HBM3.json
- E=16,N=14336,device_name=NVIDIA_A100-SXM4-80GB,dtype=int8_w8a16.json
- E=16,N=14336,device_name=NVIDIA_A100-SXM4-80GB.json
- E=16,N=14336,device_name=NVIDIA_H100_80GB_HBM3,dtype=int8_w8a16.json
- E=16,N=1792,device_name=NVIDIA_A100-SXM4-80GB,dtype=int8_w8a16.json
- E=16,N=1792,device_name=NVIDIA_A100-SXM4-80GB.json
- E=16,N=1792,device_name=NVIDIA_H100_80GB_HBM3,dtype=int8_w8a16.json
- E=16,N=1792,device_name=NVIDIA_H100_80GB_HBM3.json
- E=16,N=2048,device_name=NVIDIA_H200,dtype=fp8_w8a8.json
- E=16,N=2048,device_name=NVIDIA_H200.json
- E=16,N=2688,device_name=NVIDIA_A100-SXM4-80GB.json
- E=16,N=2688,device_name=NVIDIA_H100_80GB_HBM3.json
- E=16,N=3072,device_name=NVIDIA_A100-SXM4-80GB,dtype=int8_w8a16.json
- E=16,N=3072,device_name=NVIDIA_H100_80GB_HBM3,dtype=float8.json
- E=16,N=3072,device_name=NVIDIA_H100_80GB_HBM3,dtype=int8_w8a16.json
- E=16,N=3072,device_name=NVIDIA_H200,dtype=int8_w8a16.json
- E=16,N=3200,device_name=NVIDIA_H100_80GB_HBM3,dtype=fp8_w8a8.json
- E=16,N=3584,device_name=NVIDIA_A100-SXM4-80GB,dtype=int8_w8a16.json
- E=16,N=3584,device_name=NVIDIA_A100-SXM4-80GB.json
- E=16,N=3584,device_name=NVIDIA_H100_80GB_HBM3,dtype=int8_w8a16.json
- E=16,N=6400,device_name=NVIDIA_H100_80GB_HBM3,dtype=fp8_w8a8.json
- E=16,N=7168,device_name=NVIDIA_A100-SXM4-80GB,dtype=int8_w8a16.json
- E=16,N=7168,device_name=NVIDIA_A100-SXM4-80GB.json
- E=16,N=7168,device_name=NVIDIA_H100_80GB_HBM3,dtype=float8.json
- E=16,N=7168,device_name=NVIDIA_H100_80GB_HBM3,dtype=int8_w8a16.json
- E=16,N=800,device_name=NVIDIA_H100_80GB_HBM3,dtype=fp8_w8a8.json
- E=160,N=192,device_name=AMD_Instinct_MI300X.json
- E=160,N=192,device_name=AMD_Instinct_MI350_OAM,dtype=fp8_w8a8.json
- E=160,N=192,device_name=NVIDIA_A800-SXM4-80GB.json
- E=160,N=192,device_name=NVIDIA_B300_SXM6_AC,dtype=fp8_w8a8.json
- E=160,N=192,device_name=NVIDIA_H20-3e.json
- E=160,N=192,device_name=NVIDIA_H200,dtype=fp8_w8a8.json
- E=160,N=320,device_name=NVIDIA_H20-3e.json
- E=160,N=384,device_name=AMD_Instinct_MI300X,dtype=fp8_w8a8.json
- E=160,N=384,device_name=AMD_Instinct_MI350_OAM,dtype=fp8_w8a8.json
- E=160,N=384,device_name=AMD_Instinct_MI355_OAM,dtype=fp8_w8a8.json
- E=160,N=384,device_name=NVIDIA_B300_SXM6_AC,dtype=fp8_w8a8.json
- E=160,N=640,device_name=NVIDIA_B200,dtype=fp8_w8a8,block_shape=[128,128].json
- E=160,N=640,device_name=NVIDIA_GB200,dtype=fp8_w8a8,block_shape=[128,128].json
- E=160,N=640,device_name=NVIDIA_H100,dtype=fp8_w8a8,block_shape=[128,128].json
- E=160,N=768,device_name=NVIDIA_B300_SXM6_AC,dtype=fp8_w8a8.json
- E=20,N=1536,device_name=NVIDIA_RTX_PRO_6000_Blackwell_Server_Edition,dtype=fp8_w8a8.json
- E=20,N=2560,device_name=NVIDIA_B200,dtype=fp8_w8a8,block_shape=[128,128].json
- E=20,N=2560,device_name=NVIDIA_GB200,dtype=fp8_w8a8,block_shape=[128,128].json
- E=20,N=2560,device_name=NVIDIA_H100,dtype=fp8_w8a8,block_shape=[128,128].json
- E=20,N=2560,device_name=NVIDIA_H20-3e,dtype=fp8_w8a8,block_shape=[128,128].json
- E=256,N=1024,device_name=AMD_Instinct_MI325_OAM,dtype=fp8_w8a8,block_shape=[128,128].json
- E=256,N=1024,device_name=AMD_Instinct_MI325X,block_shape=[128,128].json
- E=256,N=128,device_name=NVIDIA_A100-SXM4-80GB,dtype=int8_w8a8,block_shape=[128,128].json
- E=256,N=128,device_name=NVIDIA_A100-SXM4-80GB,dtype=int8_w8a8.json
- E=256,N=128,device_name=NVIDIA_A800-SXM4-80GB,dtype=int8_w8a8,block_shape=[128,128].json
- E=256,N=128,device_name=NVIDIA_A800-SXM4-80GB,dtype=int8_w8a8.json
- E=256,N=128,device_name=NVIDIA_H100_80GB_HBM3,dtype=fp8_w8a8,block_shape=[128,128].json
- E=256,N=128,device_name=NVIDIA_H20,dtype=fp8_w8a8,block_shape=[128,128].json
- E=256,N=128,device_name=NVIDIA_L20Y,dtype=fp8_w8a8,block_shape=[128,128].json
- E=256,N=256,device_name=AMD_Instinct_MI300X,dtype=fp8_w8a8,block_shape=[128,128].json
- E=256,N=256,device_name=AMD_Instinct_MI325_OAM,dtype=fp8_w8a8,block_shape=[128,128].json
- E=256,N=256,device_name=AMD_Instinct_MI325X,dtype=fp8_w8a8,block_shape=[128,128].json
- E=256,N=256,device_name=NVIDIA_B200,dtype=fp8_w8a8,block_shape=[128,128].json
- E=256,N=256,device_name=NVIDIA_H20,dtype=fp8_w8a8,block_shape=[128,128].json
- E=256,N=256,device_name=NVIDIA_H20,dtype=int8_w8a8,block_shape=[128,128].json
- E=256,N=256,device_name=NVIDIA_H20-3e,dtype=fp8_w8a8,block_shape=[128,128].json
- E=256,N=256,device_name=NVIDIA_H200,dtype=fp8_w8a8,block_shape=[128,128].json
- E=256,N=256,device_name=NVIDIA_L20,dtype=fp8_w8a8,block_shape=[128,128].json
- E=256,N=384,device_name=NVIDIA_H100_80GB_HBM3,dtype=fp8_w8a8,block_shape=[128,128].json
- E=256,N=512,device_name=AMD_Instinct_MI325_OAM,dtype=fp8_w8a8,block_shape=[128,128].json
- E=256,N=512,device_name=NVIDIA_B200,dtype=fp8_w8a8,block_shape=[128,128].json
- E=256,N=512,device_name=NVIDIA_H100_80GB_HBM3.json
- E=256,N=64,device_name=NVIDIA_A800-SXM4-80GB.json
- E=32,N=1408,device_name=NVIDIA_B200.json
- E=32,N=2048,device_name=NVIDIA_B200,dtype=fp8_w8a8,block_shape=[128,128].json
- E=32,N=2048,device_name=NVIDIA_H200,dtype=fp8_w8a8,block_shape=[128,128].json
- E=384,N=128,device_name=NVIDIA_B200,dtype=fp8_w8a8,block_shape=[128,128].json
- E=384,N=128,device_name=NVIDIA_GB200,dtype=fp8_w8a8,block_shape=[128,128].json
- E=384,N=128,device_name=NVIDIA_H200,dtype=fp8_w8a8,block_shape=[128,128].json
- E=384,N=256,device_name=NVIDIA_B200,dtype=fp8_w8a8,block_shape=[128,128].json
- E=384,N=256,device_name=NVIDIA_GB200,dtype=fp8_w8a8,block_shape=[128,128].json
- E=40,N=1536,device_name=NVIDIA_B200,dtype=fp8_w8a8.json
- E=40,N=2560,device_name=NVIDIA_B200,dtype=fp8_w8a8,block_shape=[128,128].json
- E=40,N=2560,device_name=NVIDIA_GB200,dtype=fp8_w8a8,block_shape=[128,128].json
- E=40,N=2560,device_name=NVIDIA_H100,dtype=fp8_w8a8,block_shape=[128,128].json
- E=512,N=128,device_name=NVIDIA_A100-SXM4-80GB.json
- E=512,N=128,device_name=NVIDIA_B200,dtype=fp8_w8a8,block_shape=[128,128].json
- E=512,N=128,device_name=NVIDIA_B200.json
- E=512,N=128,device_name=NVIDIA_GB200,dtype=fp8_w8a8.json
- E=512,N=128,device_name=NVIDIA_H100_80GB_HBM3.json
- E=512,N=128,device_name=NVIDIA_H20-3e.json
- E=512,N=128,device_name=NVIDIA_H200.json
- E=512,N=256,device_name=NVIDIA_B200,dtype=fp8_w8a8,block_shape=[128,128].json
- E=512,N=256,device_name=NVIDIA_B200.json
- E=512,N=256,device_name=NVIDIA_GB200,dtype=fp8_w8a8.json
- E=512,N=256,device_name=NVIDIA_H100_80GB_HBM3,dtype=fp8_w8a8,block_shape=[128,128].json
- E=512,N=256,device_name=NVIDIA_H100_80GB_HBM3.json
- E=512,N=256,device_name=NVIDIA_H20-3e.json
- E=512,N=256,device_name=NVIDIA_H200.json
- E=512,N=512,device_name=NVIDIA_B200,dtype=fp8_w8a8,block_shape=[128,128].json
- E=512,N=512,device_name=NVIDIA_B200.json
- E=512,N=512,device_name=NVIDIA_GB200,dtype=fp8_w8a8.json
- E=512,N=512,device_name=NVIDIA_H100_80GB_HBM3.json
- E=512,N=512,device_name=NVIDIA_H20-3e.json
- E=512,N=512,device_name=NVIDIA_H200.json
- E=512,N=64,device_name=NVIDIA_A100-SXM4-80GB.json
- E=512,N=64,device_name=NVIDIA_B200.json
- E=512,N=64,device_name=NVIDIA_H20-3e.json
- E=512,N=64,device_name=NVIDIA_H200.json
- E=60,N=1408,device_name=AMD_Instinct_MI300X.json
- E=60,N=176,device_name=AMD_Instinct_MI300X.json
- E=60,N=352,device_name=AMD_Instinct_MI300X.json
- E=60,N=704,device_name=AMD_Instinct_MI300X.json
- E=62,N=128,device_name=AMD_Instinct_MI300X.json
- E=62,N=256,device_name=AMD_Instinct_MI300X.json
- E=62,N=256,device_name=NVIDIA_H100_80GB_HBM3.json
- E=62,N=512,device_name=AMD_Instinct_MI300X.json
- E=62,N=512,device_name=NVIDIA_H100_80GB_HBM3.json
- E=64,N=1280,device_name=NVIDIA_A100-SXM4-80GB.json
- E=64,N=1280,device_name=NVIDIA_A800-SXM4-80GB.json
- E=64,N=1280,device_name=NVIDIA_H100_80GB_HBM3,dtype=fp8_w8a8.json
- E=64,N=1280,device_name=NVIDIA_H100_80GB_HBM3.json
- E=64,N=1280,device_name=NVIDIA_H200,dtype=fp8_w8a8.json
- E=64,N=1280,device_name=NVIDIA_H200.json
- E=64,N=1408,device_name=NVIDIA_B200.json
- E=64,N=1536,device_name=NVIDIA_H20,dtype=fp8_w8a8.json
- E=64,N=2560,device_name=NVIDIA_H100_80GB_HBM3,dtype=fp8_w8a8.json
- E=64,N=2560,device_name=NVIDIA_H200,dtype=fp8_w8a8.json
- E=64,N=2560,device_name=NVIDIA_H200.json
- E=64,N=3072,device_name=NVIDIA_H20,dtype=fp8_w8a8.json
- E=64,N=3072,device_name=NVIDIA_H20.json
- E=64,N=320,device_name=NVIDIA_H100_80GB_HBM3,dtype=fp8_w8a8.json
- E=64,N=320,device_name=NVIDIA_H100_80GB_HBM3.json
- E=64,N=320,device_name=NVIDIA_H200,dtype=fp8_w8a8.json
- E=64,N=320,device_name=NVIDIA_H200.json
- E=64,N=384,device_name=NVIDIA_H20,dtype=fp8_w8a8.json
- E=64,N=384,device_name=NVIDIA_H20.json
- E=64,N=512,device_name=NVIDIA_B200,dtype=fp8_w8a8,block_shape=[128,128].json
- E=64,N=640,device_name=NVIDIA_A100-SXM4-80GB.json
- E=64,N=640,device_name=NVIDIA_A800-SXM4-80GB.json
- E=64,N=640,device_name=NVIDIA_GeForce_RTX_4090,dtype=fp8_w8a8.json
- E=64,N=640,device_name=NVIDIA_H100_80GB_HBM3,dtype=fp8_w8a8.json
- E=64,N=640,device_name=NVIDIA_H100_80GB_HBM3.json
- E=64,N=640,device_name=NVIDIA_H200,dtype=fp8_w8a8.json
- E=64,N=640,device_name=NVIDIA_H200.json
- E=64,N=768,device_name=NVIDIA_H100_PCIe,dtype=fp8_w8a8,block_shape=[128,128].json
- E=64,N=768,device_name=NVIDIA_H20,dtype=fp8_w8a8.json
- E=64,N=768,device_name=NVIDIA_H20.json
- E=64,N=896,device_name=NVIDIA_H20.json
- E=64,N=8960,device_name=NVIDIA_H100_80GB_HBM3,dtype=bf16.json
- E=64,N=8960,device_name=NVIDIA_H100_80GB_HBM3,dtype=fp8_w8a8.json
- E=72,N=192,device_name=AMD_Instinct_MI300X.json
- E=72,N=384,device_name=AMD_Instinct_MI300X.json
- E=72,N=384,device_name=NVIDIA_H100_80GB_HBM3.json
- E=72,N=768,device_name=AMD_Instinct_MI300X.json
- E=72,N=768,device_name=NVIDIA_H100_80GB_HBM3.json
- E=8,N=14336,device_name=AMD_Instinct_MI300X,dtype=fp8_w8a8.json
- E=8,N=14336,device_name=AMD_Instinct_MI300X.json
- E=8,N=14336,device_name=AMD_Instinct_MI325X,dtype=fp8_w8a8.json
- E=8,N=14336,device_name=AMD_Instinct_MI325X.json
- E=8,N=14336,device_name=NVIDIA_H100_80GB_HBM3,dtype=fp8_w8a8.json
- E=8,N=14336,device_name=NVIDIA_H200,dtype=fp8_w8a8.json
- E=8,N=14336,device_name=NVIDIA_H200.json
- E=8,N=16384,device_name=AMD_Instinct_MI300X,dtype=fp8_w8a8.json
- E=8,N=16384,device_name=AMD_Instinct_MI300X.json
- E=8,N=16384,device_name=AMD_Instinct_MI325X,dtype=fp8_w8a8.json
- E=8,N=16384,device_name=AMD_Instinct_MI325X.json
- E=8,N=1792,device_name=AMD_Instinct_MI300X,dtype=fp8_w8a8.json
- E=8,N=1792,device_name=AMD_Instinct_MI300X.json
- E=8,N=1792,device_name=AMD_Instinct_MI325X,dtype=fp8_w8a8.json
- E=8,N=1792,device_name=AMD_Instinct_MI325X.json
- E=8,N=1792,device_name=NVIDIA_A100-SXM4-40GB.json
- E=8,N=1792,device_name=NVIDIA_A100-SXM4-80GB.json
- E=8,N=1792,device_name=NVIDIA_H100_80GB_HBM3.json
- E=8,N=1792,device_name=NVIDIA_H200,dtype=fp8_w8a8.json
- E=8,N=1792,device_name=NVIDIA_H200.json
- E=8,N=2048,device_name=AMD_Instinct_MI300X,dtype=fp8_w8a8.json
- E=8,N=2048,device_name=AMD_Instinct_MI300X.json
- E=8,N=2048,device_name=AMD_Instinct_MI325X,dtype=fp8_w8a8.json
- E=8,N=2048,device_name=AMD_Instinct_MI325X.json
- E=8,N=2048,device_name=NVIDIA_A100-SXM4-80GB.json
- E=8,N=2048,device_name=NVIDIA_H100_80GB_HBM3,dtype=fp8_w8a8.json
- E=8,N=2048,device_name=NVIDIA_H100_80GB_HBM3.json
- E=8,N=2048,device_name=NVIDIA_H200,dtype=fp8_w8a8,block_shape=[128,128].json
- E=8,N=2048,device_name=NVIDIA_H200,dtype=fp8_w8a8.json
- E=8,N=2048,device_name=NVIDIA_H200.json
- E=8,N=3584,device_name=AMD_Instinct_MI300X,dtype=fp8_w8a8.json
- E=8,N=3584,device_name=AMD_Instinct_MI300X.json
- E=8,N=3584,device_name=AMD_Instinct_MI325X,dtype=fp8_w8a8.json
- E=8,N=3584,device_name=AMD_Instinct_MI325X.json
- E=8,N=3584,device_name=NVIDIA_A100-SXM4-40GB.json
- E=8,N=3584,device_name=NVIDIA_A100-SXM4-80GB.json
- E=8,N=3584,device_name=NVIDIA_GeForce_RTX_4090,dtype=fp8_w8a8.json
- E=8,N=3584,device_name=NVIDIA_H100_80GB_HBM3,dtype=fp8_w8a8.json
- E=8,N=3584,device_name=NVIDIA_H100_80GB_HBM3.json
- E=8,N=3584,device_name=NVIDIA_H200,dtype=fp8_w8a8.json
- E=8,N=3584,device_name=NVIDIA_H200.json
- E=8,N=3584,device_name=NVIDIA_L40S.json
- E=8,N=4096,device_name=AMD_Instinct_MI300X,dtype=fp8_w8a8.json
- E=8,N=4096,device_name=AMD_Instinct_MI300X.json
- E=8,N=4096,device_name=AMD_Instinct_MI325X,dtype=fp8_w8a8.json
- E=8,N=4096,device_name=AMD_Instinct_MI325X.json
- E=8,N=4096,device_name=NVIDIA_A100-SXM4-80GB.json
- E=8,N=4096,device_name=NVIDIA_H100_80GB_HBM3,dtype=fp8_w8a8.json
- E=8,N=4096,device_name=NVIDIA_H100_80GB_HBM3.json
- E=8,N=4096,device_name=NVIDIA_H200,dtype=fp8_w8a8.json
- E=8,N=4096,device_name=NVIDIA_H200.json
- E=8,N=7168,device_name=AMD_Instinct_MI300X,dtype=fp8_w8a8.json
- E=8,N=7168,device_name=AMD_Instinct_MI300X.json
- E=8,N=7168,device_name=AMD_Instinct_MI325X,dtype=fp8_w8a8.json
- E=8,N=7168,device_name=AMD_Instinct_MI325X.json
- E=8,N=7168,device_name=NVIDIA_A100-SXM4-80GB.json
- E=8,N=7168,device_name=NVIDIA_H100_80GB_HBM3,dtype=fp8_w8a8.json
- E=8,N=7168,device_name=NVIDIA_H100_80GB_HBM3.json
- E=8,N=7168,device_name=NVIDIA_H200,dtype=fp8_w8a8.json
- E=8,N=7168,device_name=NVIDIA_H200.json
- E=8,N=8192,device_name=AMD_Instinct_MI300X,dtype=fp8_w8a8.json
- E=8,N=8192,device_name=AMD_Instinct_MI300X.json
- E=8,N=8192,device_name=AMD_Instinct_MI325X,dtype=fp8_w8a8.json
- E=8,N=8192,device_name=AMD_Instinct_MI325X.json
- E=8,N=8192,device_name=NVIDIA_H100_80GB_HBM3,dtype=fp8_w8a8.json
- E=8,N=8192,device_name=NVIDIA_H200,dtype=fp8_w8a8.json
- README