Skip to content
Merged
Show file tree
Hide file tree
Changes from all commits
Commits
Show all changes
18 commits
Select commit Hold shift + click to select a range
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
1 change: 1 addition & 0 deletions aiter/configs/tuned_fmoe.csv
Original file line number Diff line number Diff line change
Expand Up @@ -786,3 +786,4 @@ cu_num,token,model_dim,inter_dim,expert,topk,act_type,dtype,q_dtype_a,q_dtype_w,
80,256,7168,2048,33,10,ActivationType.Silu,torch.bfloat16,torch.float8_e4m3fnuz,torch.float8_e4m3fnuz,QuantType.per_Token,1,0,32,0,1021.9423,_ZN5aiter45fmoe_bf16_pertokenFp8_g1u1_vs_silu_1tg_32x512E,5.4%,0.0,Null,0.0%,1021.9423,1,220.64,1427.51
80,512,7168,2048,33,10,ActivationType.Silu,torch.bfloat16,torch.float8_e4m3fnuz,torch.float8_e4m3fnuz,QuantType.per_Token,1,0,32,0,1749.1923,_ZN5aiter45fmoe_bf16_pertokenFp8_g1u1_vs_silu_1tg_32x512E,5.4%,0.0,Null,0.0%,1749.1923,1,257.82,837.15
80,1024,7168,2048,33,10,ActivationType.Silu,torch.bfloat16,torch.float8_e4m3fnuz,torch.float8_e4m3fnuz,QuantType.per_Token,1,0,32,0,3226.5114,_ZN5aiter45fmoe_bf16_pertokenFp8_g1u1_vs_silu_1tg_32x512E,5.3%,0.0,Null,0.0%,3226.5114,1,279.54,457.26
256,16,5120,1024,128,1,ActivationType.Silu,torch.bfloat16,torch.float8_e4m3fn,torch.float8_e4m3fn,QuantType.per_Token,1,1,32,0,0.0,_ZN5aiter46fmoe_bf16_pertokenFp8_g1u1_tkw1_silu_1tg_32x64E,0.0%,0.0,Null,0,0.0,1,0.0,0.0
Original file line number Diff line number Diff line change
Expand Up @@ -13,3 +13,4 @@ _ZN5aiter50fmoe_bf16_pertokenFp8_g1u1_vs_tkw1_gelu_1tg_32x256E,fmoe_bf16_pertoke
_ZN5aiter50fmoe_bf16_pertokenFp8_g1u1_vs_tkw1_gelu_1tg_32x512E,fmoe_bf16_pertokenFp8_g1u1_vs_tkw1_gelu_1tg_32x512.co,0,1,0,1,0,32,512
_ZN5aiter50fmoe_bf16_pertokenFp8_g1u1_vs_tkw1_gelu_1tg_32x384E,fmoe_bf16_pertokenFp8_g1u1_vs_tkw1_gelu_1tg_32x384.co,0,1,0,1,0,32,384
_ZN5aiter53fmoe_bf16_pertokenFp8_g1u1_vs_tkw1_gelu_1tg_ps_32x448E,fmoe_bf16_pertokenFp8_g1u1_vs_tkw1_gelu_1tg_ps_32x448.co,0,1,0,1,1,32,448
_ZN5aiter46fmoe_bf16_pertokenFp8_g1u1_tkw1_gelu_1tg_32x64E,fmoe_bf16_pertokenFp8_g1u1_tkw1_gelu_1tg_32x64.co,0,0,0,1,0,32,64
Binary file not shown.
Original file line number Diff line number Diff line change
Expand Up @@ -13,3 +13,4 @@ _ZN5aiter50fmoe_bf16_pertokenFp8_g1u1_vs_tkw1_silu_1tg_32x448E,fmoe_bf16_pertoke
_ZN5aiter50fmoe_bf16_pertokenFp8_g1u1_vs_tkw1_silu_1tg_32x128E,fmoe_bf16_pertokenFp8_g1u1_vs_tkw1_silu_1tg_32x128.co,0,1,0,1,0,32,128
_ZN5aiter50fmoe_bf16_pertokenFp8_g1u1_vs_tkw1_silu_1tg_32x192E,fmoe_bf16_pertokenFp8_g1u1_vs_tkw1_silu_1tg_32x192.co,0,1,0,1,0,32,192
_ZN5aiter53fmoe_bf16_pertokenFp8_g1u1_vs_tkw1_silu_1tg_ps_32x512E,fmoe_bf16_pertokenFp8_g1u1_vs_tkw1_silu_1tg_ps_32x512.co,0,1,0,1,1,32,512
_ZN5aiter46fmoe_bf16_pertokenFp8_g1u1_tkw1_silu_1tg_32x64E,fmoe_bf16_pertokenFp8_g1u1_tkw1_silu_1tg_32x64.co,0,0,0,1,0,32,64
Binary file not shown.