You signed in with another tab or window. Reload to refresh your session. You signed out in another tab or window. Reload to refresh your session. You switched accounts on another tab or window. Reload to refresh your session. Dismiss alert
Copy file name to clipboardExpand all lines: src/MaxText/configs/base.yml
+1Lines changed: 1 addition & 0 deletions
Original file line number
Diff line number
Diff line change
@@ -174,6 +174,7 @@ num_experts: 1
174
174
num_experts_per_tok: 1
175
175
megablox: True
176
176
sparse_matmul: True
177
+
use_turbo_grouped_gemm: false # Use Primus Turbo grouped GEMM for MoE sparse matmul. Requires sparse_matmul=True, megablox=False, and primus_turbo installed.
177
178
capacity_factor: -1.0 # a factor to decide expert capacity for token dropping, and no dropping by default
178
179
load_balance_loss_weight: 0.01 # weight for the load balance loss
179
180
expert_balance: False # whether or not to do expert balancing
0 commit comments