@@ -51,14 +51,14 @@ def get_single_decode_uri(
5151 use_logits_soft_cap : bool ,
5252) -> str :
5353 return (
54- f"single_decode_with_kv_cache_dtype_q_ { filename_safe_dtype_map [dtype_q ]} _"
55- f"dtype_kv_ { filename_safe_dtype_map [dtype_kv ]} _"
56- f"dtype_o_ { filename_safe_dtype_map [dtype_o ]} _"
57- f"head_dim_qk_ { head_dim_qk } _"
58- f"head_dim_vo_ { head_dim_vo } _"
59- f"posenc_ { pos_encoding_mode } _"
60- f"use_swa_ { use_sliding_window } _"
61- f"use_logits_cap_ { use_logits_soft_cap } "
54+ f"sdkvcd_q_ { filename_safe_dtype_map [dtype_q ]} _"
55+ f"kv_ { filename_safe_dtype_map [dtype_kv ]} _"
56+ f"o_ { filename_safe_dtype_map [dtype_o ]} _"
57+ f"qk_ { head_dim_qk } _"
58+ f"vo_ { head_dim_vo } _"
59+ f"pe_ { pos_encoding_mode } _"
60+ f"swa_ { use_sliding_window } _"
61+ f"lc_ { use_logits_soft_cap } "
6262 )
6363
6464
@@ -74,15 +74,15 @@ def get_batch_decode_uri(
7474 use_logits_soft_cap : bool ,
7575) -> str :
7676 return (
77- f"batch_decode_with_kv_cache_dtype_q_ { filename_safe_dtype_map [dtype_q ]} _"
78- f"dtype_kv_ { filename_safe_dtype_map [dtype_kv ]} _"
79- f"dtype_o_ { filename_safe_dtype_map [dtype_o ]} _"
80- f"dtype_idx_ { filename_safe_dtype_map [dtype_idx ]} _"
81- f"head_dim_qk_ { head_dim_qk } _"
82- f"head_dim_vo_ { head_dim_vo } _"
83- f"posenc_ { pos_encoding_mode } _"
84- f"use_swa_ { use_sliding_window } _"
85- f"use_logits_cap_ { use_logits_soft_cap } "
77+ f"bdkvcd_q_ { filename_safe_dtype_map [dtype_q ]} _"
78+ f"kv_ { filename_safe_dtype_map [dtype_kv ]} _"
79+ f"o_ { filename_safe_dtype_map [dtype_o ]} _"
80+ f"idx_ { filename_safe_dtype_map [dtype_idx ]} _"
81+ f"qk_ { head_dim_qk } _"
82+ f"vo_ { head_dim_vo } _"
83+ f"pe_ { pos_encoding_mode } _"
84+ f"swa_ { use_sliding_window } _"
85+ f"lc_ { use_logits_soft_cap } "
8686 )
8787
8888
@@ -97,13 +97,13 @@ def get_batch_mla_uri(
9797 use_profiler : bool ,
9898) -> str :
9999 return (
100- f"batch_mla_attention_dtype_q_ { filename_safe_dtype_map [dtype_q ]} _"
101- f"dtype_kv_ { filename_safe_dtype_map [dtype_kv ]} _"
102- f"dtype_o_ { filename_safe_dtype_map [dtype_o ]} _"
103- f"dtype_idx_ { filename_safe_dtype_map [dtype_idx ]} _"
104- f"head_dim_ckv_ { head_dim_ckv } _"
105- f"head_dim_kpe_ { head_dim_kpe } _"
106- f"profiler_ { use_profiler } "
100+ f"bmad_q_ { filename_safe_dtype_map [dtype_q ]} _"
101+ f"kv_ { filename_safe_dtype_map [dtype_kv ]} _"
102+ f"o_ { filename_safe_dtype_map [dtype_o ]} _"
103+ f"idx_ { filename_safe_dtype_map [dtype_idx ]} _"
104+ f"ckv_ { head_dim_ckv } _"
105+ f"kpe_ { head_dim_kpe } _"
106+ f"pr_ { use_profiler } "
107107 ) + ("_sm90" if backend == "fa3" else "" )
108108
109109
@@ -214,13 +214,13 @@ def get_batch_decode_mla_uri(
214214 arc : str ,
215215) -> str :
216216 return (
217- f"batch_decode_mla_with_kv_cache_dtype_q_ { filename_safe_dtype_map [dtype_q ]} _"
218- f"dtype_kv_ { filename_safe_dtype_map [dtype_kv ]} _"
219- f"dtype_o_ { filename_safe_dtype_map [dtype_o ]} _"
220- f"dtype_idx_ { filename_safe_dtype_map [dtype_idx ]} _"
221- f"head_dim_ckv { head_dim_ckv } _"
222- f"use_swa_ { use_sliding_window } _"
223- f"use_logits_cap_ { use_logits_soft_cap } _"
217+ f"bdmkvcd_q_ { filename_safe_dtype_map [dtype_q ]} _"
218+ f"kv_ { filename_safe_dtype_map [dtype_kv ]} _"
219+ f"o_ { filename_safe_dtype_map [dtype_o ]} _"
220+ f"idx_ { filename_safe_dtype_map [dtype_idx ]} _"
221+ f"ckv { head_dim_ckv } _"
222+ f"swa_ { use_sliding_window } _"
223+ f"lc_ { use_logits_soft_cap } _"
224224 f"arc_{ arc } "
225225 )
226226
@@ -326,14 +326,14 @@ def get_single_prefill_uri(
326326 use_fp16_qk_reduction : bool ,
327327) -> str :
328328 return (
329- f"single_prefill_with_kv_cache_dtype_q_ { filename_safe_dtype_map [dtype_q ]} _"
330- f"dtype_kv_ { filename_safe_dtype_map [dtype_kv ]} _"
331- f"dtype_o_ { filename_safe_dtype_map [dtype_o ]} _"
332- f"head_dim_qk_ { head_dim_qk } _"
333- f"head_dim_vo_ { head_dim_vo } _"
334- f"posenc_ { pos_encoding_mode } _"
335- f"use_swa_ { use_sliding_window } _"
336- f"use_logits_cap_ { use_logits_soft_cap } _"
329+ f"spkvcd_q_ { filename_safe_dtype_map [dtype_q ]} _"
330+ f"kv_ { filename_safe_dtype_map [dtype_kv ]} _"
331+ f"o_ { filename_safe_dtype_map [dtype_o ]} _"
332+ f"qk_ { head_dim_qk } _"
333+ f"vo_ { head_dim_vo } _"
334+ f"pe_ { pos_encoding_mode } _"
335+ f"swa_ { use_sliding_window } _"
336+ f"lc_ { use_logits_soft_cap } _"
337337 f"f16qk_{ use_fp16_qk_reduction } " + ("_sm90" if backend == "fa3" else "" )
338338 )
339339
@@ -353,17 +353,17 @@ def get_pod_uri(
353353 use_logits_soft_cap_d : bool ,
354354) -> str :
355355 return (
356- f"pod_with_kv_cache_dtype_q_ { filename_safe_dtype_map [dtype_q ]} _"
357- f"dtype_kv_ { filename_safe_dtype_map [dtype_kv ]} _"
358- f"dtype_o_ { filename_safe_dtype_map [dtype_o ]} _"
359- f"head_dim_ { head_dim } _"
360- f"posenc_p_ { pos_encoding_mode_p } _"
361- f"use_swa_p_ { use_sliding_window_p } _"
362- f"use_logits_cap_p_ { use_logits_soft_cap_p } _"
363- f"posenc_d_ { pos_encoding_mode_d } _"
364- f"use_swa_d_ { use_sliding_window_d } _"
365- f"use_logits_cap_d_ { use_logits_soft_cap_d } _"
366- f"dtype_idx_ { filename_safe_dtype_map [dtype_idx ]} _"
356+ f"pkvcd_q_ { filename_safe_dtype_map [dtype_q ]} _"
357+ f"kv_ { filename_safe_dtype_map [dtype_kv ]} _"
358+ f"o_ { filename_safe_dtype_map [dtype_o ]} _"
359+ f"hd_ { head_dim } _"
360+ f"pe_p_ { pos_encoding_mode_p } _"
361+ f"swa_p_ { use_sliding_window_p } _"
362+ f"lc_p_ { use_logits_soft_cap_p } _"
363+ f"pe_d_ { pos_encoding_mode_d } _"
364+ f"swa_d_ { use_sliding_window_d } _"
365+ f"lc_d_ { use_logits_soft_cap_d } _"
366+ f"idx_ { filename_safe_dtype_map [dtype_idx ]} _"
367367 f"f16qk_{ use_fp16_qk_reduction } "
368368 )
369369
@@ -382,15 +382,15 @@ def get_batch_prefill_uri(
382382 use_fp16_qk_reduction : bool ,
383383) -> str :
384384 return (
385- f"batch_prefill_with_kv_cache_dtype_q_ { filename_safe_dtype_map [dtype_q ]} _"
386- f"dtype_kv_ { filename_safe_dtype_map [dtype_kv ]} _"
387- f"dtype_o_ { filename_safe_dtype_map [dtype_o ]} _"
388- f"dtype_idx_ { filename_safe_dtype_map [dtype_idx ]} _"
389- f"head_dim_qk_ { head_dim_qk } _"
390- f"head_dim_vo_ { head_dim_vo } _"
391- f"posenc_ { pos_encoding_mode } _"
392- f"use_swa_ { use_sliding_window } _"
393- f"use_logits_cap_ { use_logits_soft_cap } _"
385+ f"bpkvcd_q_ { filename_safe_dtype_map [dtype_q ]} _"
386+ f"kv_ { filename_safe_dtype_map [dtype_kv ]} _"
387+ f"o_ { filename_safe_dtype_map [dtype_o ]} _"
388+ f"idx_ { filename_safe_dtype_map [dtype_idx ]} _"
389+ f"qk_ { head_dim_qk } _"
390+ f"vo_ { head_dim_vo } _"
391+ f"pe_ { pos_encoding_mode } _"
392+ f"swa_ { use_sliding_window } _"
393+ f"lc_ { use_logits_soft_cap } _"
394394 f"f16qk_{ use_fp16_qk_reduction } " + ("_sm90" if backend == "fa3" else "" )
395395 )
396396
@@ -407,13 +407,13 @@ def get_batch_prefill_attention_sink_uri(
407407 use_sliding_window : bool ,
408408) -> str :
409409 return (
410- f"batch_prefill_with_attention_sink_kv_cache_dtype_q_ { filename_safe_dtype_map [dtype_q ]} _"
411- f"dtype_kv_ { filename_safe_dtype_map [dtype_kv ]} _"
412- f"dtype_o_ { filename_safe_dtype_map [dtype_o ]} _"
413- f"dtype_idx_ { filename_safe_dtype_map [dtype_idx ]} _"
414- f"head_dim_qk_ { head_dim_qk } _"
415- f"head_dim_vo_ { head_dim_vo } _"
416- f"use_swa_ { use_sliding_window } _" + ("_sm90" if backend == "fa3" else "" )
410+ f"bpaskvcd_q_ { filename_safe_dtype_map [dtype_q ]} _"
411+ f"kv_ { filename_safe_dtype_map [dtype_kv ]} _"
412+ f"o_ { filename_safe_dtype_map [dtype_o ]} _"
413+ f"idx_ { filename_safe_dtype_map [dtype_idx ]} _"
414+ f"qk_ { head_dim_qk } _"
415+ f"vo_ { head_dim_vo } _"
416+ f"swa_ { use_sliding_window } _" + ("_sm90" if backend == "fa3" else "" )
417417 )
418418
419419
@@ -429,15 +429,15 @@ def get_batch_attention_uri(
429429 use_profiler : bool ,
430430) -> str :
431431 return (
432- f"batch_attention_with_kv_cache_dtype_q_ { filename_safe_dtype_map [dtype_q ]} _"
433- f"dtype_kv_ { filename_safe_dtype_map [dtype_kv ]} _"
434- f"dtype_o_ { filename_safe_dtype_map [dtype_o ]} _"
435- f"dtype_idx_ { filename_safe_dtype_map [dtype_idx ]} _"
436- f"head_dim_qk_ { head_dim_qk } _"
437- f"head_dim_vo_ { head_dim_vo } _"
438- f"posenc_ { pos_encoding_mode } _"
439- f"use_logits_soft_cap_ { str (use_logits_soft_cap ).lower ()} _"
440- f"use_profiler_ { str (use_profiler ).lower ()} "
432+ f"bakvcd_q_ { filename_safe_dtype_map [dtype_q ]} _"
433+ f"kv_ { filename_safe_dtype_map [dtype_kv ]} _"
434+ f"o_ { filename_safe_dtype_map [dtype_o ]} _"
435+ f"idx_ { filename_safe_dtype_map [dtype_idx ]} _"
436+ f"qk_ { head_dim_qk } _"
437+ f"vo_ { head_dim_vo } _"
438+ f"pe_ { pos_encoding_mode } _"
439+ f"lc_ { str (use_logits_soft_cap ).lower ()} _"
440+ f"pr_ { str (use_profiler ).lower ()} "
441441 )
442442
443443
@@ -654,7 +654,7 @@ def gen_batch_pod_module(
654654 use_sliding_window_d : bool ,
655655 use_logits_soft_cap_d : bool ,
656656) -> JitSpec :
657- uri = "batch_ " + get_pod_uri (
657+ uri = "b " + get_pod_uri (
658658 dtype_q ,
659659 dtype_kv ,
660660 dtype_o ,
0 commit comments