@@ -577,10 +577,11 @@ def apply( # pylint: disable=too-many-locals,missing-docstring
577577 i0 , i1 , i2 , i3 = sch .split (i , factors = i_factors )
578578 j0 , j1 , j2 , j3 = sch .split (j , factors = j_factors )
579579 k0 , k1 = sch .split (k , k_factors )
580- sch .annotate (k0 , "software_pipeline_order" , [0 , 3 , 1 , 4 , 5 , 2 , 6 ])
581- sch .annotate (k0 , "software_pipeline_stage" , [0 , 0 , 0 , 0 , 0 , 1 , 1 ])
582- sch .annotate (k1 , "software_pipeline_order" , [0 , 1 , 2 ])
583- sch .annotate (k1 , "software_pipeline_stage" , [0 , 0 , 1 ])
580+ if target .arch .startswith ("sm_" ) and int (target .arch [- 2 :]) > 75 :
581+ sch .annotate (k0 , "software_pipeline_order" , [0 , 3 , 1 , 4 , 5 , 2 , 6 ])
582+ sch .annotate (k0 , "software_pipeline_stage" , [0 , 0 , 0 , 0 , 0 , 1 , 1 ])
583+ sch .annotate (k1 , "software_pipeline_order" , [0 , 1 , 2 ])
584+ sch .annotate (k1 , "software_pipeline_stage" , [0 , 0 , 1 ])
584585
585586 sch .reorder (i0 , j0 , i1 , j1 , j2 , i2 , k0 , k1 , i3 , j3 )
586587
@@ -798,10 +799,11 @@ def apply( # pylint: disable=too-many-locals,missing-docstring
798799 i0 , i1 , i2 , i3 = sch .split (i , factors = i_factors )
799800 j0 , j1 , j2 , j3 = sch .split (j , factors = j_factors )
800801 k0 , k1 = sch .split (k , k_factors )
801- sch .annotate (k0 , "software_pipeline_order" , [0 , 3 , 1 , 4 , 5 , 2 , 6 ])
802- sch .annotate (k0 , "software_pipeline_stage" , [0 , 0 , 0 , 0 , 0 , 1 , 1 ])
803- sch .annotate (k1 , "software_pipeline_order" , [0 , 1 , 2 ])
804- sch .annotate (k1 , "software_pipeline_stage" , [0 , 0 , 1 ])
802+ if target .arch .startswith ("sm_" ) and int (target .arch [- 2 :]) > 75 :
803+ sch .annotate (k0 , "software_pipeline_order" , [0 , 3 , 1 , 4 , 5 , 2 , 6 ])
804+ sch .annotate (k0 , "software_pipeline_stage" , [0 , 0 , 0 , 0 , 0 , 1 , 1 ])
805+ sch .annotate (k1 , "software_pipeline_order" , [0 , 1 , 2 ])
806+ sch .annotate (k1 , "software_pipeline_stage" , [0 , 0 , 1 ])
805807
806808 sch .reorder (i0 , j0 , i1 , j1 , j2 , i2 , k0 , k1 , i3 , j3 )
807809
0 commit comments