3 files changed: +7 -3 lines changed
python/sglang/srt/layers/attention
@@ -56,6 +56,7 @@ def create_aiter_backend(runner):
5656def create_wave_backend (runner ):
5757 try :
5858 from sglang .srt .layers .attention .wave_backend import WaveAttnBackend
59+
5960 return WaveAttnBackend (runner )
6061 except ImportError as e :
6162 if "wave_lang" in str (e ):
Original file line number Diff line number Diff line change 1313
1414_is_hip = is_hip ()
1515if _is_hip :
16- hicache_args = ["--hicache-size" , 200 ]
16+ hicache_args = ["--hicache-size" , 40 ]
17+ mem_frac_args = ["--mem-fraction-static" , 0.2 ]
1718else :
1819 hicache_args = ["--hicache-ratio" , 2 ]
20+ mem_frac_args = []
1921
2022
2123class TestHierarchicalMLA (CustomTestCase ):
@@ -32,6 +34,7 @@ def setUpClass(cls):
3234 "--enable-hierarchical-cache" ,
3335 ]
3436 + hicache_args
37+ + mem_frac_args ,
3538 )
3639
3740 @classmethod
Original file line number Diff line number Diff line change @@ -26,9 +26,9 @@ def setUpClass(cls):
2626 other_args = [
2727 "--enable-hierarchical-cache" ,
2828 "--mem-fraction-static" ,
29- 0.7 ,
29+ 0.7 if not _is_hip else 0.2 ,
3030 "--hicache-size" ,
31- 100 if not _is_hip else 200 ,
31+ 100 if not _is_hip else 40 ,
3232 "--page-size" ,
3333 "64" ,
3434 "--hicache-storage-backend" ,
You can’t perform that action at this time.
0 commit comments