Remove outdated TODO

huggingface · Feb 7, 2025 · fc3ac80
1 parent df582a1
commit fc3ac80
Showing 1 changed file with 0 additions and 1 deletion.
diff --git a/server/text_generation_server/layers/fp8.py b/server/text_generation_server/layers/fp8.py
@@ -23,7 +23,6 @@
     quantization = None
 
 try:
-    # TODO: needs to be ported over to MoE and used on CUDA.
     from moe_kernels.fp8_utils import w8a8_block_fp8_matmul, per_token_group_quant_fp8
 except ImportError:
     w8a8_block_fp8_matmul = None