diff --git a/server/text_generation_server/models/custom_modeling/qwen2_vl.py b/server/text_generation_server/models/custom_modeling/qwen2_vl.py index 4edd336d96d..3bb29b9bca3 100644 --- a/server/text_generation_server/models/custom_modeling/qwen2_vl.py +++ b/server/text_generation_server/models/custom_modeling/qwen2_vl.py @@ -22,9 +22,9 @@ from text_generation_server.utils.import_utils import SYSTEM if SYSTEM == "ipex": - import intel_extension_for_pytorch as ipex + pass else: - import flash_attn_2_cuda + pass from transformers.activations import ACT2FN import torch.nn.functional as F @@ -358,7 +358,7 @@ def __init__(self, prefix, config, weights): self.video_token_id = config.video_token_id self.spatial_merge_size = config.vision_config.spatial_merge_size self.embed_tokens = TensorParallelEmbedding( - prefix=f"model.embed_tokens", weights=weights + prefix="model.embed_tokens", weights=weights ) self.visual = Qwen2VisionModel( prefix="visual", config=config.vision_config, weights=weights