fix(autogptq): do not use_triton with qwen-vl #1985

Merged: 9 commits, Apr 10, 2024
1 change: 0 additions & 1 deletion backend/python/autogptq/autogptq.py
@@ -39,7 +39,6 @@ def LoadModel(self, request, context):
             self.model_name = "Qwen-VL-Chat"
             model = AutoModelForCausalLM.from_pretrained(model_path,
                                                          trust_remote_code=request.TrustRemoteCode,
-                                                         use_triton=request.UseTriton,
                                                          device_map="auto").eval()
         else:
             model = AutoGPTQForCausalLM.from_quantized(model_path,
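For context, here is a minimal sketch of the two load paths this backend distinguishes: `use_triton` is an AutoGPTQ-specific argument accepted by `AutoGPTQForCausalLM.from_quantized`, whereas the Qwen-VL path loads the model through transformers' `AutoModelForCausalLM.from_pretrained`, which does not take that keyword, so forwarding it there fails. The snippet is illustrative only; the `load_model` helper and its dispatch condition are hypothetical, while `model_path` and the `request` fields mirror the names in the diff.

from auto_gptq import AutoGPTQForCausalLM
from transformers import AutoModelForCausalLM


def load_model(model_path, request):
    # Qwen-VL ships its own remote modeling code and is loaded via transformers,
    # which does not accept the AutoGPTQ-only `use_triton` keyword argument.
    if "qwen-vl" in model_path.lower():  # hypothetical dispatch condition
        model = AutoModelForCausalLM.from_pretrained(
            model_path,
            trust_remote_code=request.TrustRemoteCode,
            device_map="auto",
        ).eval()
    else:
        # Plain GPTQ checkpoints go through AutoGPTQ, where `use_triton`
        # selects the Triton dequantization kernels.
        model = AutoGPTQForCausalLM.from_quantized(
            model_path,
            use_triton=request.UseTriton,
            trust_remote_code=request.TrustRemoteCode,
            device_map="auto",
        )
    return model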