Enhance autogptq backend to support VL models (#1860)

* Enhance autogptq backend to support VL models * update dependencies for autogptq * remove redundant auto-gptq dependency * Convert base64 to image_url for Qwen-VL model * implemented model inference for qwen-vl * remove user prompt from generated answer * fixed write image error --------- Co-authored-by: Binghua Wu <bingwu@estee.com>
2025-05-29 06:54:59 +00:00 · 2024-03-27 01:48:14 +08:00 · 2024-03-27 01:48:14 +08:00 · b7ffe66219
commit b7ffe66219
parent e58410fa99
5 changed files with 75 additions and 18 deletions
--- a/backend/python/autogptq/autogptq.yml
+++ b/backend/python/autogptq/autogptq.yml
@@ -1,3 +1,7 @@
+####
+# Attention! This file is deprecated and no longer maintained.
+# Please use the ../common-env/transformers/transformers.yml file to manage dependencies.
+####
 name: autogptq
 channels:
  - defaults
@@ -24,12 +28,12 @@ dependencies:
  - xz=5.4.2=h5eee18b_0
  - zlib=1.2.13=h5eee18b_0
  - pip:
-      - accelerate==0.23.0
+      - accelerate==0.27.0
      - aiohttp==3.8.5
      - aiosignal==1.3.1
      - async-timeout==4.0.3
      - attrs==23.1.0
-      - auto-gptq==0.4.2
+      - auto-gptq==0.7.1
      - certifi==2023.7.22
      - charset-normalizer==3.3.0
      - datasets==2.14.5
@@ -59,6 +63,7 @@ dependencies:
      - nvidia-nccl-cu12==2.18.1
      - nvidia-nvjitlink-cu12==12.2.140
      - nvidia-nvtx-cu12==12.1.105
+      - optimum==1.17.1
      - packaging==23.2
      - pandas==2.1.1
      - peft==0.5.0
@@ -75,9 +80,11 @@ dependencies:
      - six==1.16.0
      - sympy==1.12
      - tokenizers==0.14.0
-      - torch==2.1.0
      - tqdm==4.66.1
+      - torch==2.2.1
+      - torchvision==0.17.1
      - transformers==4.34.0
+      - transformers_stream_generator==0.0.5
      - triton==2.1.0
      - typing-extensions==4.8.0
      - tzdata==2023.3