sh2orc committed on
Commit
a3dcd69
·
verified ·
1 Parent(s): 9a0e866

Update README.md

Browse files
Files changed (1) hide show
  1. README.md +5 -5
README.md CHANGED
@@ -8,22 +8,22 @@ license_link: >-
8
  https://huggingface.co/datasets/choosealicense/licenses/blob/main/markdown/apache-2.0.md
9
  language:
10
  - en
11
- base_model: Qwen/Qwen2.5-VL-72B-Instruct
12
  library_name: transformers
13
  ---
14
 
15
  # Qwen2.5-VL-32B-Instruct-FP8-Dynamic
16
 
17
  ## Model Overview
18
- - **Model Architecture:** Qwen2.5-VL-72B-Instruct
19
  - **Input:** Vision-Text
20
  - **Output:** Text
21
  - **Model Optimizations:**
22
  - **Weight quantization:** FP8
23
  - **Activation quantization:** FP8
24
- - **Release Date:** 2/24/2025
25
  - **Version:** 1.0
26
- - **Model Developers:** Neural Magic
27
 
28
  Quantized version of [Qwen/Qwen2.5-VL-32B-Instruct](https://huggingface.co/Qwen/Qwen2.5-VL-32B-Instruct).
29
 
@@ -43,7 +43,7 @@ from vllm import LLM, SamplingParams
43
 
44
  # prepare model
45
  llm = LLM(
46
- model="BCCard/Qwen2.5-VL-72B-Instruct-FP8-Dynamic",
47
  trust_remote_code=True,
48
  max_model_len=4096,
49
  max_num_seqs=2,
 
8
  https://huggingface.co/datasets/choosealicense/licenses/blob/main/markdown/apache-2.0.md
9
  language:
10
  - en
11
+ base_model: Qwen/Qwen2.5-VL-32B-Instruct
12
  library_name: transformers
13
  ---
14
 
15
  # Qwen2.5-VL-32B-Instruct-FP8-Dynamic
16
 
17
  ## Model Overview
18
+ - **Model Architecture:** Qwen2.5-VL-32B-Instruct
19
  - **Input:** Vision-Text
20
  - **Output:** Text
21
  - **Model Optimizations:**
22
  - **Weight quantization:** FP8
23
  - **Activation quantization:** FP8
24
+ - **Release Date:** 5/3/2025
25
  - **Version:** 1.0
26
+ - **Model Developers:** BC Card
27
 
28
  Quantized version of [Qwen/Qwen2.5-VL-32B-Instruct](https://huggingface.co/Qwen/Qwen2.5-VL-32B-Instruct).
29
 
 
43
 
44
  # prepare model
45
  llm = LLM(
46
+ model="BCCard/Qwen2.5-VL-32B-Instruct-FP8-Dynamic",
47
  trust_remote_code=True,
48
  max_model_len=4096,
49
  max_num_seqs=2,