Spaces:

OpenSourceRonin
/

VPTQ_demo

Running on Zero

OpenSourceRonin committed 1 day ago

Commit

9da61be

•

1 Parent(s): cc040f7

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -12,6 +12,14 @@ from huggingface_hub import snapshot_download
 from vptq.app_utils import get_chat_loop_generator
 models = [
     {
         "name": "VPTQ-community/Meta-Llama-3.1-70B-Instruct-v16-k65536-65536-woft",
         "bits": "2 bits"
@@ -24,10 +32,6 @@ models = [
         "name": "VPTQ-community/Meta-Llama-3.1-70B-Instruct-v8-k65536-65536-woft",
         "bits": "4 bits"
     },
-    {
-        "name": "VPTQ-community/Meta-Llama-3.1-8B-Instruct-v8-k65536-65536-woft",
-        "bits": "4 bits"
-    },
     {
         "name": "VPTQ-community/Qwen2.5-72B-Instruct-v8-k65536-65536-woft",
         "bits": "4 bits"

 from vptq.app_utils import get_chat_loop_generator
 models = [
+    {
+        "name": "VPTQ-community/Meta-Llama-3.1-8B-Instruct-v8-k65536-256-woft",
+        "bits": "3 bits"
+    },
+    {
+        "name": "VPTQ-community/Meta-Llama-3.1-8B-Instruct-v8-k65536-65536-woft",
+        "bits": "4 bits"
+    },
     {
         "name": "VPTQ-community/Meta-Llama-3.1-70B-Instruct-v16-k65536-65536-woft",
         "bits": "2 bits"
         "name": "VPTQ-community/Meta-Llama-3.1-70B-Instruct-v8-k65536-65536-woft",
         "bits": "4 bits"
     },
     {
         "name": "VPTQ-community/Qwen2.5-72B-Instruct-v8-k65536-65536-woft",
         "bits": "4 bits"