cornzz committed
Commit 020cd59 · 1 Parent(s): 5ede078

Create gradio demo

Files changed (6)
  1. .gitignore +3 -1
  2. demo.py +52 -0
  3. prompt.txt +3 -0
  4. requirements.txt +129 -0
  5. test.ipynb +84 -0
  6. test.py +0 -10
.gitignore CHANGED
@@ -1 +1,3 @@
- venv/
+ venv/
+ flagged/
+ __pycache__/
demo.py ADDED
@@ -0,0 +1,52 @@
+ from llmlingua import PromptCompressor
+ import gradio as gr
+ import torch
+ import pandas as pd
+
+ llm_lingua = PromptCompressor(
+     model_name="microsoft/llmlingua-2-xlm-roberta-large-meetingbank",
+     use_llmlingua2=True,
+     device_map="mps" if torch.backends.mps.is_available() else "cuda" if torch.cuda.is_available() else "cpu",
+ )
+
+
+ def compress_prompt(prompt, rate):
+     result = llm_lingua.compress_prompt(prompt, rate=rate)
+
+     return (
+         result["compressed_prompt"],
+         pd.DataFrame(
+             {
+                 "Original / Compressed Tokens": [f'{result["origin_tokens"]} / {result["compressed_tokens"]}'],
+                 "Ratio": [result["ratio"]],
+                 "Rate": [result["rate"]],
+                 "Saving": [result["saving"]],
+             }
+         ),
+     )
+
+
+ demo = gr.Interface(
+     fn=compress_prompt,
+     inputs=[gr.Textbox(lines=10, label="Prompt"), gr.Slider(0.1, 1, 0.5, label="Rate")],
+     outputs=[
+         gr.Textbox(lines=10, label="Compressed Prompt"),
+         gr.Dataframe(label="Metrics", headers=["Original / compressed tokens", "Ratio", "Rate", "Saving"], row_count=1),
+     ],
+     title="Prompt Compressor",
+     description="Compress a prompt using LLM-Lingua.",
+     allow_flagging="never",
+     examples=[
+         [
+             "John: So, um, I've been thinking about the project, you know, and I believe we need to, uh, make some changes. I mean, we want the project to succeed, right? So, like, I think we should consider maybe revising the timeline. Sarah: I totally agree, John. I mean, we have to be realistic, you know. The timeline is, like, too tight. You know what I mean? We should definitely extend it.",
+             0.3,
+         ],
+         [
+             "Item 15, report from City Manager Recommendation to adopt three resolutions. First, to join the Victory Pace program. Second, to join the California first program. And number three, consenting to to inclusion of certain properties within the jurisdiction in the California Hero program. It was emotion, motion, a second and public comment. CNN. Please cast your vote. Oh. Was your public comment? Yeah. Please come forward. I thank you, Mr. Mayor. Thank you. Members of the council. My name is Alex Mitchell. I represent the hero program. Just wanted to let you know that the hero program. Has been in California for the last three and a half years. We’re in. Over 20. We’re in 28 counties, and we’ve completed over 29,000 energy efficient projects to make homes. Greener and more energy efficient. And this includes anything. From solar to water. Efficiency. We’ve done. Almost.$550 million in home improvements.",
+             0.5,
+         ],
+     ],
+ )
+
+
+ demo.launch()
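
For reference, a minimal sketch of the same compression call without the Gradio UI. This is an illustrative example only: it assumes a CPU-only machine and a made-up input string, and it reads the same result keys that compress_prompt above passes into the metrics DataFrame.

    from llmlingua import PromptCompressor

    # Same model as demo.py; forced to CPU here so the sketch runs anywhere (assumption).
    llm_lingua = PromptCompressor(
        model_name="microsoft/llmlingua-2-xlm-roberta-large-meetingbank",
        use_llmlingua2=True,
        device_map="cpu",
    )

    # rate=0.3 asks LLMLingua-2 to keep roughly 30% of the tokens.
    result = llm_lingua.compress_prompt("So, um, basically, what I wanted to say is that the meeting got moved.", rate=0.3)
    print(result["compressed_prompt"])
    print(result["origin_tokens"], result["compressed_tokens"], result["ratio"], result["rate"], result["saving"])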
prompt.txt ADDED
@@ -0,0 +1,3 @@
+ The fn argument is very flexible -- you can pass any Python function that you want to wrap with a UI. In the example above, we saw a relatively simple function, but the function could be anything from a music generator to a tax calculator to the prediction function of a pretrained machine learning model.
+
+ The inputs and outputs arguments take one or more Gradio components. As we'll see, Gradio includes more than 30 built-in components (such as the gr.Textbox(), gr.Image(), and gr.HTML() components) that are designed for machine learning applications.
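
The two paragraphs above (used here as the demo's sample prompt) describe Gradio's gr.Interface(fn, inputs, outputs) pattern; a minimal, self-contained sketch of that pattern with hypothetical names:

    import gradio as gr

    def greet(name):
        # fn can be any Python callable that the UI wraps (hypothetical example).
        return f"Hello, {name}!"

    # inputs and outputs each take one or more Gradio components, e.g. gr.Textbox().
    gr.Interface(fn=greet, inputs=gr.Textbox(label="Name"), outputs=gr.Textbox(label="Greeting")).launch()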
requirements.txt CHANGED
@@ -1,30 +1,159 @@
1
  accelerate==0.32.1
 
 
 
 
 
 
 
 
 
 
 
 
 
 
2
  certifi==2024.7.4
 
3
  charset-normalizer==3.3.2
4
  click==8.1.7
 
 
 
 
 
 
 
 
 
 
 
 
 
5
  filelock==3.15.4
 
 
6
  fsspec==2024.6.1
 
 
 
 
 
 
7
  huggingface-hub==0.23.5
8
  idna==3.7
 
 
 
 
 
 
9
  Jinja2==3.1.4
10
  joblib==1.4.2
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
11
  llmlingua==0.2.2
 
12
  MarkupSafe==2.1.5
 
 
 
 
13
  mpmath==1.3.0
 
 
 
 
14
  networkx==3.3
15
  nltk==3.8.1
 
 
16
  numpy==1.26.4
 
 
17
  packaging==24.1
 
 
 
 
 
 
 
 
18
  psutil==6.0.0
 
 
 
 
 
 
 
 
 
 
 
 
 
19
  PyYAML==6.0.1
 
 
 
 
20
  regex==2024.5.15
21
  requests==2.32.3
 
 
 
 
 
22
  safetensors==0.4.3
 
 
 
 
 
 
 
 
23
  sympy==1.13.0
 
24
  tiktoken==0.7.0
 
25
  tokenizers==0.19.1
 
 
26
  torch==2.3.1
 
27
  tqdm==4.66.4
 
28
  transformers==4.42.4
 
 
29
  typing_extensions==4.12.2
 
 
30
  urllib3==2.2.2
 
 
 
 
 
 
 
 
 
 
  accelerate==0.32.1
+ aiofiles==23.2.1
+ altair==5.3.0
+ annotated-types==0.7.0
+ anyio==4.4.0
+ appnope==0.1.4
+ argon2-cffi==23.1.0
+ argon2-cffi-bindings==21.2.0
+ arrow==1.3.0
+ asttokens==2.4.1
+ async-lru==2.0.4
+ attrs==23.2.0
+ Babel==2.15.0
+ beautifulsoup4==4.12.3
+ bleach==6.1.0
  certifi==2024.7.4
+ cffi==1.16.0
  charset-normalizer==3.3.2
  click==8.1.7
+ comm==0.2.2
+ contourpy==1.2.1
+ cycler==0.12.1
+ debugpy==1.8.2
+ decorator==5.1.1
+ defusedxml==0.7.1
+ dnspython==2.6.1
+ email_validator==2.2.0
+ executing==2.0.1
+ fastapi==0.111.1
+ fastapi-cli==0.0.4
+ fastjsonschema==2.20.0
+ ffmpy==0.3.2
  filelock==3.15.4
+ fonttools==4.53.1
+ fqdn==1.5.1
  fsspec==2024.6.1
+ gradio==4.38.1
+ gradio_client==1.1.0
+ h11==0.14.0
+ httpcore==1.0.5
+ httptools==0.6.1
+ httpx==0.27.0
  huggingface-hub==0.23.5
  idna==3.7
+ importlib_resources==6.4.0
+ ipykernel==6.29.5
+ ipython==8.26.0
+ ipywidgets==8.1.3
+ isoduration==20.11.0
+ jedi==0.19.1
  Jinja2==3.1.4
  joblib==1.4.2
+ json5==0.9.25
+ jsonpointer==3.0.0
+ jsonschema==4.23.0
+ jsonschema-specifications==2023.12.1
+ jupyter==1.0.0
+ jupyter-console==6.6.3
+ jupyter-events==0.10.0
+ jupyter-lsp==2.2.5
+ jupyter_client==8.6.2
+ jupyter_core==5.7.2
+ jupyter_server==2.14.2
+ jupyter_server_terminals==0.5.3
+ jupyterlab==4.2.3
+ jupyterlab_pygments==0.3.0
+ jupyterlab_server==2.27.3
+ jupyterlab_widgets==3.0.11
+ kiwisolver==1.4.5
  llmlingua==0.2.2
+ markdown-it-py==3.0.0
  MarkupSafe==2.1.5
+ matplotlib==3.9.1
+ matplotlib-inline==0.1.7
+ mdurl==0.1.2
+ mistune==3.0.2
  mpmath==1.3.0
+ nbclient==0.10.0
+ nbconvert==7.16.4
+ nbformat==5.10.4
+ nest-asyncio==1.6.0
  networkx==3.3
  nltk==3.8.1
+ notebook==7.2.1
+ notebook_shim==0.2.4
  numpy==1.26.4
+ orjson==3.10.6
+ overrides==7.7.0
  packaging==24.1
+ pandas==2.2.2
+ pandocfilters==1.5.1
+ parso==0.8.4
+ pexpect==4.9.0
+ pillow==10.4.0
+ platformdirs==4.2.2
+ prometheus_client==0.20.0
+ prompt_toolkit==3.0.47
  psutil==6.0.0
+ ptyprocess==0.7.0
+ pure-eval==0.2.2
+ pycparser==2.22
+ pydantic==2.8.2
+ pydantic_core==2.20.1
+ pydub==0.25.1
+ Pygments==2.18.0
+ pyparsing==3.1.2
+ python-dateutil==2.9.0.post0
+ python-dotenv==1.0.1
+ python-json-logger==2.0.7
+ python-multipart==0.0.9
+ pytz==2024.1
  PyYAML==6.0.1
+ pyzmq==26.0.3
+ qtconsole==5.5.2
+ QtPy==2.4.1
+ referencing==0.35.1
  regex==2024.5.15
  requests==2.32.3
+ rfc3339-validator==0.1.4
+ rfc3986-validator==0.1.1
+ rich==13.7.1
+ rpds-py==0.19.0
+ ruff==0.5.2
  safetensors==0.4.3
+ semantic-version==2.10.0
+ Send2Trash==1.8.3
+ shellingham==1.5.4
+ six==1.16.0
+ sniffio==1.3.1
+ soupsieve==2.5
+ stack-data==0.6.3
+ starlette==0.37.2
  sympy==1.13.0
+ terminado==0.18.1
  tiktoken==0.7.0
+ tinycss2==1.3.0
  tokenizers==0.19.1
+ tomlkit==0.12.0
+ toolz==0.12.1
  torch==2.3.1
+ tornado==6.4.1
  tqdm==4.66.4
+ traitlets==5.14.3
  transformers==4.42.4
+ typer==0.12.3
+ types-python-dateutil==2.9.0.20240316
  typing_extensions==4.12.2
+ tzdata==2024.1
+ uri-template==1.3.0
  urllib3==2.2.2
+ uvicorn==0.30.1
+ uvloop==0.19.0
+ watchfiles==0.22.0
+ wcwidth==0.2.13
+ webcolors==24.6.0
+ webencodings==0.5.1
+ websocket-client==1.8.0
+ websockets==11.0.3
+ widgetsnbextension==4.0.11
test.ipynb ADDED
@@ -0,0 +1,84 @@
+ {
+  "cells": [
+   {
+    "cell_type": "code",
+    "execution_count": 1,
+    "metadata": {},
+    "outputs": [],
+    "source": [
+     "from llmlingua import PromptCompressor"
+    ]
+   },
+   {
+    "cell_type": "code",
+    "execution_count": 2,
+    "metadata": {},
+    "outputs": [],
+    "source": [
+     "llm_lingua = PromptCompressor(\n",
+     " model_name=\"microsoft/llmlingua-2-xlm-roberta-large-meetingbank\",\n",
+     " use_llmlingua2=True,\n",
+     " device_map=\"mps\"\n",
+     ")"
+    ]
+   },
+   {
+    "cell_type": "code",
+    "execution_count": 4,
+    "metadata": {},
+    "outputs": [
+     {
+      "name": "stdout",
+      "output_type": "stream",
+      "text": [
+       "compressed_prompt The fn argument is very flexible -- you can pass any Python function that you want to wrap with a UI. In the example above, we saw a relatively simple function, but the function could be anything from a music generator to a tax calculator to the prediction function of a pretrained machine learning model. The inputs and outputs arguments take one or more Gradio components. As we'll see, Gradio includes more than 30 built-in components (such as the gr.Textbox(), gr.Image(), and gr.HTML() components) that are designed for machine learning applications.\n",
+       "compressed_prompt_list [\"The fn argument is very flexible -- you can pass any Python function that you want to wrap with a UI. In the example above, we saw a relatively simple function, but the function could be anything from a music generator to a tax calculator to the prediction function of a pretrained machine learning model. The inputs and outputs arguments take one or more Gradio components. As we'll see, Gradio includes more than 30 built-in components (such as the gr.Textbox(), gr.Image(), and gr.HTML() components) that are designed for machine learning applications.\"]\n",
+       "origin_tokens 113\n",
+       "compressed_tokens 112\n",
+       "ratio 1.0x\n",
+       "rate 99.1%\n",
+       "saving , Saving $0.0 in GPT-4.\n"
+      ]
+     },
+     {
+      "ename": "",
+      "evalue": "",
+      "output_type": "error",
+      "traceback": [
+       "\u001b[1;31mThe Kernel crashed while executing code in the current cell or a previous cell. \n",
+       "\u001b[1;31mPlease review the code in the cell(s) to identify a possible cause of the failure. \n",
+       "\u001b[1;31mClick <a href='https://aka.ms/vscodeJupyterKernelCrash'>here</a> for more info. \n",
+       "\u001b[1;31mView Jupyter <a href='command:jupyter.viewOutput'>log</a> for further details."
+      ]
+     }
+    ],
+    "source": [
+     "with open(\"prompt.txt\", \"r\") as file:\n",
+     " prompt = file.read()\n",
+     " compressed_prompt = llm_lingua.compress_prompt(prompt, rate=1)\n",
+     " [print(\": \".join(entry)) for entry in compressed_prompt.items()]"
+    ]
+   }
+  ],
+  "metadata": {
+   "kernelspec": {
+    "display_name": "venv",
+    "language": "python",
+    "name": "python3"
+   },
+   "language_info": {
+    "codemirror_mode": {
+     "name": "ipython",
+     "version": 3
+    },
+    "file_extension": ".py",
+    "mimetype": "text/x-python",
+    "name": "python",
+    "nbconvert_exporter": "python",
+    "pygments_lexer": "ipython3",
+    "version": "3.11.6"
+   }
+  },
+  "nbformat": 4,
+  "nbformat_minor": 2
+ }
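
A side note on the notebook's last cell: ": ".join(entry) only succeeds if every value in the result dict is a string. A slightly more defensive sketch of the same inspection (assuming the llm_lingua object from the cell above):

    with open("prompt.txt", "r") as file:
        prompt = file.read()

    result = llm_lingua.compress_prompt(prompt, rate=1)
    for key, value in result.items():
        # f-string formatting works for both string and numeric values.
        print(f"{key}: {value}")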
test.py DELETED
@@ -1,10 +0,0 @@
- from llmlingua import PromptCompressor
-
- llm_lingua = PromptCompressor(
-     model_name="microsoft/llmlingua-2-xlm-roberta-large-meetingbank",
-     use_llmlingua2=True,
-     device_map="mps"
- )
- compressed_prompt = llm_lingua.compress_prompt("The meeting was scheduled for 2:30 PM, but it started at 3:00 PM. Why?", rate=0.5)
-
- print(compressed_prompt)