bleysg committed on
Commit
6c44a5d
•
1 Parent(s): 38bd567

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +5 -4
app.py CHANGED
@@ -121,7 +121,8 @@ with gr.Blocks(css=CSS) as demo:
121
  with gr.Row():
122
  with gr.Column():
123
  gr.Markdown(f"""
124
- ## This demo is an unquantized GPU chatbot of [WizardCoder-Python-34B-V1.0-GGUF](https://huggingface.co/TheBloke/WizardCoder-Python-34B-V1.0-GGUF)
 
125
  """)
126
  with gr.Row():
127
  gr.Markdown("# 🔍 WizardCoder-Python-34B-V1.0-GGUF Playground Space! 🔎")
@@ -145,9 +146,9 @@ with gr.Blocks(css=CSS) as demo:
145
  with gr.Row():
146
  with gr.Column():
147
  max_tokens = gr.Slider(20, 4000, label="Max Tokens", step=20, value=2000)
148
- temperature = gr.Slider(0.0, 2.0, label="Temperature", step=0.1, value=0.8)
149
- top_p = gr.Slider(0.0, 1.0, label="Top P", step=0.02, value=0.95)
150
- top_k = gr.Slider(-1, 100, label="Top K", step=1, value=40)
151
  repetition_penalty = gr.Slider(0.0, 2.0, label="Repetition Penalty", step=0.05, value=1.1)
152
 
153
  system_msg = gr.Textbox(
 
121
  with gr.Row():
122
  with gr.Column():
123
  gr.Markdown(f"""
124
+ ## This demo is a quantized GPU chatbot of [WizardCoder-Python-34B-V1.0-GGUF](https://huggingface.co/TheBloke/WizardCoder-Python-34B-V1.0-GGUF)
125
+ It runs two different quantization levels in parallel for comparison. Best run at temperature 0.
126
  """)
127
  with gr.Row():
128
  gr.Markdown("# 🔍 WizardCoder-Python-34B-V1.0-GGUF Playground Space! 🔎")
 
146
  with gr.Row():
147
  with gr.Column():
148
  max_tokens = gr.Slider(20, 4000, label="Max Tokens", step=20, value=2000)
149
+ temperature = gr.Slider(0.0, 2.0, label="Temperature", step=0.1, value=0.0)
150
+ top_p = gr.Slider(0.0, 1.0, label="Top P", step=0.02, value=1.0)
151
+ top_k = gr.Slider(-1, 100, label="Top K", step=1, value=0)
152
  repetition_penalty = gr.Slider(0.0, 2.0, label="Repetition Penalty", step=0.05, value=1.1)
153
 
154
  system_msg = gr.Textbox(