Spaces:
Running
on
Zero
Running
on
Zero
jadechoghari
committed on
Commit
•
ee59173
1
Parent(s):
35f0b0b
remove users images and update readme
Browse files
- Screenshot 2024-10-24 at 19.50.06.png +0 -3
- Screenshot 2024-10-24 at 19.52.12.png +0 -3
- app.py +10 -1
- clipboard.png +0 -3
- Новый проект 1.png +0 -3
- Новый проект 4.png +0 -3
Screenshot 2024-10-24 at 19.50.06.png
DELETED
Git LFS Details
|
Screenshot 2024-10-24 at 19.52.12.png
DELETED
Git LFS Details
|
app.py
CHANGED
@@ -72,7 +72,7 @@ html = f"""
|
|
72 |
style='width: 80px; height: 80px; border-radius: 20px; box-shadow: 0px 8px 16px rgba(0, 0, 0, 0.2);'/>
|
73 |
<div style="margin-left: 15px;">
|
74 |
<h1 style="font-size: 2.8em; font-family: -apple-system, BlinkMacSystemFont, sans-serif; color: #1D1D1F;
|
75 |
-
font-weight: bold; margin-bottom: 0;"
|
76 |
<p style="font-size: 1.2em; color: #6e6e73; font-family: -apple-system, BlinkMacSystemFont, sans-serif; margin-top: 5px;">
|
77 |
📱 Grounded Mobile UI Understanding with Multimodal LLMs.<br>
|
78 |
A new MLLM tailored for enhanced understanding of mobile UI screens, equipped with referring, grounding, and reasoning capabilities.
|
@@ -123,6 +123,15 @@ with gr.Blocks(title=model_name) as demo:
|
|
123 |
temperature_input = gr.Slider(minimum=0.1, maximum=2.0, step=0.1, value=0.2, label="Temperature")
|
124 |
top_p_input = gr.Slider(minimum=0.0, maximum=1.0, step=0.05, value=0.7, label="Top P")
|
125 |
max_new_tokens_input = gr.Slider(minimum=1, maximum=1024, step=1, value=512, label="Max New Tokens")
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
126 |
|
127 |
with gr.Column(scale=7):
|
128 |
chatbot = gr.Chatbot(
|
|
|
72 |
style='width: 80px; height: 80px; border-radius: 20px; box-shadow: 0px 8px 16px rgba(0, 0, 0, 0.2);'/>
|
73 |
<div style="margin-left: 15px;">
|
74 |
<h1 style="font-size: 2.8em; font-family: -apple-system, BlinkMacSystemFont, sans-serif; color: #1D1D1F;
|
75 |
+
font-weight: bold; margin-bottom: 0;"> {model_name}</h1>
|
76 |
<p style="font-size: 1.2em; color: #6e6e73; font-family: -apple-system, BlinkMacSystemFont, sans-serif; margin-top: 5px;">
|
77 |
📱 Grounded Mobile UI Understanding with Multimodal LLMs.<br>
|
78 |
A new MLLM tailored for enhanced understanding of mobile UI screens, equipped with referring, grounding, and reasoning capabilities.
|
|
|
123 |
temperature_input = gr.Slider(minimum=0.1, maximum=2.0, step=0.1, value=0.2, label="Temperature")
|
124 |
top_p_input = gr.Slider(minimum=0.0, maximum=1.0, step=0.05, value=0.7, label="Top P")
|
125 |
max_new_tokens_input = gr.Slider(minimum=1, maximum=1024, step=1, value=512, label="Max New Tokens")
|
126 |
+
|
127 |
+
gr.Examples(
|
128 |
+
examples=[
|
129 |
+
[{"image": "appstore_reminders.png"}, "Describe the contents inside the box"],
|
130 |
+
[{"image": "appstore_reminders.png"}, "What is the text shown inside the highlighted area"]
|
131 |
+
],
|
132 |
+
inputs=[image_input, text_input],
|
133 |
+
label="Try these examples"
|
134 |
+
)
|
135 |
|
136 |
with gr.Column(scale=7):
|
137 |
chatbot = gr.Chatbot(
|
clipboard.png
DELETED
Git LFS Details
|
Новый проект 1.png
DELETED
Git LFS Details
|
Новый проект 4.png
DELETED
Git LFS Details
|