dataset-viewer / app.py
Omnibus's picture
Update app.py
f0e40c4
raw
history blame
6.72 kB
import gradio as gr
import pandas as pd
import requests
import json
from datasets import load_dataset
#dataset = load_dataset("nlphuji/flickr30k", split="test[10:20]")
#print (dataset)
#headers = {"Authorization": f"Bearer {API_TOKEN}"}
def query1(fetch_url):
    """List the configs and splits reported for a dataset.

    Sends a GET request to the datasets-server ``/splits`` endpoint and
    collects the ``config`` and ``split`` fields of every entry found under
    the ``"splits"`` key of the decoded JSON response.

    Args:
        fetch_url: Dataset identifier sent as the ``dataset`` query
            parameter. An empty string falls back to
            ``"nlphuji/flickr30k"``.

    Returns:
        A 3-tuple ``(json_obj, config_update, split_update)``: the decoded
        JSON response, then two ``gr.update(choices=...)`` objects holding
        the distinct config names and the distinct split names in
        first-seen order.
    """
    if fetch_url == "":
        fetch_url = "nlphuji/flickr30k"

    # Let requests build the query string so that characters such as '&',
    # '#' or spaces in the dataset id cannot corrupt the URL, and bound the
    # wait so a stalled server cannot hang the UI callback forever.
    response = requests.get(
        "https://datasets-server.huggingface.co/splits",
        params={"dataset": fetch_url},
        timeout=30,
    )
    json_obj = response.json()

    entries = json_obj.get("splits", []) if isinstance(json_obj, dict) else []
    config_box = []
    split_box = []
    for entry in entries:
        try:
            out_config = entry["config"]
            out_split = entry["split"]
        except (KeyError, TypeError) as e:
            # Skip a malformed entry instead of abandoning the whole list.
            print(e)
            continue
        config_box.append(out_config)
        split_box.append(out_split)

    # The same config appears once per split (and the same split name once
    # per config); dict.fromkeys removes repeats while keeping order.
    config_choices = list(dict.fromkeys(config_box))
    split_choices = list(dict.fromkeys(split_box))
    return json_obj, gr.update(choices=config_choices), gr.update(choices=split_choices)
def query2(fetch_url, config="TEST", split="test", offset=0, length=10):
    """Fetch a window of rows for a dataset from the datasets-server.

    Sends a GET request to the ``/rows`` endpoint with the given dataset,
    config, split, offset and length as query parameters.

    Args:
        fetch_url: Dataset identifier sent as the ``dataset`` query
            parameter. An empty string falls back to
            ``"nlphuji/flickr30k"``.
        config: Value of the ``config`` query parameter.
        split: Value of the ``split`` query parameter.
        offset: Value of the ``offset`` query parameter.
        length: Value of the ``length`` query parameter.

    Returns:
        A 2-tuple ``(dictionary, update)``: the decoded JSON response and a
        ``gr.update(choices=...)`` whose choices are the items obtained by
        iterating the response (its top-level keys when it is a dict).
    """
    if fetch_url == "":
        fetch_url = "nlphuji/flickr30k"

    # Pass the values through `params` so they are URL-encoded, and set a
    # timeout so the callback cannot block indefinitely.
    response = requests.get(
        "https://datasets-server.huggingface.co/rows",
        params={
            "dataset": fetch_url,
            "config": config,
            "split": split,
            "offset": offset,
            "length": length,
        },
        timeout=30,
    )
    dictionary = response.json()
    return dictionary, gr.update(choices=list(dictionary))
def find_fn(lvl_1, lvl_2, fetch_url, config="TEST", split="test", offset=0, length=10):
    """Collect values from the rows response for the given key selection.

    Args:
        lvl_1: Top-level key of the response; surrounding ``[`` / ``]``
            characters are stripped before use.
        lvl_2: Second-level key text; surrounding double and single quotes
            are stripped before use. May be empty.
        fetch_url: Dataset identifier forwarded to ``query2``.
        config: Config name forwarded to ``query2``.
        split: Split name forwarded to ``query2``.
        offset: Row offset forwarded to ``query2``.
        length: Row count forwarded to ``query2``.

    Returns:
        When ``lvl_2`` is empty, a one-element list holding
        ``out_json[lvl_1]``. Otherwise a list with one looked-up value per
        item of ``out_json[lvl_1]``.
    """
    # Forward the caller's window; it used to be replaced by a fixed
    # offset=10 / length=20 regardless of the arguments.
    out_json, _ = query2(fetch_url, config, split, offset=offset, length=length)
    lvl_1 = lvl_1.strip("[]")
    lvl_2 = lvl_2.strip('""').strip("''")

    if lvl_2 == "":
        return [out_json[lvl_1]]

    print(len(lvl_2))
    # NOTE(review): the key is built by wrapping every character of lvl_2 in
    # brackets and then stripping the outer brackets, so it only equals
    # lvl_2 for single-character input. This looks unintended - confirm the
    # expected format of lvl_2 before relying on this function.
    cnt_lvl = "".join(f"[{ea_lvl}]" for ea_lvl in lvl_2).strip("[]")
    return [ea[cnt_lvl] for ea in out_json[lvl_1]]
def upd_drop(lvl_1=None, lvl_2=None, lvl_3=None, lvl_4=None, lvl_5=None,
             fetch_url="", config="TEST", split="test", offset=0, length=10):
    """Compute the choices for the next level dropdown.

    Fetches rows through ``query2`` and walks down the response following
    the selected levels. For ``lvl_1 == "rows"`` the first row is used as
    the starting point; for any other key the value stored under that key
    is used. Levels are followed in order and the walk stops at the first
    level that is ``None`` or empty.

    Args:
        lvl_1: Selected top-level key of the response.
        lvl_2: Selected key below ``lvl_1`` (optional).
        lvl_3: Selected key below ``lvl_2`` (optional).
        lvl_4: Selected key below ``lvl_3`` (optional).
        lvl_5: Accepted for signature parity with the event wiring; not
            used when computing choices.
        fetch_url: Dataset identifier forwarded to ``query2``.
        config: Config name forwarded to ``query2``.
        split: Split name forwarded to ``query2``.
        offset: Row offset forwarded to ``query2``.
        length: Row count forwarded to ``query2``.

    Returns:
        A ``gr.update(choices=...)``. The choices are the keys of the
        reached value when it is a dict, its elements when it is a list,
        and empty when nothing is selected, the path cannot be followed, or
        the reached value is a scalar.
    """
    # Nothing selected yet: there is no key to look up, so offer nothing
    # rather than indexing the response with None / "".
    if lvl_1 is None or lvl_1 == "":
        return gr.update(choices=[])

    # Forward the caller's window instead of a fixed offset=10 / length=20.
    out_json, _ = query2(fetch_url, config, split, offset=offset, length=length)

    try:
        lvl_src = out_json[lvl_1]
        if lvl_1 == "rows":
            lvl_src = lvl_src[0]
        # Descend one selected level at a time. The previous per-level loops
        # iterated the container's keys and indexed those strings, which
        # raised for every lvl_3 / lvl_4 selection.
        for key in (lvl_2, lvl_3, lvl_4):
            if key is None or key == "":
                break
            lvl_src = lvl_src[key]
    except (KeyError, IndexError, TypeError) as e:
        # A selection that does not exist in this response (or an empty
        # rows list) yields no choices.
        print(e)
        return gr.update(choices=[])

    if isinstance(lvl_src, (dict, list)):
        return gr.update(choices=list(lvl_src))
    return gr.update(choices=[])
def find_items(lvl_1, lvl_2, lvl_3, lvl_4, lvl_5, fetch_url,
               config="TEST", split="test", offset=0, length=10):
    """Extract one value per item of ``out_json[lvl_1]`` along a key path.

    Fetches rows through ``query2``, then for every item obtained by
    iterating ``out_json[lvl_1]`` follows the selected ``lvl_2`` ...
    ``lvl_5`` keys in order. The path ends at the first level that is
    ``None`` or empty.

    Args:
        lvl_1: Top-level key of the response to iterate.
        lvl_2: First key applied to each item (optional).
        lvl_3: Second key applied to each item (optional).
        lvl_4: Third key applied to each item (optional).
        lvl_5: Fourth key applied to each item (optional).
        fetch_url: Dataset identifier forwarded to ``query2``.
        config: Config name forwarded to ``query2``.
        split: Split name forwarded to ``query2``.
        offset: Row offset forwarded to ``query2``.
        length: Row count forwarded to ``query2``.

    Returns:
        A list with the value reached for each item; the items themselves
        when no deeper level is selected; an empty list when ``lvl_1`` is
        not selected.

    Raises:
        KeyError: If ``lvl_1`` or a selected deeper key is missing.
    """
    # An unset dropdown may arrive as None as well as "", so treat both as
    # "not selected" instead of using None as a dictionary key.
    if lvl_1 is None or lvl_1 == "":
        return []

    # Forward the caller's window instead of a fixed offset=10 / length=20.
    out_json, _ = query2(fetch_url, config, split, offset=offset, length=length)

    path = []
    for key in (lvl_2, lvl_3, lvl_4, lvl_5):
        if key is None or key == "":
            break
        path.append(key)

    out = []
    for ea in out_json[lvl_1]:
        value = ea
        for key in path:
            value = value[key]
        out.append(value)
    return out
def img_fn(inp):
    """Open every entry of *inp* with ``Image.open``.

    Args:
        inp: Iterable of values to pass to ``Image.open``, one at a time.

    Returns:
        A list with the result of ``Image.open`` for each entry, in order.
    """
    # NOTE(review): `Image` is not imported in the visible part of this
    # file; presumably it is meant to be `PIL.Image` - confirm and import it
    # at the top of the file.
    # Open each entry on its own: the loop previously passed the whole `inp`
    # collection to Image.open on every iteration.
    return [Image.open(img) for img in inp]
# UI definition: dataset/config/split pickers, five nested-key dropdowns,
# a JSON + gallery result area, and the raw splits response on the side.
with gr.Blocks() as app:
    with gr.Box():
        with gr.Row():
            with gr.Column(scale=3):
                with gr.Row():
                    data_set_url = gr.Textbox(label="Dataset (repo/name)")
                    fetch_btn = gr.Button()
                with gr.Row():
                    config_set = gr.Dropdown(label="Config")
                    split_set = gr.Dropdown(label="Split")
                    # The caption is the first positional argument (`value`);
                    # passing it as `label=` did not set the button text.
                    view_data = gr.Button("View")
                with gr.Row():
                    lvl_1 = gr.Dropdown(label="lvl_1")
                    lvl_2 = gr.Dropdown(label="lvl_2")
                    lvl_3 = gr.Dropdown(label="lvl_3")
                    lvl_4 = gr.Dropdown(label="lvl_4")
                    lvl_5 = gr.Dropdown(label="lvl_5")
                find_btn = gr.Button("Search")
                with gr.Tab("JSON"):
                    out_find = gr.JSON()
                with gr.Tab("Gallery"):
                    gal_btn = gr.Button("Load Images")
                    out_gal = gr.Gallery()
            with gr.Column(scale=1):
                out_json = gr.JSON()

    # Every level dropdown shares the same inputs; changing level N
    # refreshes the choices of level N + 1.
    level_inputs = [lvl_1, lvl_2, lvl_3, lvl_4, lvl_5, data_set_url, config_set, split_set]
    lvl_1.change(upd_drop, level_inputs, [lvl_2])
    lvl_2.change(upd_drop, level_inputs, [lvl_3])
    lvl_3.change(upd_drop, level_inputs, [lvl_4])
    lvl_4.change(upd_drop, level_inputs, [lvl_5])

    find_btn.click(find_items, level_inputs, out_find)
    view_data.click(query2, [data_set_url, config_set, split_set], [out_find, lvl_1])
    gal_btn.click(img_fn, out_find, out_gal)
    fetch_btn.click(query1, data_set_url, [out_json, config_set, split_set])
app.launch()