Spaces:
Sleeping
Sleeping
import gradio as gr | |
import pandas as pd | |
import requests | |
import json | |
from datasets import load_dataset | |
#dataset = load_dataset("nlphuji/flickr30k", split="test[10:20]") | |
#print (dataset) | |
#headers = {"Authorization": f"Bearer {API_TOKEN}"} | |
def query1(fetch_url): | |
if fetch_url=="": | |
fetch_url = "nlphuji/flickr30k" | |
API_URL1 = f"https://datasets-server.huggingface.co/splits?dataset={fetch_url}" | |
response = requests.get(API_URL1) | |
json_obj=response.json() | |
config_box = [] | |
split_box = [] | |
for obj in json_obj: | |
print (obj) | |
if obj == "splits": | |
try: | |
for split in json_obj[obj]: | |
print (f'split: {split}') | |
out_config = split['config'] | |
out_split = split['split'] | |
print (out_config) | |
print (out_split) | |
config_box.append(out_config) | |
split_box.append(out_split) | |
except Exception as e: | |
print (e) | |
pass | |
#df = pd.DataFrame.from_dict(json_obj) | |
return json_obj,gr.update(choices=[c for c in config_box]),gr.update(choices=[s for s in split_box]) | |
def query2(fetch_url,config="TEST",split="test",offset=0,length=10): | |
if fetch_url=="": | |
fetch_url = "nlphuji/flickr30k" | |
#offset=0 | |
#length=10 | |
API_URL2 = f"https://datasets-server.huggingface.co/rows?dataset={fetch_url}&config={config}&split={split}&offset={offset}&length={length}" | |
response = requests.get(API_URL2) | |
dictionary=response.json() | |
#print (len(dictionary)) | |
lvl_1=[] | |
for key in dictionary: | |
lvl_1.append(key) | |
print (key) | |
return dictionary,gr.update(choices=[l for l in lvl_1]) | |
def find_fn(lvl_1,lvl_2,fetch_url,config="TEST",split="test",offset=0,length=10): | |
#print(out_json['rows']) | |
#print (inp) | |
img_list=[] | |
out_json,_=query2(fetch_url,config,split,offset=10,length=20) | |
lvl_1=lvl_1.strip("[]") | |
lvl_2=lvl_2.strip('""').strip("''") | |
#print(inp) | |
cnt_lvl = "" | |
if lvl_2 != "": | |
ea_lvl_len = len(lvl_2) | |
print (ea_lvl_len) | |
for ea_lvl in lvl_2: | |
cnt_lvl = f'{cnt_lvl}[{ea_lvl}]' | |
for ea in out_json[f"{lvl_1}"]: | |
cnt_lvl=cnt_lvl.strip("[]") | |
#img_ea = ea['row']['image']['src'] | |
img_list.append(ea[f"{cnt_lvl}"]) | |
if lvl_2 == "": | |
img_list.append(out_json[lvl_1]) | |
return img_list | |
def upd_drop(lvl_1=None,lvl_2=None,lvl_3=None,lvl_4=None,lvl_5=None,fetch_url="",config="TEST",split="test",offset=0,length=10): | |
out_json,_=query2(fetch_url,config,split,offset=10,length=20) | |
box_1=[] | |
box_2=[] | |
box_3=[] | |
box_4=[] | |
box_5=[] | |
out1=None | |
out2=None | |
out3=None | |
out4=None | |
if lvl_1 == "rows": | |
lvl_src= out_json[lvl_1][0] | |
else: | |
lvl_src=out_json[lvl_1] | |
print (f"lvl_src:: {lvl_src}") | |
if lvl_1 !="" and lvl_1 != None: | |
for ea in (lvl_src): | |
box_1.append(ea) | |
out= gr.update(choices = [m for m in box_1]) | |
if lvl_2 !="" and lvl_2 != None: | |
for ea in (lvl_src[lvl_2]): | |
print (ea) | |
box_2.append(ea) | |
out= gr.update(choices = [m for m in box_2]) | |
else: | |
pass | |
if lvl_3 !="" and lvl_3 != None: | |
for ea in (lvl_src): | |
box_3.append(ea[lvl_2][lvl_3]) | |
out= gr.update(choices = [m for m in box_3]) | |
else: | |
pass | |
if lvl_4 !="" and lvl_4 != None: | |
for ea in (lvl_src): | |
box_4.append(ea[lvl_2][lvl_3][lvl_4]) | |
out= gr.update(choices = [m for m in box_4]) | |
else: | |
pass | |
return out | |
def find_items(lvl_1,lvl_2,lvl_3,lvl_4,lvl_5,fetch_url,config="TEST",split="test",offset=0,length=10): | |
out_json,_=query2(fetch_url,config,split,offset=10,length=20) | |
box_1=[] | |
box_2=[] | |
box_3=[] | |
box_4=[] | |
box_5=[] | |
if lvl_1 !="": | |
for ea in (out_json[lvl_1]): | |
box_1.append(ea) | |
out = box_1 | |
if lvl_2 !="": | |
for ea in (out_json[lvl_1]): | |
box_2.append(ea[lvl_2]) | |
out = box_2 | |
if lvl_3 !="": | |
for ea in (out_json[lvl_1]): | |
box_3.append(ea[lvl_2][lvl_3]) | |
out = box_3 | |
if lvl_4 !="": | |
for ea in (out_json[lvl_1]): | |
box_4.append(ea[lvl_2][lvl_3][lvl_4]) | |
out = box_4 | |
if lvl_5 !="": | |
for ea in (out_json[lvl_1]): | |
box_5.append(ea[lvl_2][lvl_3][lvl_4][lvl_5]) | |
out = box_5 | |
return out | |
def img_fn(inp): | |
img_box=[] | |
for img in inp: | |
out = Image.open(inp) | |
img_box.append(out) | |
return img_box | |
with gr.Blocks() as app: | |
with gr.Box(): | |
with gr.Row(): | |
with gr.Column(scale=3): | |
with gr.Row(): | |
data_set_url=gr.Textbox(label="Dataset (repo/name)") | |
fetch_btn=gr.Button() | |
with gr.Row(): | |
config_set=gr.Dropdown(label="Config") | |
split_set=gr.Dropdown(label="Split") | |
#config_drop = gr.Dropdown(label="Config/Split", choices=[]) | |
view_data=gr.Button(label="View") | |
with gr.Row(): | |
lvl_1=gr.Dropdown(label="lvl_1") | |
lvl_2=gr.Dropdown(label="lvl_2") | |
lvl_3=gr.Dropdown(label="lvl_3") | |
lvl_4=gr.Dropdown(label="lvl_4") | |
lvl_5=gr.Dropdown(label="lvl_5") | |
find_btn=gr.Button("Search") | |
with gr.Tab("JSON"): | |
out_find = gr.JSON() | |
with gr.Tab("Gallery"): | |
gal_btn=gr.Button("Load Images") | |
out_gal = gr.Gallery() | |
with gr.Column(scale=1): | |
out_json = gr.JSON() | |
lvl_1.change(upd_drop,[lvl_1,lvl_2,lvl_3,lvl_4,lvl_5,data_set_url,config_set,split_set],[lvl_2]) | |
lvl_2.change(upd_drop,[lvl_1,lvl_2,lvl_3,lvl_4,lvl_5,data_set_url,config_set,split_set],[lvl_3]) | |
lvl_3.change(upd_drop,[lvl_1,lvl_2,lvl_3,lvl_4,lvl_5,data_set_url,config_set,split_set],[lvl_4]) | |
lvl_4.change(upd_drop,[lvl_1,lvl_2,lvl_3,lvl_4,lvl_5,data_set_url,config_set,split_set],[lvl_5]) | |
find_btn.click(find_items,[lvl_1,lvl_2,lvl_3,lvl_4,lvl_5,data_set_url,config_set,split_set],out_find) | |
view_data.click(query2,[data_set_url,config_set,split_set],[out_find,lvl_1]) | |
gal_btn.click(img_fn,out_find,out_gal) | |
#find_btn.click(find_fn,[lvl_1,lvl_2,data_set_url,config_set,split_set],[out_find]) | |
fetch_btn.click(query1,data_set_url,[out_json,config_set,split_set]) | |
app.launch() |