Spaces:
Sleeping
Sleeping
Create app.py
Browse files
app.py
ADDED
@@ -0,0 +1,39 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
|
2 |
+
|
3 |
+
# import module
|
4 |
+
import streamlit as st
|
5 |
+
|
6 |
+
import datasets
|
7 |
+
|
8 |
+
import pandas as pd
|
9 |
+
|
10 |
+
# Placeholder values for the explorer's settings. Each of these four names is
# reassigned further down from the matching Streamlit input widget.
access_token=""
|
11 |
+
dataset=""
|
12 |
+
split=""
|
13 |
+
# Row offset: load() uses this as the start of the slice it requests.
skip=0
|
14 |
+
|
15 |
+
# Names of the dataset columns that load() reads from every example.
# The audio column is indexed with "array" and "sampling_rate" in load().
column_with_audio="audio_transcription"
|
16 |
+
column_with_english_text="en"
|
17 |
+
column_with_other_text="transcription"
|
18 |
+
|
19 |
+
def load():
    """Render a 50-example window of the configured dataset in the Streamlit page.

    Reads the module-level settings ``dataset``, ``split``, ``skip`` and
    ``access_token`` together with the three ``column_with_*`` names. For each
    example in the window it writes a two-row table (other-language text first,
    English text second) followed by an audio player for the audio column.
    """
    page_size = 50
    start = int(skip)

    # Honour the user-selected split; previously "test" was hard-coded here and
    # the ``split`` setting was silently ignored. Fall back to "test" when the
    # setting is empty so the old behaviour is kept for that case.
    split_name = split or "test"

    # ``unit="abs"`` makes it explicit that from_/to are absolute row indices.
    window = datasets.ReadInstruction(
        split_name, from_=start, to=start + page_size, unit="abs"
    )

    # Pass None rather than an empty string when no token was entered, so the
    # library can fall back to its own default credential lookup.
    ds = datasets.load_dataset(dataset, token=access_token or None, split=window)

    for example in ds:
        audio = example[column_with_audio]
        df = pd.DataFrame(
            [example[column_with_other_text], example[column_with_english_text]]
        )
        st.table(df.values)
        st.audio(audio["array"], sample_rate=audio["sampling_rate"])
|
25 |
+
|
26 |
+
# Title
st.title("One Talk dataset explorer")

# SECURITY: a Hugging Face access token used to be hard-coded here as the
# default value of a clear-text input, which publishes the credential to
# anyone who can read this file or open the app. The default is now empty and
# the field is masked. The previously committed token must be treated as
# compromised and revoked.
access_token = st.text_input("Access token", value="", type="password")
dataset = st.text_input("Dataset", value="nlewins/onetalk_questions_full_audio")
split = st.text_input("Split", value="test")
# min_value=0 keeps the slice start from going negative.
skip = st.number_input("Skip", value=50, min_value=0)

# The button's return value is used instead of an on_click callback: the
# callback ran load() once before the rerun and the unconditional call at the
# end of the script ran it a second time, so every click loaded and rendered
# the data twice.
go_clicked = st.button("Go")

st.divider()

# Load only on request, so the page does not try to fetch the dataset before
# the user has had a chance to enter a token.
if go_clicked:
    load()
|
39 |
+
|