nlewins committed on
Commit
b98062a
1 Parent(s): eef5333

Create app.py

Browse files
Files changed (1) hide show
  1. app.py +39 -0
app.py ADDED
@@ -0,0 +1,39 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+
2
+
3
+ # import module
4
+ import streamlit as st
5
+
6
+ import datasets
7
+
8
+ import pandas as pd
9
+
10
# Module-level defaults read by load(). The Streamlit inputs further down the
# script rebind the first four on every run.
access_token = ""
dataset = ""
split = ""
skip = 0

# Names of the dataset columns that load() reads from each example.
column_with_audio = "audio_transcription"
column_with_english_text = "en"
column_with_other_text = "transcription"
18
+
19
def load(page_size=50):
    """Load a window of examples and render each one on the page.

    Reads the module-level ``dataset``, ``access_token``, ``split`` and
    ``skip`` values, loads the examples in ``[skip, skip + page_size)`` from
    the chosen split, and for each example writes a table holding the
    other-language text and the English text, followed by an audio player.

    Args:
        page_size: Number of examples to load, starting at ``skip``.
    """
    start = int(skip)
    # Honour the split chosen in the UI; fall back to "test" (the previously
    # hard-coded value) when the field is empty.
    window = datasets.ReadInstruction(
        split or "test",
        from_=start,
        to=start + page_size,
        unit="abs",
    )
    # An empty token string is passed as None instead of "".
    ds = datasets.load_dataset(dataset, token=access_token or None, split=window)

    for example in ds:
        texts = pd.DataFrame(
            [example[column_with_other_text], example[column_with_english_text]]
        )
        st.table(texts.values)

        audio = example[column_with_audio]
        st.audio(audio["array"], sample_rate=audio["sampling_rate"])
25
+
26
# Title
st.title("One Talk dataset explorer")

# Query inputs. The token field starts empty and is masked: a credential must
# never be committed as a default value or shown in clear text.
access_token = st.text_input("Access token", value="", type="password")
dataset = st.text_input("Dataset", value="nlewins/onetalk_questions_full_audio")
split = st.text_input("Split", value="test")
skip = st.number_input("Skip", value=50, min_value=0)

# Use the button's return value rather than an on_click callback, so load()
# runs once per click, after the inputs above have been read, and its output
# is written below the divider.
go_clicked = st.button("Go")

st.divider()

if go_clicked:
    load()
39
+