Spaces:
Running
Running
Update app.py
Browse files
app.py
CHANGED
@@ -53,7 +53,8 @@ with gr.Blocks(css="#b {min-width:15px;background:transparent;}") as demo: #bord
|
|
53 |
with gr.Row():
|
54 |
gr.Markdown(value="""## <p style="text-align: center;"> Code search </p>""")
|
55 |
with gr.Row():
|
56 |
-
|
|
|
57 |
with gr.Row():
|
58 |
with gr.Column(scale=1):
|
59 |
result_list = gr.Dataframe(type="array", visible=False, col_count=1)
|
|
|
53 |
with gr.Row():
|
54 |
gr.Markdown(value="""## <p style="text-align: center;"> Code search </p>""")
|
55 |
with gr.Row():
|
56 |
+
gr.Markdown("This search tool was used to validate tokenization scheme for code retrieval for the BigCode project. We indexed the [Santacoder](https://huggingface.co/bigcode/santacoder) training dataset (Python, Java, and JavaScript) and use a (2,4)-gram tokenizer to build the index. This is the same tokenization scheme that ended up being used to index the [StarCoder](https://huggingface.co/spaces/bigcode/search) dataset.")
|
57 |
+
|
58 |
with gr.Row():
|
59 |
with gr.Column(scale=1):
|
60 |
result_list = gr.Dataframe(type="array", visible=False, col_count=1)
|