abdullahmeda committed on
Commit
bbead68
·
1 Parent(s): 0433b53
Files changed (2) hide show
  1. app.py +8 -7
  2. datasets/sample_100k_lines.json.gz +3 -0
app.py CHANGED
@@ -3,10 +3,11 @@ from cw2 import *
3
 
4
  data_tiny = pd.read_json('datasets/sample_tiny.json', lines=True)
5
  data_small = pd.read_json('datasets/sample_small.json', lines=True)
6
- # data_100k_lines = pd.read_json('datasets/sample_100k_lines.json', lines=True)
7
- # data_400k_lines = pd.read_json('datasets/sample_400k_lines.json', lines=True)
 
8
 
9
- for dataset in [data_tiny, data_small]:#, data_100k_lines, data_400k_lines]:
10
  dataset['visitor_continent'] = dataset['visitor_country'].apply(country_code_to_continent)
11
 
12
 
@@ -51,7 +52,7 @@ with gr.Blocks(css="""
51
  with gr.Column(scale=1, variant='panel', elem_id="space_between"):
52
  t2a_doc_uuid = gr.Textbox(value="140228101942-d4c9bd33cc299cc53d584ca1a4bf15d9", label="Enter document UUID:")
53
  selected_dataset = gr.Radio(label="Choose dataset size:",
54
- choices=['tiny', 'small', '100k_lines', '400k_lines'],
55
  interactive=True,
56
  value='small')
57
  req_1_submit = gr.Button(value="Generate graphs", elem_id="submit_button")
@@ -71,7 +72,7 @@ with gr.Blocks(css="""
71
  with gr.Row():
72
  with gr.Column(scale=1, variant='panel', elem_id="space_between"):
73
  selected_dataset_3 = gr.Radio(label="Choose dataset size:",
74
- choices=['tiny', 'small', '100k_lines', '400k_lines'],
75
  interactive=True,
76
  value='small')
77
  with gr.Row():
@@ -90,7 +91,7 @@ with gr.Blocks(css="""
90
  with gr.Row():
91
  with gr.Column(scale=1, variant='panel', elem_id="space_between"):
92
  selected_dataset_4 = gr.Radio(label="Choose dataset size:",
93
- choices=['tiny', 'small', '100k_lines', '400k_lines'],
94
  interactive=True,
95
  value='small')
96
  with gr.Row():
@@ -114,7 +115,7 @@ with gr.Blocks(css="""
114
  with gr.Row():
115
  with gr.Column(scale=1, variant='panel', elem_id="space_between"):
116
  selected_dataset_5 = gr.Radio(label="Choose dataset size:",
117
- choices=['tiny', 'small', '100k_lines', '400k_lines'],
118
  interactive=True,
119
  value='small')
120
  t5_doc_uuid = gr.Textbox(value="100713205147-2ee05a98f1794324952eea5ca678c026", label="Enter document UUID:")
 
3
 
4
  data_tiny = pd.read_json('datasets/sample_tiny.json', lines=True)
5
  data_small = pd.read_json('datasets/sample_small.json', lines=True)
6
+ data_100k_lines = pd.read_json('datasets/sample_100k_lines.json.gz', lines=True, compression='gzip')
7
+ data_400k_lines = pd.read_json('datasets/sample_400k_lines.json.gz', lines=True, compression='gzip')
8
+ data_600k_lines = pd.read_json('datasets/sample_600k_lines.json.gz', lines=True, compression='gzip')
9
 
10
+ for dataset in [data_tiny, data_small, data_100k_lines, data_400k_lines, data_600k_lines]:
11
  dataset['visitor_continent'] = dataset['visitor_country'].apply(country_code_to_continent)
12
 
13
 
 
52
  with gr.Column(scale=1, variant='panel', elem_id="space_between"):
53
  t2a_doc_uuid = gr.Textbox(value="140228101942-d4c9bd33cc299cc53d584ca1a4bf15d9", label="Enter document UUID:")
54
  selected_dataset = gr.Radio(label="Choose dataset size:",
55
+ choices=['tiny', 'small', '100k_lines', '400k_lines', '600k_lines'],
56
  interactive=True,
57
  value='small')
58
  req_1_submit = gr.Button(value="Generate graphs", elem_id="submit_button")
 
72
  with gr.Row():
73
  with gr.Column(scale=1, variant='panel', elem_id="space_between"):
74
  selected_dataset_3 = gr.Radio(label="Choose dataset size:",
75
+ choices=['tiny', 'small', '100k_lines', '400k_lines', '600k_lines'],
76
  interactive=True,
77
  value='small')
78
  with gr.Row():
 
91
  with gr.Row():
92
  with gr.Column(scale=1, variant='panel', elem_id="space_between"):
93
  selected_dataset_4 = gr.Radio(label="Choose dataset size:",
94
+ choices=['tiny', 'small', '100k_lines', '400k_lines', '600k_lines'],
95
  interactive=True,
96
  value='small')
97
  with gr.Row():
 
115
  with gr.Row():
116
  with gr.Column(scale=1, variant='panel', elem_id="space_between"):
117
  selected_dataset_5 = gr.Radio(label="Choose dataset size:",
118
+ choices=['tiny', 'small', '100k_lines', '400k_lines', '600k_lines'],
119
  interactive=True,
120
  value='small')
121
  t5_doc_uuid = gr.Textbox(value="100713205147-2ee05a98f1794324952eea5ca678c026", label="Enter document UUID:")
datasets/sample_100k_lines.json.gz ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f4863c1c55572a940d0ce4bfb9edb89dfc9106028b58370d1f24d8afb8f48384
3
+ size 3780560