Spaces:
Running
Running
David Pomerenke
commited on
Commit
·
a9e6b9b
1
Parent(s):
603effe
Improve plots and dataset table
Browse files
frontend/src/components/DatasetTable.js
CHANGED
|
@@ -140,13 +140,13 @@ const DatasetTable = ({ data }) => {
|
|
| 140 |
body={linkBodyTemplate}
|
| 141 |
/>
|
| 142 |
<Column
|
| 143 |
-
field='
|
| 144 |
-
header='
|
|
|
|
| 145 |
filter
|
| 146 |
-
|
| 147 |
-
|
| 148 |
-
|
| 149 |
-
body={tasksBodyTemplate}
|
| 150 |
/>
|
| 151 |
<Column
|
| 152 |
field='translation'
|
|
@@ -158,13 +158,13 @@ const DatasetTable = ({ data }) => {
|
|
| 158 |
body={translationBodyTemplate}
|
| 159 |
/>
|
| 160 |
<Column
|
| 161 |
-
field='
|
| 162 |
-
header='
|
| 163 |
-
headerTooltip='Number of languages in the dataset'
|
| 164 |
filter
|
| 165 |
-
|
| 166 |
-
|
| 167 |
-
|
|
|
|
| 168 |
/>
|
| 169 |
</DataTable>
|
| 170 |
)
|
|
|
|
| 140 |
body={linkBodyTemplate}
|
| 141 |
/>
|
| 142 |
<Column
|
| 143 |
+
field='n_languages'
|
| 144 |
+
header='Languages'
|
| 145 |
+
headerTooltip='Number of languages in the dataset'
|
| 146 |
filter
|
| 147 |
+
sortable
|
| 148 |
+
style={{ minWidth: '5rem', maxWidth: '10rem' }}
|
| 149 |
+
body={nLanguagesBodyTemplate}
|
|
|
|
| 150 |
/>
|
| 151 |
<Column
|
| 152 |
field='translation'
|
|
|
|
| 158 |
body={translationBodyTemplate}
|
| 159 |
/>
|
| 160 |
<Column
|
| 161 |
+
field='tasks'
|
| 162 |
+
header='Tasks'
|
|
|
|
| 163 |
filter
|
| 164 |
+
filterElement={tasksRowFilterTemplate}
|
| 165 |
+
showFilterMatchModes={false}
|
| 166 |
+
style={{ minWidth: '10rem', maxWidth: '15rem' }}
|
| 167 |
+
body={tasksBodyTemplate}
|
| 168 |
/>
|
| 169 |
</DataTable>
|
| 170 |
)
|
frontend/src/components/LanguagePlot.js
CHANGED
|
@@ -3,32 +3,46 @@ import * as Plot from '@observablehq/plot'
|
|
| 3 |
|
| 4 |
const LanguagePlot = ({ data }) => {
|
| 5 |
const containerRef = useRef()
|
| 6 |
-
const languages = data.language_table.filter
|
| 7 |
const families = [...new Set(languages.map(a => a.family))]
|
| 8 |
|
| 9 |
useEffect(() => {
|
| 10 |
const plot = Plot.plot({
|
| 11 |
width: 750,
|
| 12 |
height: 500,
|
| 13 |
-
|
| 14 |
x: {
|
| 15 |
label: 'Number of Speakers',
|
| 16 |
type: 'log'
|
| 17 |
},
|
| 18 |
y: {
|
| 19 |
-
label: 'Language Proficiency Score'
|
| 20 |
},
|
| 21 |
marks: [
|
| 22 |
Plot.dot(languages, {
|
| 23 |
x: 'speakers',
|
| 24 |
y: d => d.average,
|
| 25 |
-
r:
|
| 26 |
fill: 'family',
|
| 27 |
-
|
| 28 |
-
|
|
|
|
|
|
|
| 29 |
tip: true
|
| 30 |
}),
|
| 31 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 32 |
})
|
| 33 |
containerRef.current.append(plot)
|
| 34 |
return () => plot.remove()
|
|
@@ -42,7 +56,7 @@ const LanguagePlot = ({ data }) => {
|
|
| 42 |
height: '100%',
|
| 43 |
display: 'flex',
|
| 44 |
alignItems: 'center',
|
| 45 |
-
justifyContent: 'center'
|
| 46 |
}}
|
| 47 |
/>
|
| 48 |
)
|
|
|
|
| 3 |
|
| 4 |
const LanguagePlot = ({ data }) => {
|
| 5 |
const containerRef = useRef()
|
| 6 |
+
const languages = data.language_table.filter(a => a.average > 0)
|
| 7 |
const families = [...new Set(languages.map(a => a.family))]
|
| 8 |
|
| 9 |
useEffect(() => {
|
| 10 |
const plot = Plot.plot({
|
| 11 |
width: 750,
|
| 12 |
height: 500,
|
| 13 |
+
subtitle: 'Proficiency scores by language',
|
| 14 |
x: {
|
| 15 |
label: 'Number of Speakers',
|
| 16 |
type: 'log'
|
| 17 |
},
|
| 18 |
y: {
|
| 19 |
+
label: 'Language Proficiency Score'
|
| 20 |
},
|
| 21 |
marks: [
|
| 22 |
Plot.dot(languages, {
|
| 23 |
x: 'speakers',
|
| 24 |
y: d => d.average,
|
| 25 |
+
r: 'speakers',
|
| 26 |
fill: 'family',
|
| 27 |
+
title: d =>
|
| 28 |
+
`${d.language_name}\n${d.speakers.toLocaleString('en-US', {
|
| 29 |
+
notation: 'compact'
|
| 30 |
+
})} speakers\nScore: ${d.average.toFixed(2)}`,
|
| 31 |
tip: true
|
| 32 |
}),
|
| 33 |
+
Plot.text(
|
| 34 |
+
languages.filter(a => a.speakers > 5e8),
|
| 35 |
+
{
|
| 36 |
+
x: 'speakers',
|
| 37 |
+
y: d => d.average,
|
| 38 |
+
text: d => d.language_name,
|
| 39 |
+
fill: 'black',
|
| 40 |
+
frameAnchor: 'left',
|
| 41 |
+
dx: 10,
|
| 42 |
+
marginRight: 100
|
| 43 |
+
}
|
| 44 |
+
)
|
| 45 |
+
]
|
| 46 |
})
|
| 47 |
containerRef.current.append(plot)
|
| 48 |
return () => plot.remove()
|
|
|
|
| 56 |
height: '100%',
|
| 57 |
display: 'flex',
|
| 58 |
alignItems: 'center',
|
| 59 |
+
justifyContent: 'center'
|
| 60 |
}}
|
| 61 |
/>
|
| 62 |
)
|
frontend/src/components/SpeakerPlot.js
CHANGED
|
@@ -3,56 +3,81 @@ import * as Plot from '@observablehq/plot'
|
|
| 3 |
|
| 4 |
const SpeakerPlot = ({ data }) => {
|
| 5 |
const containerRef = useRef()
|
| 6 |
-
const allSpeakers = data.language_table.reduce(
|
| 7 |
-
|
| 8 |
-
|
| 9 |
-
|
| 10 |
-
|
| 11 |
-
|
| 12 |
-
|
| 13 |
-
|
| 14 |
-
|
| 15 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 16 |
|
| 17 |
useEffect(() => {
|
| 18 |
const plot = Plot.plot({
|
| 19 |
width: 750,
|
| 20 |
height: 500,
|
| 21 |
-
|
| 22 |
x: {
|
| 23 |
label: 'Languages',
|
| 24 |
-
ticks: []
|
| 25 |
},
|
| 26 |
y: {
|
| 27 |
-
label: 'Number of Speakers (millions)'
|
| 28 |
},
|
| 29 |
color: {
|
| 30 |
legend: true,
|
| 31 |
-
domain: [
|
| 32 |
-
range: [
|
| 33 |
},
|
| 34 |
marks: [
|
| 35 |
-
Plot.barY(languages,
|
| 36 |
-
|
| 37 |
-
x: "rank",
|
| 38 |
y: d => d.cumSpeakers / 1e6,
|
| 39 |
-
fill: d =>
|
| 40 |
sort: { x: 'y' },
|
| 41 |
-
title: d =>
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 42 |
tip: true // {y: d => d.cumSpeakers / 1e6 * 2}
|
| 43 |
}),
|
| 44 |
-
Plot.barY(languages,
|
| 45 |
-
|
| 46 |
-
x: "rank",
|
| 47 |
y: d => d.speakers / 1e6,
|
| 48 |
-
title: d =>
|
|
|
|
|
|
|
|
|
|
|
|
|
| 49 |
tip: true,
|
| 50 |
-
fill: d =>
|
| 51 |
sort: { x: '-y' }
|
| 52 |
}),
|
| 53 |
-
Plot.crosshairX(languages, {
|
| 54 |
-
|
| 55 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 56 |
})
|
| 57 |
containerRef.current.append(plot)
|
| 58 |
return () => plot.remove()
|
|
@@ -66,7 +91,7 @@ const SpeakerPlot = ({ data }) => {
|
|
| 66 |
height: '100%',
|
| 67 |
display: 'flex',
|
| 68 |
alignItems: 'center',
|
| 69 |
-
justifyContent: 'center'
|
| 70 |
}}
|
| 71 |
/>
|
| 72 |
)
|
|
|
|
| 3 |
|
| 4 |
const SpeakerPlot = ({ data }) => {
|
| 5 |
const containerRef = useRef()
|
| 6 |
+
const allSpeakers = data.language_table.reduce(
|
| 7 |
+
(sum, curr) => sum + curr.speakers,
|
| 8 |
+
0
|
| 9 |
+
)
|
| 10 |
+
const languages = data.language_table
|
| 11 |
+
.sort((a, b) => b.speakers - a.speakers)
|
| 12 |
+
.slice(0, 100)
|
| 13 |
+
.reduce((acc, d) => {
|
| 14 |
+
acc.push({
|
| 15 |
+
...d,
|
| 16 |
+
rank: acc.length + 1,
|
| 17 |
+
cumSpeakers:
|
| 18 |
+
acc.reduce((sum, curr) => sum + curr.speakers, 0) + d.speakers,
|
| 19 |
+
cumSpeakersPercent:
|
| 20 |
+
(acc.reduce((sum, curr) => sum + curr.speakers, 0) + d.speakers) /
|
| 21 |
+
allSpeakers
|
| 22 |
+
})
|
| 23 |
+
return acc
|
| 24 |
+
}, [])
|
| 25 |
|
| 26 |
useEffect(() => {
|
| 27 |
const plot = Plot.plot({
|
| 28 |
width: 750,
|
| 29 |
height: 500,
|
| 30 |
+
subtitle: 'Number of languages vs speakers covered',
|
| 31 |
x: {
|
| 32 |
label: 'Languages',
|
| 33 |
+
ticks: []
|
| 34 |
},
|
| 35 |
y: {
|
| 36 |
+
label: 'Number of Speakers (millions)'
|
| 37 |
},
|
| 38 |
color: {
|
| 39 |
legend: true,
|
| 40 |
+
domain: ['Speakers', 'Cumulative Speakers'],
|
| 41 |
+
range: ['green', 'lightgrey']
|
| 42 |
},
|
| 43 |
marks: [
|
| 44 |
+
Plot.barY(languages, {
|
| 45 |
+
x: 'rank',
|
|
|
|
| 46 |
y: d => d.cumSpeakers / 1e6,
|
| 47 |
+
fill: d => 'Cumulative Speakers',
|
| 48 |
sort: { x: 'y' },
|
| 49 |
+
title: d =>
|
| 50 |
+
`The ${
|
| 51 |
+
d.rank
|
| 52 |
+
} most spoken languages cover\n${d.cumSpeakersPercent.toLocaleString(
|
| 53 |
+
'en-US',
|
| 54 |
+
{ style: 'percent' }
|
| 55 |
+
)} of all speakers`,
|
| 56 |
tip: true // {y: d => d.cumSpeakers / 1e6 * 2}
|
| 57 |
}),
|
| 58 |
+
Plot.barY(languages, {
|
| 59 |
+
x: 'rank',
|
|
|
|
| 60 |
y: d => d.speakers / 1e6,
|
| 61 |
+
title: d =>
|
| 62 |
+
`${d.language_name}\n(${d.speakers.toLocaleString('en-US', {
|
| 63 |
+
notation: 'compact',
|
| 64 |
+
compactDisplay: 'long'
|
| 65 |
+
})} speakers)`,
|
| 66 |
tip: true,
|
| 67 |
+
fill: d => 'Speakers',
|
| 68 |
sort: { x: '-y' }
|
| 69 |
}),
|
| 70 |
+
Plot.crosshairX(languages, {
|
| 71 |
+
x: 'rank',
|
| 72 |
+
y: d => d.cumSpeakers / 1e6,
|
| 73 |
+
textStrokeOpacity: 0,
|
| 74 |
+
textFillOpacity: 0
|
| 75 |
+
}),
|
| 76 |
+
Plot.tip(['The 41 most spoken languages cover 80% of all speakers.'], {
|
| 77 |
+
x: 41,
|
| 78 |
+
y: languages[40].cumSpeakers / 1e6
|
| 79 |
+
})
|
| 80 |
+
]
|
| 81 |
})
|
| 82 |
containerRef.current.append(plot)
|
| 83 |
return () => plot.remove()
|
|
|
|
| 91 |
height: '100%',
|
| 92 |
display: 'flex',
|
| 93 |
alignItems: 'center',
|
| 94 |
+
justifyContent: 'center'
|
| 95 |
}}
|
| 96 |
/>
|
| 97 |
)
|
frontend/src/components/WorldMap.js
CHANGED
|
@@ -44,6 +44,7 @@ const WorldMap = ({ data }) => {
|
|
| 44 |
return acc
|
| 45 |
}, {})
|
| 46 |
const plot = Plot.plot({
|
|
|
|
| 47 |
width: 750,
|
| 48 |
height: 500,
|
| 49 |
projection: 'equal-earth',
|
|
|
|
| 44 |
return acc
|
| 45 |
}, {})
|
| 46 |
const plot = Plot.plot({
|
| 47 |
+
subtitle: 'Language Proficiency Score by Country',
|
| 48 |
width: 750,
|
| 49 |
height: 500,
|
| 50 |
projection: 'equal-earth',
|