/**
 * Build a horizontal bar chart counting the rows of `counts` per
 * `pile_set_name`, restricted to rows whose `tokens` value lies in the
 * half-open range (gt, n].
 *
 * Reads `counts`, `colors` and `Plot` from the enclosing scope.
 *
 * @param {number} n - Inclusive upper bound on `tokens`.
 * @param {number} [gt=0] - Exclusive lower bound on `tokens`. When falsy
 *   (the default 0), the caption omits the lower-bound clause.
 * @returns Whatever `Plot.plot` returns for the assembled chart options.
 */
function tokenCounts(n, gt = 0) {
  // The filter below keeps rows with tokens <= n, so the caption says
  // "at most" rather than "less than" to describe what is actually plotted.
  const lowerBoundClause = gt ? ` and more than ${gt} tokens.` : ``;
  const caption = `Count of documents with at most ${n} tokens${lowerBoundClause}`;

  const rowsInRange = counts.filter(d => d.tokens <= n && d.tokens > gt);

  return Plot.plot({
    caption,
    marks: [
      Plot.barX(
        rowsInRange,
        // Group by y (pile_set_name) and use the per-group row count as
        // both the bar length and the tooltip title.
        Plot.groupY(
          { x: "count", title: "count" },
          {
            y: "pile_set_name",
            x: "tokens",
            fill: "pile_set_name",
            // Order the y domain by bar length, reversed, keeping at most 22 groups.
            sort: { y: "x", reverse: true, limit: 22 }
          }
        )
      ),
      // Baseline rule at x = 0.
      Plot.ruleX([0])
    ],
    marginLeft: 120,
    marginRight: 80,
    // NOTE(review): no mark in this function sets an `fy` channel; this
    // facet-scale domain is kept as-is — confirm whether it is still needed.
    fy: {
      domain: ["sub200", "sub4k", "sub8k", "sub32k", "lots"]
    },
    y: {
      label: null
    },
    // Reuse the externally defined color domain.
    color: { domain: colors.domain },
    grid: true,
    height: 300
  });
}