// Share (in percent) of each `type` within every `genderLabel` group.
// The resulting table is left grouped by `genderLabel`, exactly as the
// final groupby/derive pair produces it.
probability_by_gender = data_work
  // Drop exact duplicate rows before picking one row per item.
  .dedupe()
  // With the rows ordered by date, the slice below keeps the first row
  // of each (item, itemLabel) group in that order.
  .orderby("date")
  .groupby("item", "itemLabel")
  .slice(0, 1)
  // Attach the columns of data_artistes, matched on "item".
  // NOTE(review): genderLabel / type presumably come from one of the two
  // joined tables — confirm which against their schemas.
  .join_left(data_artistes, "item")
  .ungroup()
  // One row per (genderLabel, type) pair with its row count in `count`.
  .groupby("genderLabel", "type")
  .count()
  .ungroup()
  // op.sum aggregates within each genderLabel group, so `share` is the
  // percentage each type represents inside its own gender group.
  .groupby("genderLabel")
  .derive({
    share: row => (100 * row.count) / op.sum(row.count)
  })