# Empirical CDF of `similarity`, drawn as one step curve per `alg_name`.
ggplot(data, aes(x = similarity, colour = alg_name, group = alg_name)) +
  stat_ecdf(geom = "step") +
  labs(x = "SIM", y = "Fraction of jobs") +
  scale_colour_brewer(palette = "Set2") +
  theme(legend.position = "bottom")
# No plot object is passed, so ggsave() writes the most recently built plot.
ggsave(filename = "ecdf.png")
# Keep only the rows whose similarity is at least 0.5.
e <- data %>%
  filter(similarity >= 0.5)

# Empirical CDF of the filtered rows, one step curve per `alg_name`.
ggplot(e, aes(x = similarity, colour = alg_name, group = alg_name)) +
  stat_ecdf(geom = "step") +
  labs(x = "SIM", y = "Fraction of jobs") +
  scale_colour_brewer(palette = "Set2") +
  theme(legend.position = "bottom")

# Print per-column summary statistics of the filtered rows.
print(summary(e))

# No plot object is passed, so ggsave() writes the most recently built plot
# (the filtered ECDF above; printing the summary does not change it).
ggsave(filename = "ecdf-0.5.png")
# Histogram of `similarity` for the jobs, one facet row per `alg_name`
# (bin width 0.025, facet strips switched to the left-hand side).
#
# - `group` is mapped inside aes(); passed directly to ggplot() it is not
#   treated as an aesthetic mapping.
# - The bars are coloured through the `fill` aesthetic (the outline is a
#   constant black), so the Brewer palette has to be attached to the fill
#   scale; a colour scale would have nothing to act on.
# - The y axis is limited to [0, 100]; scales::squish clamps taller bars to
#   the limit instead of dropping them, hence "cropped at 100" in the label.
#   The function is namespace-qualified so it resolves even when the scales
#   package is not attached.
ggplot(data, aes(x = similarity, fill = alg_name, group = alg_name)) +
  geom_histogram(color = "black", binwidth = 0.025) +
  facet_grid(alg_name ~ ., switch = "y") +
  scale_y_continuous(limits = c(0, 100), oob = scales::squish) +
  scale_fill_brewer(palette = "Set2") +
  ylab("Count (cropped at 100)")