data.table dblp similarity.threshold .9 prefix.extension 1