= udf { (document0: String, document1: String) =>
  // Predicate: true when the two "@@@"-delimited documents share more than
  // 80% of their distinct tokens, measured against EACH document's own
  // token set (so both sides must be mostly covered by the intersection).
  val minOverlapRatio = 0.8

  if (document0 == null || document1 == null) {
    // A null document has no tokens to compare; report "no match" instead of
    // failing with a NullPointerException on .split.
    false
  } else {
    val tokens0 = document0.split("@@@").toSet
    val tokens1 = document1.split("@@@").toSet

    if (tokens0.isEmpty || tokens1.isEmpty) {
      // String.split drops trailing empty strings, so an input consisting only
      // of delimiters yields no tokens; avoid dividing by zero below.
      false
    } else {
      // Convert to Double before dividing: Int / Int truncates to 0 or 1, which
      // would make the threshold pass only when the sets are identical.
      val sharedCount = tokens0.intersect(tokens1).size.toDouble
      sharedCount / tokens0.size > minOverlapRatio &&
        sharedCount / tokens1.size > minOverlapRatio
    }
  }
}

// Join df1 with df2, keeping the row pairs for which intersectFn holds on
// df1.str_col1 and df2.str_col2.
// NOTE(review): the condition is a UDF predicate rather than a column
// equality, so it is presumably evaluated per candidate row pair — confirm the
// physical plan is acceptable for the input sizes.
val jdf = {
  val overlapCondition = intersectFn(df1("str_col1"), df2("str_col2"))
  df1.join(df2, overlapCondition)
}