/**
 * Computes the inverse document frequency idf(w) of a term.
 *
 * The result is the natural logarithm of the total number of strings in
 * `mapGjbz` divided by the number of those strings that contain `c` as a
 * substring.
 *
 * @param c       the term to look for
 * @param mapGjbz the strings to search; each element is tested with `contains(c)`
 * @return `ln(mapGjbz.size / matches)`, or 0 when no element contains `c`
 *         (this also covers an empty `mapGjbz`)
 */
def idf(c: String, mapGjbz: Seq[String]): Double = {
  // Number of elements in which the term occurs at least once.
  val matches = mapGjbz.count(_.contains(c))
  // Guard against division by zero when the term never occurs.
  if (matches == 0) 0.0
  else math.log(mapGjbz.size.toDouble / matches)
}
转载于:https://my.oschina.net/shea1992/blog/1604086