blob: 4480d7814015c679cbe35599af198e138ec97757 [file] [log] [blame]
package org.qcri.rheem.apps.simwords
/**
* Splits lines of text into lower-cased word tokens.
*/
class TextScrubber {

  /**
   * Splits a line into tokens and appends each non-empty token, lower-cased, to `collector`.
   *
   * The line is split at every character that matches the regex `\W`. With the default
   * `java.util.regex` flags this means every character other than `a-z`, `A-Z`, `0-9`
   * and `_`, so punctuation, whitespace and non-ASCII letters all act as separators.
   * Empty tokens produced by adjacent separators are dropped.
   *
   * @param line      the text to tokenize
   * @param collector list that the resulting tokens are appended to, in order of appearance
   */
  def splitAndScrub(line: String, collector: java.util.List[String]): Unit = {
    for (token <- TextScrubber.NonWord.split(line) if token.nonEmpty) {
      // Locale.ROOT keeps the output independent of the JVM's default locale; e.g. under a
      // Turkish default locale a plain toLowerCase would turn "I" into dotless "ı".
      collector.add(token.toLowerCase(java.util.Locale.ROOT))
    }
  }
}

/** Holds the precompiled separator pattern shared by all [[TextScrubber]] instances. */
object TextScrubber {
  // Compiled once instead of on every call; behaves exactly like String.split("""\W""").
  private val NonWord = java.util.regex.Pattern.compile("""\W""")
}