in src/main/scala/com/twitter/penguin/korean/tokenizer/ParsedChunk.scala [75:94]
/**
 * Score flag for the part-of-speech makeup of this chunk.
 *
 * Note the encoding: the result is 0 when every token in `posNodes` is
 * tagged `Noun` or `ProperNoun` (including the case of no tokens at all),
 * and 1 as soon as any token carries a different tag.
 */
def isAllNouns = {
  val onlyNouns = posNodes.forall { node =>
    node.pos == Noun || node.pos == ProperNoun
  }
  if (onlyNouns) 0 else 1
}
/**
 * Score flag for two-token chunks whose tag sequence is preferred.
 *
 * Yields 0 when `posNodes` has exactly two tokens and their sequence of
 * `pos` values is contained in `profile.preferredPatterns`; yields 1 in
 * every other case. The pattern lookup is only performed for two-token
 * chunks.
 */
def isPreferredPattern = posNodes.size match {
  case 2 if profile.preferredPatterns.contains(posNodes.map(_.pos)) => 0
  case _ => 1
}
/**
 * Score flag for chunks that open with a preferred tag followed by a
 * "하" verb.
 *
 * Yields 0 when all of the following hold, and 1 otherwise:
 *  - there are at least two tokens,
 *  - the first token's `pos` is a member of `preferredBeforeHaVerb`,
 *  - the second token is tagged `Verb`,
 *  - the second token's text starts with "하".
 */
def isNounHa = {
  val opensWithNounHa = this.posNodes.size >= 2 && {
    // Safe to index here: the size guard above has already passed.
    val first = this.posNodes.head
    val second = this.posNodes(1)
    preferredBeforeHaVerb.contains(first.pos) &&
      second.pos == Verb &&
      second.text.startsWith("하")
  }
  if (opensWithNounHa) 0 else 1
}
/**
 * Sum of the `pos.id` values of all tokens in `posNodes`.
 *
 * An empty chunk sums to zero.
 */
def posTieBreaker = {
  val posIds = this.posNodes.map(node => node.pos.id)
  posIds.sum
}
/**
 * Total number of characters covered by tokens flagged as `unknown`.
 *
 * Each token whose `unknown` flag is set contributes the length of its
 * `text`; every other token contributes nothing.
 */
def getUnknownCoverage = this.posNodes.map {
  case token: KoreanToken if token.unknown => token.text.length
  case _: KoreanToken => 0
}.sum