nlpcraft/src/main/scala/org/apache/nlpcraft/model/intent/solver/NCIntentSolverEngine.scala - incubator-nlpcraft - Git at Google

 /*
  * Licensed to the Apache Software Foundation (ASF) under one or more
  * contributor license agreements.  See the NOTICE file distributed with
  * this work for additional information regarding copyright ownership.
  * The ASF licenses this file to You under the Apache License, Version 2.0
  * (the "License"); you may not use this file except in compliance with
  * the License.  You may obtain a copy of the License at
  *
  *      https://www.apache.org/licenses/LICENSE-2.0
  *
  * Unless required by applicable law or agreed to in writing, software
  * distributed under the License is distributed on an "AS IS" BASIS,
  * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  * See the License for the specific language governing permissions and
  * limitations under the License.
  */

 package org.apache.nlpcraft.model.intent.solver

 import com.typesafe.scalalogging.LazyLogging
 import org.apache.nlpcraft.common._
 import org.apache.nlpcraft.common.ascii.NCAsciiTable
 import org.apache.nlpcraft.common.debug.{NCLogGroupToken, NCLogHolder}
 import org.apache.nlpcraft.common.opencensus.NCOpenCensusTrace
 import org.apache.nlpcraft.model.impl.NCTokenLogger
 import org.apache.nlpcraft.model.impl.NCTokenPimp._
 import org.apache.nlpcraft.model.intent.{NCIdlContext, NCIdlFunction, NCIdlIntent, NCIdlIntentOptions, NCIdlTerm, NCIdlStackItem => Z}
 import org.apache.nlpcraft.model.{NCContext, NCDialogFlowItem, NCIntentMatch, NCResult, NCToken}
 import org.apache.nlpcraft.probe.mgrs.dialogflow.NCDialogFlowManager

 import java.util.function.Function
 import java.util.{List => JList}
 import scala.collection.mutable
 import scala.jdk.CollectionConverters.{CollectionHasAsScala, MapHasAsScala, SeqHasAsJava}

 /**
  * Intent solver that finds the best matching intent given user sentence.
  */
 object NCIntentSolverEngine extends LazyLogging with NCOpenCensusTrace {

     /**
      * NOTE: not thread-safe.
      */
     private[solver] class Weight(ws: Int*) extends Ordered[Weight] {
         private var buf = mutable.ArrayBuffer[Int]()

         buf.appendAll(ws)

         /**
          * Adds given weight to this weight.
          *
          * @param that Weight to add.
          * @return
          */
         def +=(that: Weight): Weight = {
             val buf2 = mutable.ArrayBuffer[Int]()

             for (i <- 0 until Math.max(buf.size, that.buf.size))
                 buf2.append(norm(i, buf) + norm(i, that.buf))

             buf = buf2

             this
         }

         /**
          * Appends new weight.
          *
          * @param w New weight to append.
          * @return
          */
         def append(w: Int): Weight = {
             buf.append(w)

             this
         }

         /**
          * Prepends new weight.
          *
          * @param w New weight to prepend.
          * @return
          */
         def prepend(w: Int): Weight = {
             buf.prepend(w)

             this
         }

         /**
          * Sets specific weight at a given index.
          *
          * @param idx
          * @param w
          */
         def setWeight(idx: Int, w: Int): Unit =
             buf(idx) = w

         /**
          * Gets element at given index or zero if index is out of bounds.
          *
          * @param i Index in collection.
          * @param c Collection.
          * @return
          */
         private def norm(i: Int, c: mutable.ArrayBuffer[Int]): Int = if (i < c.size) c(i) else 0

         /**
          *
          * @param that
          * @return
          */
         override def compare(that: Weight): Int = {
             var res = 0

             for (i <- 0 until Math.max(buf.size, that.buf.size) if res == 0)
                 res = Integer.compare(norm(i, buf), norm(i, that.buf))

             res
         }

         def toSeq: Seq[Int] = buf.toSeq
         def toAnsiString: String = buf.mkString(y(bo("[")), ", ", y(bo("]")))
     }

     /**
      *
      * @param used
      * @param token
      */
     private case class IntentToken(
         var used: Boolean,
         var conv: Boolean,
         token: NCToken
     )

     /**
      * @param termId
      * @param usedTokens
      * @param weight
      */
     private case class TermMatch(
         termId: Option[String],
         usedTokens: List[IntentToken],
         weight: Weight
     ) {
         lazy val maxIndex: Int = usedTokens.maxBy(_.token.index).token.index
     }

     /**
      *
      * @param term
      * @param usedTokens
      */
     private case class TermTokensGroup(
         term: NCIdlTerm,
         usedTokens: List[IntentToken]
     )

     /**
      *
      * @param tokenGroups
      * @param weight
      * @param intent
      */
     private case class IntentMatch(
         tokenGroups: List[TermTokensGroup],
         weight: Weight,
         intent: NCIdlIntent
     )

     /**
      * Main entry point for intent engine.
      *
      * @param ctx Query context.
      * @param intents Set of intents to match for.
      * @param logHldr Log holder.
      * @return
      */
     @throws[NCE]
     def solve(
         ctx: NCContext,
         intents: List[(NCIdlIntent /*Intent*/ , NCIntentMatch => NCResult) /*Callback*/ ],
         logHldr: NCLogHolder
     ): List[NCIntentSolverResult] = {
         case class MatchHolder(
             intentMatch: IntentMatch, // Match.
             callback: Function[NCIntentMatch, NCResult], // Callback function.
             variant: NCIntentSolverVariant, // Variant used for the match.
             variantIdx: Int // Variant index.
         )

         val req = ctx.getRequest

         startScopedSpan("solve",
             "srvReqId" -> req.getServerRequestId,
             "userId" -> req.getUser.getId,
             "mdlId" -> ctx.getModel.getId,
             "normText" -> req.getNormalizedText) { _ =>
             val matches = mutable.ArrayBuffer.empty[MatchHolder]

             // Find all matches across all intents and sentence variants.
             for ((vrn, vrnIdx) <- ctx.getVariants.asScala.zipWithIndex) {
                 val availToks = vrn.asScala.filter(t => !t.isStopWord)

                 matches.appendAll(
                     intents.flatMap(pair => {
                         val intent = pair._1
                         val callback = pair._2

                         // Isolated sentence tokens.
                         val senToks = Seq.empty[IntentToken] ++ availToks.map(IntentToken(false, false, _))
                         val senTokGroups = availToks.map(t => if (t.getGroups != null) t.getGroups.asScala.sorted else Seq.empty)

                         // Isolated conversation tokens.
                         val convToks =
                             if (intent.terms.exists(_.conv))
                                 Seq.empty[IntentToken] ++
                                     // We do not mix tokens with same group from the conversation and given sentence.
                                     ctx.getConversation.getTokens.asScala.
                                         filter(t => {
                                             val convTokGroups = t.getGroups.asScala.sorted

                                             !senTokGroups.exists(convTokGroups.containsSlice)
                                         }).
                                         map(IntentToken(used = false, conv = true, _))
                             else
                                 Seq.empty[IntentToken]

                         // Solve intent in isolation.
                         solveIntent(ctx, intent, senToks, convToks, vrnIdx) match {
                             case Some(intentMatch) => Some(MatchHolder(intentMatch, callback, NCIntentSolverVariant(vrn), vrnIdx))
                             case None => None
                         }
                     })
                 )
             }

             val sorted = matches.sortWith((m1: MatchHolder, m2: MatchHolder) =>
                 // 1. First with maximum weight.
                 m1.intentMatch.weight.compare(m2.intentMatch.weight) match {
                     case x1 if x1 < 0 => false
                     case x1 if x1 > 0 => true
                     case x1 =>
                         require(x1 == 0)

                         val mw1 = m1.intentMatch.weight
                         val mw2 = m2.intentMatch.weight

                         val v1 = m1.variant
                         val v2 = m2.variant

                         val tbl = new NCAsciiTable()

                         tbl += (
                             s"${c("Intent ID")}",
                             m1.intentMatch.intent.id,
                             m2.intentMatch.intent.id
                         )
                         tbl += (
                             s"${c("Variant #")}",
                             m1.variantIdx + 1,
                             m2.variantIdx + 1
                         )

                         tbl += (
                             s"${c("Intent Match Weight")}",
                             mw1.toAnsiString,
                             mw2.toAnsiString
                         )

                         tbl += (
                             s"${c("Variant Weight")}",
                             v1.toAnsiString,
                             v2.toAnsiString
                         )

                         logger.warn(
                             s"Two matching intents have the ${y(bo("same weight"))} for their matches (variants weight will be used further):\n" +
                             tbl.toString
                         )

                         // 2. First with maximum variant.
                         m1.variant.compareTo(m2.variant) match {
                             case x2 if x2 < 0 => false
                             case x2 if x2 > 0 => true
                             case x2 =>
                                 require(x2 == 0)

                                 def calcHash(m: MatchHolder): Int = {
                                     val variantPart =
                                         m.variant.
                                             tokens.
                                             asScala.
                                             map(t => s"${t.getId}${t.getGroups}${t.getValue}${t.normText}").
                                             mkString("")

                                     val intentPart = m.intentMatch.intent.toString

                                     (variantPart, intentPart).##
                                 }

                                 // Order doesn't make sense here.
                                 // It is just to provide deterministic result for the matches with the same weights.
                                 calcHash(m1) > calcHash(m2)
                         }
                 }
             )

             if (sorted.nonEmpty) {
                 val tbl = NCAsciiTable("Variant", "Intent", "Term Tokens", "Intent Match Weight")

                 sorted.foreach(m => {
                     val im = m.intentMatch
                     val w = im.weight

                     if (m == sorted.head)
                         tbl += (
                             Seq(
                                 s"#${m.variantIdx + 1}",
                                 g(bo("best match"))
                             ),
                             Seq(
                                 im.intent.id,
                                 g(bo("best match"))
                             ),
                             mkPickTokens(im),
                             w.toAnsiString
                         )
                     else
                         tbl += (
                             s"#${m.variantIdx + 1}",
                             im.intent.id,
                             mkPickTokens(im),
                             w.toAnsiString
                         )

                     if (logHldr != null)
                         logHldr.addIntent(
                             im.intent.id,
                             im.weight.toSeq,
                             im.tokenGroups.map(g =>
                                 g.term.id.getOrElse("") -> g.usedTokens.map(t => NCLogGroupToken(t.token, t.conv, t.used))
                             ).toMap
                         )
                 })

                 tbl.info(logger, Some(s"Found ${sorted.size} matching ${if (sorted.size > 1) "intents" else "intent"} (sorted $G${BO}best$RST to worst):"))
             }
             else
                 logger.info("No matching intent found.")

             sorted.map(m =>
                 NCIntentSolverResult(
                     m.intentMatch.intent.id,
                     m.callback,
                     m.intentMatch.tokenGroups.map(grp => NCIntentTokensGroup(grp.term.id, grp.usedTokens.map(_.token))),
                     m.variant,
                     m.variantIdx
                 )
             ).toList
         }
     }

     /**
      *
      * @param im
      * @return
      */
     private def mkPickTokens(im: IntentMatch): List[String] = {
         val buf = mutable.ListBuffer.empty[String]

         val intent = im.intent

         buf += s"intent=${intent.id}"

         var grpIdx = 0

         for (grp <- im.tokenGroups) {
             buf += s"  ${grp.term.toAnsiString}"

             grpIdx += 1

             if (grp.usedTokens.nonEmpty) {
                 var tokIdx = 0

                 for (tok <- grp.usedTokens) {
                     val conv = if (tok.conv) "(conv) " else ""

                     buf += s"    #$tokIdx: $conv${tok.token}"

                     tokIdx += 1
                 }
             }
             else
                 buf += "    <empty>"
         }

         buf.toList
     }

     /**
      *
      * @param intent
      * @param senToks
      * @param convToks
      * @return
      */
     private def solveIntent(
         ctx: NCContext,
         intent: NCIdlIntent,
         senToks: Seq[IntentToken],
         convToks: Seq[IntentToken],
         varIdx: Int
     ): Option[IntentMatch] = {
         val intentId = intent.id
         val opts = intent.options
         val flow = NCDialogFlowManager.getDialogFlow(ctx.getRequest.getUser.getId, ctx.getModel.getId)
         val varStr = s"(variant #${varIdx + 1})"
         val flowRegex = intent.flowRegex

         var flowMatched = true

         // Check dialog flow regex first, if any.
         if (intent.flowRegex.isDefined) {
             val str = flow.map(_.getIntentId).mkString(" ")

             def x(s: String): Unit = {
                 logger.info(s"Intent '$intentId' $s regex dialog flow $varStr:")
                 logger.info(s"  |-- ${c("Intent IDs  :")} $str")
                 logger.info(s"  +-- ${c("Match regex :")} ${flowRegex.get.toString}")
             }

             if (!flowRegex.get.matcher(str).find(0)) {
                 x(s"${bo(r("did not match"))}")

                 flowMatched = false
             }
             else
                 x(s"matched")
         }
         else if (intent.flowMtdName.isDefined) {
             val clsName = intent.flowClsName.orNull
             val mtdName = intent.flowMtdName.get

             val fqn =
                 s"${if (clsName == null) ctx.getModel.getClass.getName else clsName}." +
                 s"$mtdName(JList[NCDialogFlowItem])"

             val res =
                 try
                     U.callMethod[JList[NCDialogFlowItem], java.lang.Boolean](
                         () => if (clsName == null) ctx.getModel else U.mkObject(clsName),
                         mtdName,
                         flow.toList.asJava
                     )
                 catch {
                     case e: Exception =>
                         throw new NCE(s"Failed to invoke custom flow callback: $fqn", e)
                 }

             def x(s: String): Unit = {
                 logger.info(s"Intent '$intentId' $s custom flow callback $varStr:")
                 logger.info(s"  +-- ${c("Custom callback :")} $fqn")
             }

             if (!res) {
                 x(s"${bo(r("did not match"))}")

                 flowMatched = false
             }
             else
                 x("matched")
         }

         if (flowMatched) {
             val intentW = new Weight()
             val intentGrps = mutable.ListBuffer.empty[TermTokensGroup]
             var abort = false
             var lastTermMatch: TermMatch = null

             // Conversation metadata (shared across all terms).
             val x = ctx.getConversation.getMetadata
             val convMeta = if (x.isEmpty) Map.empty[String, Object] else x.asScala.toMap[String, Object]

             // Check terms.
             for (term <- intent.terms if !abort) {
                 // Fresh context for each term.
                 val termCtx = NCIdlContext(
                     intentMeta = intent.meta,
                     convMeta = convMeta,
                     req = ctx.getRequest,
                     vars = mutable.HashMap.empty[String, NCIdlFunction] ++ term.decls
                 )

                 solveTerm(
                     term,
                     termCtx,
                     senToks,
                     if (term.conv) convToks else Seq.empty
                 ) match {
                     case Some(termMatch) =>
                         if (opts.ordered && lastTermMatch != null && lastTermMatch.maxIndex > termMatch.maxIndex)
                             abort = true
                         else {
                             // Term is found.
                             // Add its weight and grab its tokens.
                             intentW += termMatch.weight
                             intentGrps += TermTokensGroup(term, termMatch.usedTokens)
                             lastTermMatch = termMatch

                             val tbl = NCAsciiTable()

                             val w = termMatch.weight.toSeq

                             tbl += (s"${B}Intent ID$RST", s"$BO${intent.id}$RST")
                             tbl += (s"${B}Matched Term$RST", term.toAnsiString)
                             tbl += (s"${B}Matched Tokens$RST", termMatch.usedTokens.map(t => {
                                 val txt = t.token.getOriginalText
                                 val idx = t.token.getIndex

                                 s"$txt${c("[" + idx + "]")}"
                             }).mkString(" "))
                             tbl += (
                                 s"${B}Term Match Weight$RST",
                                 s"${y("<")}${w.head}, ${w(1)}, ${w(2)}, ${w(3)}, ${w(4)}, ${w(5)}${y(">")}"
                             )

                             tbl.info(logger, Some("Term match found:"))
                         }

                     case None =>
                         // Term is missing. Stop further processing for this intent. This intent cannot be matched.
                         logger.info(s"Intent '$intentId' ${bo(r("did not match"))} because of unmatched term '${term.toAnsiString}' $varStr.")

                         abort = true
                 }
             }

             if (abort)
                 None
             else {
                 val usedSenToks = senToks.filter(_.used)
                 val unusedSenToks = senToks.filter(!_.used)
                 val usedConvToks = convToks.filter(_.used)

                 var res: Option[IntentMatch] = None

                 import NCIdlIntentOptions._

                 if (!opts.allowStmTokenOnly && usedSenToks.isEmpty && usedConvToks.nonEmpty)
                     logger.info(
                         s"Intent '$intentId' ${bo(r("did not match"))} because all its matched tokens came from STM $varStr. " +
                         s"See intent '${c(JSON_ALLOW_STM_ONLY)}' option."
                     )
                 else if (!opts.ignoreUnusedFreeWords && unusedSenToks.exists(_.token.isFreeWord))
                     NCTokenLogger.prepareTable(
                         unusedSenToks.filter(_.token.isFreeWord).map(_.token)
                     ).
                     info(
                         logger,
                         Some(
                             s"Intent '$intentId' ${bo(r("did not match"))} because of unused free words $varStr. " +
                             s"See intent '${c(JSON_UNUSED_FREE_WORDS)}' option. " +
                             s"Unused free words:"
                         )
                     )
                 else if (!opts.ignoreUnusedUserTokens && unusedSenToks.exists(_.token.isUserDefined))
                     NCTokenLogger.prepareTable(
                         unusedSenToks.filter(_.token.isUserDefined).map(_.token)
                     ).
                     info(
                         logger,
                         Some(
                             s"Intent '$intentId' ${bo(r("did not match"))} because of unused user tokens $varStr. " +
                             s"See intent '${c(JSON_UNUSED_USR_TOKS)}' option. " +
                             s"Unused user tokens:"
                         )
                     )
                 else if (!opts.ignoreUnusedSystemTokens && unusedSenToks.exists(tok => !tok.token.isFreeWord && tok.token.isSystemDefined))
                     NCTokenLogger.prepareTable(
                         unusedSenToks.filter(tok => !tok.token.isFreeWord && tok.token.isSystemDefined).map(_.token)
                     ).
                     info(
                         logger,
                         Some(
                             s"Intent '$intentId' ${bo(r("did not match"))} because of unused system tokens $varStr. " +
                             s"See intent '${c(JSON_UNUSED_SYS_TOKS)}' option. " +
                             s"Unused system tokens:"
                         )
                     )
                 else {
                     if (usedSenToks.isEmpty && usedConvToks.isEmpty)
                         logger.warn(s"Intent '$intentId' ${bo(y("matched"))} but no tokens were used $varStr.")

                     // Number of remaining (unused) non-free words in the sentence is a measure of exactness of the match.
                     // The match is exact when all non-free words are used in that match.
                     // Negate to make sure the bigger (smaller negative number) is better.
                     val nonFreeWordNum = -senToks.count(t => !t.used && !t.token.isFreeWord)

                     intentW.prepend(nonFreeWordNum)

                     res = Some(IntentMatch(
                         tokenGroups = intentGrps.toList,
                         weight = intentW,
                         intent = intent
                     ))
                 }

                 res
             }
         }
         else
             None
     }

     /**
      * Solves term.
      *
      * @param term
      * @param ctx
      * @param convToks
      * @param senToks
      * @return
      */
     @throws[NCE]
     private def solveTerm(
         term: NCIdlTerm,
         ctx: NCIdlContext,
         senToks: Seq[IntentToken],
         convToks: Seq[IntentToken]
     ): Option[TermMatch] = {
         if (senToks.isEmpty && convToks.isEmpty)
             logger.warn(s"No tokens available to match on for term '${term.toAnsiString}'.")

         try
             solvePredicate(term.pred, ctx, term.min, term.max, senToks, convToks) match {
                 case Some((usedToks, predWeight)) => Some(
                     TermMatch(
                         term.id,
                         usedToks,
                         // If term match is non-empty we add the following weights:
                         //   - min
                         //   - delta between specified max and normalized max (how close the actual quantity was to the specified one).
                         //   - normalized max
                         // NOTE: 'usedToks' can be empty.
                         predWeight
                             .append(term.min)
                             .append(-(term.max - usedToks.size))
                             // Normalize max quantifier in case of unbound max.
                             .append(if (term.max == Integer.MAX_VALUE) usedToks.size else term.max)
                     )
                 )

                 // Term not found at all.
                 case None => None
             }
         catch {
             case e: Exception => throw new NCE(s"Runtime error processing IDL term: ${term.toAnsiString}", e)
         }
     }

     /**
      * Solves term's predicate.
      *
      * @param pred
      * @param ctx
      * @param min
      * @param max
      * @param senToks
      * @param convToks
      * @return
      */
     @throws[NCE]
     private def solvePredicate(
         pred: (NCToken, NCIdlContext) => Z,
         ctx: NCIdlContext,
         min: Int,
         max: Int,
         senToks: Seq[IntentToken],
         convToks: Seq[IntentToken]
     ): Option[(List[IntentToken], Weight)] = {
         // Algorithm is "hungry", i.e. it will fetch all tokens satisfying item's predicate
         // in entire sentence even if these tokens are separated by other already used tokens
         // and conversation will be used only to get to the 'max' number of the item.

         var usedToks = List.empty[IntentToken]

         var matches = 0
         var tokUses = 0

         val allToks = Seq(senToks, convToks)

         // Collect to the 'max' from sentence & conversation, if possible.
         for (col <- allToks; tok <- col.filter(!_.used) if usedToks.lengthCompare(max) < 0) {
             val Z(res, uses) = pred.apply(tok.token, ctx)

             res match {
                 case b: java.lang.Boolean =>
                     if (b) {
                         matches += 1

                         if (uses > 0) {
                             tokUses += uses
                             usedToks :+= tok
                         }
                     }

                 case _ =>
                     throw new NCE(s"Predicate returned non-boolean result: $res")
             }
         }

         // We couldn't collect even 'min' matches.
         if (matches < min)
             None
         // Term is optional (min == 0) and no matches found (valid result).
         else if (matches == 0) {
             require(min == 0)
             require(usedToks.isEmpty)

             Some(usedToks -> new Weight(0, 0, 0))
         }
         // We've found some matches (and min > 0).
         else {
             require(matches >= min)

             val convSrvReqIds = convToks.map(_.token.getServerRequestId).distinct

             // Number of tokens from the current sentence.
             val senTokNum = usedToks.count(t => !convSrvReqIds.contains(t.token.getServerRequestId))

             // Sum of conversation depths for each token from the conversation.
             // Negated to make sure that bigger (smaller negative number) is better.
             val convDepthsSum = -usedToks.filter(t => convSrvReqIds.contains(t.token.getServerRequestId)).zipWithIndex.map(_._2 + 1).sum

             // Mark found tokens as used.
             usedToks.foreach(_.used = true)

             Some(usedToks -> new Weight(
                 senTokNum,
                 convDepthsSum,
                 tokUses
             ))
         }
     }
 }
	/*
	* Licensed to the Apache Software Foundation (ASF) under one or more
	* contributor license agreements. See the NOTICE file distributed with
	* this work for additional information regarding copyright ownership.
	* The ASF licenses this file to You under the Apache License, Version 2.0
	* (the "License"); you may not use this file except in compliance with
	* the License. You may obtain a copy of the License at
	*
	* https://www.apache.org/licenses/LICENSE-2.0
	*
	* Unless required by applicable law or agreed to in writing, software
	* distributed under the License is distributed on an "AS IS" BASIS,
	* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
	* See the License for the specific language governing permissions and
	* limitations under the License.
	*/

	package org.apache.nlpcraft.model.intent.solver

	import com.typesafe.scalalogging.LazyLogging
	import org.apache.nlpcraft.common._
	import org.apache.nlpcraft.common.ascii.NCAsciiTable
	import org.apache.nlpcraft.common.debug.{NCLogGroupToken, NCLogHolder}
	import org.apache.nlpcraft.common.opencensus.NCOpenCensusTrace
	import org.apache.nlpcraft.model.impl.NCTokenLogger
	import org.apache.nlpcraft.model.impl.NCTokenPimp._
	import org.apache.nlpcraft.model.intent.{NCIdlContext, NCIdlFunction, NCIdlIntent, NCIdlIntentOptions, NCIdlTerm, NCIdlStackItem => Z}
	import org.apache.nlpcraft.model.{NCContext, NCDialogFlowItem, NCIntentMatch, NCResult, NCToken}
	import org.apache.nlpcraft.probe.mgrs.dialogflow.NCDialogFlowManager

	import java.util.function.Function
	import java.util.{List => JList}
	import scala.collection.mutable
	import scala.jdk.CollectionConverters.{CollectionHasAsScala, MapHasAsScala, SeqHasAsJava}

	/**
	* Intent solver that finds the best matching intent given user sentence.
	*/
	object NCIntentSolverEngine extends LazyLogging with NCOpenCensusTrace {

	/**
	* NOTE: not thread-safe.
	*/
	private[solver] class Weight(ws: Int*) extends Ordered[Weight] {
	private var buf = mutable.ArrayBuffer[Int]()

	buf.appendAll(ws)

	/**
	* Adds given weight to this weight.
	*
	* @param that Weight to add.
	* @return
	*/
	def +=(that: Weight): Weight = {
	val buf2 = mutable.ArrayBuffer[Int]()

	for (i <- 0 until Math.max(buf.size, that.buf.size))
	buf2.append(norm(i, buf) + norm(i, that.buf))

	buf = buf2

	this
	}

	/**
	* Appends new weight.
	*
	* @param w New weight to append.
	* @return
	*/
	def append(w: Int): Weight = {
	buf.append(w)

	this
	}

	/**
	* Prepends new weight.
	*
	* @param w New weight to prepend.
	* @return
	*/
	def prepend(w: Int): Weight = {
	buf.prepend(w)

	this
	}

	/**
	* Sets specific weight at a given index.
	*
	* @param idx
	* @param w
	*/
	def setWeight(idx: Int, w: Int): Unit =
	buf(idx) = w

	/**
	* Gets element at given index or zero if index is out of bounds.
	*
	* @param i Index in collection.
	* @param c Collection.
	* @return
	*/
	private def norm(i: Int, c: mutable.ArrayBuffer[Int]): Int = if (i < c.size) c(i) else 0

	/**
	*
	* @param that
	* @return
	*/
	override def compare(that: Weight): Int = {
	var res = 0

	for (i <- 0 until Math.max(buf.size, that.buf.size) if res == 0)
	res = Integer.compare(norm(i, buf), norm(i, that.buf))

	res
	}

	def toSeq: Seq[Int] = buf.toSeq
	def toAnsiString: String = buf.mkString(y(bo("[")), ", ", y(bo("]")))
	}

	/**
	*
	* @param used
	* @param token
	*/
	private case class IntentToken(
	var used: Boolean,
	var conv: Boolean,
	token: NCToken
	)

	/**
	* @param termId
	* @param usedTokens
	* @param weight
	*/
	private case class TermMatch(
	termId: Option[String],
	usedTokens: List[IntentToken],
	weight: Weight
	) {
	lazy val maxIndex: Int = usedTokens.maxBy(_.token.index).token.index
	}

	/**
	*
	* @param term
	* @param usedTokens
	*/
	private case class TermTokensGroup(
	term: NCIdlTerm,
	usedTokens: List[IntentToken]
	)

	/**
	*
	* @param tokenGroups
	* @param weight
	* @param intent
	*/
	private case class IntentMatch(
	tokenGroups: List[TermTokensGroup],
	weight: Weight,
	intent: NCIdlIntent
	)

	/**
	* Main entry point for intent engine.
	*
	* @param ctx Query context.
	* @param intents Set of intents to match for.
	* @param logHldr Log holder.
	* @return
	*/
	@throws[NCE]
	def solve(
	ctx: NCContext,
	intents: List[(NCIdlIntent /Intent/ , NCIntentMatch => NCResult) /Callback/ ],
	logHldr: NCLogHolder
	): List[NCIntentSolverResult] = {
	case class MatchHolder(
	intentMatch: IntentMatch, // Match.
	callback: Function[NCIntentMatch, NCResult], // Callback function.
	variant: NCIntentSolverVariant, // Variant used for the match.
	variantIdx: Int // Variant index.
	)

	val req = ctx.getRequest

	startScopedSpan("solve",
	"srvReqId" -> req.getServerRequestId,
	"userId" -> req.getUser.getId,
	"mdlId" -> ctx.getModel.getId,
	"normText" -> req.getNormalizedText) { _ =>
	val matches = mutable.ArrayBuffer.empty[MatchHolder]

	// Find all matches across all intents and sentence variants.
	for ((vrn, vrnIdx) <- ctx.getVariants.asScala.zipWithIndex) {
	val availToks = vrn.asScala.filter(t => !t.isStopWord)

	matches.appendAll(
	intents.flatMap(pair => {
	val intent = pair._1
	val callback = pair._2

	// Isolated sentence tokens.
	val senToks = Seq.empty[IntentToken] ++ availToks.map(IntentToken(false, false, _))
	val senTokGroups = availToks.map(t => if (t.getGroups != null) t.getGroups.asScala.sorted else Seq.empty)

	// Isolated conversation tokens.
	val convToks =
	if (intent.terms.exists(_.conv))
	Seq.empty[IntentToken] ++
	// We do not mix tokens with same group from the conversation and given sentence.
	ctx.getConversation.getTokens.asScala.
	filter(t => {
	val convTokGroups = t.getGroups.asScala.sorted

	!senTokGroups.exists(convTokGroups.containsSlice)
	}).
	map(IntentToken(used = false, conv = true, _))
	else
	Seq.empty[IntentToken]

	// Solve intent in isolation.
	solveIntent(ctx, intent, senToks, convToks, vrnIdx) match {
	case Some(intentMatch) => Some(MatchHolder(intentMatch, callback, NCIntentSolverVariant(vrn), vrnIdx))
	case None => None
	}
	})
	)
	}

	val sorted = matches.sortWith((m1: MatchHolder, m2: MatchHolder) =>
	// 1. First with maximum weight.
	m1.intentMatch.weight.compare(m2.intentMatch.weight) match {
	case x1 if x1 < 0 => false
	case x1 if x1 > 0 => true
	case x1 =>
	require(x1 == 0)

	val mw1 = m1.intentMatch.weight
	val mw2 = m2.intentMatch.weight

	val v1 = m1.variant
	val v2 = m2.variant

	val tbl = new NCAsciiTable()

	tbl += (
	s"${c("Intent ID")}",
	m1.intentMatch.intent.id,
	m2.intentMatch.intent.id
	)
	tbl += (
	s"${c("Variant #")}",
	m1.variantIdx + 1,
	m2.variantIdx + 1
	)

	tbl += (
	s"${c("Intent Match Weight")}",
	mw1.toAnsiString,
	mw2.toAnsiString
	)

	tbl += (
	s"${c("Variant Weight")}",
	v1.toAnsiString,
	v2.toAnsiString
	)

	logger.warn(
	s"Two matching intents have the ${y(bo("same weight"))} for their matches (variants weight will be used further):\n" +
	tbl.toString
	)

	// 2. First with maximum variant.
	m1.variant.compareTo(m2.variant) match {
	case x2 if x2 < 0 => false
	case x2 if x2 > 0 => true
	case x2 =>
	require(x2 == 0)

	def calcHash(m: MatchHolder): Int = {
	val variantPart =
	m.variant.
	tokens.
	asScala.
	map(t => s"${t.getId}${t.getGroups}${t.getValue}${t.normText}").
	mkString("")

	val intentPart = m.intentMatch.intent.toString

	(variantPart, intentPart).##
	}

	// Order doesn't make sense here.
	// It is just to provide deterministic result for the matches with the same weights.
	calcHash(m1) > calcHash(m2)
	}
	}
	)

	if (sorted.nonEmpty) {
	val tbl = NCAsciiTable("Variant", "Intent", "Term Tokens", "Intent Match Weight")

	sorted.foreach(m => {
	val im = m.intentMatch
	val w = im.weight

	if (m == sorted.head)
	tbl += (
	Seq(
	s"#${m.variantIdx + 1}",
	g(bo("best match"))
	),
	Seq(
	im.intent.id,
	g(bo("best match"))
	),
	mkPickTokens(im),
	w.toAnsiString
	)
	else
	tbl += (
	s"#${m.variantIdx + 1}",
	im.intent.id,
	mkPickTokens(im),
	w.toAnsiString
	)

	if (logHldr != null)
	logHldr.addIntent(
	im.intent.id,
	im.weight.toSeq,
	im.tokenGroups.map(g =>
	g.term.id.getOrElse("") -> g.usedTokens.map(t => NCLogGroupToken(t.token, t.conv, t.used))
	).toMap
	)
	})

	tbl.info(logger, Some(s"Found ${sorted.size} matching ${if (sorted.size > 1) "intents" else "intent"} (sorted $G${BO}best$RST to worst):"))
	}
	else
	logger.info("No matching intent found.")

	sorted.map(m =>
	NCIntentSolverResult(
	m.intentMatch.intent.id,
	m.callback,
	m.intentMatch.tokenGroups.map(grp => NCIntentTokensGroup(grp.term.id, grp.usedTokens.map(_.token))),
	m.variant,
	m.variantIdx
	)
	).toList
	}
	}

	/**
	*
	* @param im
	* @return
	*/
	private def mkPickTokens(im: IntentMatch): List[String] = {
	val buf = mutable.ListBuffer.empty[String]

	val intent = im.intent

	buf += s"intent=${intent.id}"

	var grpIdx = 0

	for (grp <- im.tokenGroups) {
	buf += s" ${grp.term.toAnsiString}"

	grpIdx += 1

	if (grp.usedTokens.nonEmpty) {
	var tokIdx = 0

	for (tok <- grp.usedTokens) {
	val conv = if (tok.conv) "(conv) " else ""

	buf += s" #$tokIdx: $conv${tok.token}"

	tokIdx += 1
	}
	}
	else
	buf += " <empty>"
	}

	buf.toList
	}

	/**
	*
	* @param intent
	* @param senToks
	* @param convToks
	* @return
	*/
	private def solveIntent(
	ctx: NCContext,
	intent: NCIdlIntent,
	senToks: Seq[IntentToken],
	convToks: Seq[IntentToken],
	varIdx: Int
	): Option[IntentMatch] = {
	val intentId = intent.id
	val opts = intent.options
	val flow = NCDialogFlowManager.getDialogFlow(ctx.getRequest.getUser.getId, ctx.getModel.getId)
	val varStr = s"(variant #${varIdx + 1})"
	val flowRegex = intent.flowRegex

	var flowMatched = true

	// Check dialog flow regex first, if any.
	if (intent.flowRegex.isDefined) {
	val str = flow.map(_.getIntentId).mkString(" ")

	def x(s: String): Unit = {
	logger.info(s"Intent '$intentId' $s regex dialog flow $varStr:")
	logger.info(s" \|-- ${c("Intent IDs :")} $str")
	logger.info(s" +-- ${c("Match regex :")} ${flowRegex.get.toString}")
	}

	if (!flowRegex.get.matcher(str).find(0)) {
	x(s"${bo(r("did not match"))}")

	flowMatched = false
	}
	else
	x(s"matched")
	}
	else if (intent.flowMtdName.isDefined) {
	val clsName = intent.flowClsName.orNull
	val mtdName = intent.flowMtdName.get

	val fqn =
	s"${if (clsName == null) ctx.getModel.getClass.getName else clsName}." +
	s"$mtdName(JList[NCDialogFlowItem])"

	val res =
	try
	U.callMethod[JList[NCDialogFlowItem], java.lang.Boolean](
	() => if (clsName == null) ctx.getModel else U.mkObject(clsName),
	mtdName,
	flow.toList.asJava
	)
	catch {
	case e: Exception =>
	throw new NCE(s"Failed to invoke custom flow callback: $fqn", e)
	}

	def x(s: String): Unit = {
	logger.info(s"Intent '$intentId' $s custom flow callback $varStr:")
	logger.info(s" +-- ${c("Custom callback :")} $fqn")
	}

	if (!res) {
	x(s"${bo(r("did not match"))}")

	flowMatched = false
	}
	else
	x("matched")
	}

	if (flowMatched) {
	val intentW = new Weight()
	val intentGrps = mutable.ListBuffer.empty[TermTokensGroup]
	var abort = false
	var lastTermMatch: TermMatch = null

	// Conversation metadata (shared across all terms).
	val x = ctx.getConversation.getMetadata
	val convMeta = if (x.isEmpty) Map.empty[String, Object] else x.asScala.toMap[String, Object]

	// Check terms.
	for (term <- intent.terms if !abort) {
	// Fresh context for each term.
	val termCtx = NCIdlContext(
	intentMeta = intent.meta,
	convMeta = convMeta,
	req = ctx.getRequest,
	vars = mutable.HashMap.empty[String, NCIdlFunction] ++ term.decls
	)

	solveTerm(
	term,
	termCtx,
	senToks,
	if (term.conv) convToks else Seq.empty
	) match {
	case Some(termMatch) =>
	if (opts.ordered && lastTermMatch != null && lastTermMatch.maxIndex > termMatch.maxIndex)
	abort = true
	else {
	// Term is found.
	// Add its weight and grab its tokens.
	intentW += termMatch.weight
	intentGrps += TermTokensGroup(term, termMatch.usedTokens)
	lastTermMatch = termMatch

	val tbl = NCAsciiTable()

	val w = termMatch.weight.toSeq

	tbl += (s"${B}Intent ID$RST", s"$BO${intent.id}$RST")
	tbl += (s"${B}Matched Term$RST", term.toAnsiString)
	tbl += (s"${B}Matched Tokens$RST", termMatch.usedTokens.map(t => {
	val txt = t.token.getOriginalText
	val idx = t.token.getIndex

	s"$txt${c("[" + idx + "]")}"
	}).mkString(" "))
	tbl += (
	s"${B}Term Match Weight$RST",
	s"${y("<")}${w.head}, ${w(1)}, ${w(2)}, ${w(3)}, ${w(4)}, ${w(5)}${y(">")}"
	)

	tbl.info(logger, Some("Term match found:"))
	}

	case None =>
	// Term is missing. Stop further processing for this intent. This intent cannot be matched.
	logger.info(s"Intent '$intentId' ${bo(r("did not match"))} because of unmatched term '${term.toAnsiString}' $varStr.")

	abort = true
	}
	}

	if (abort)
	None
	else {
	val usedSenToks = senToks.filter(_.used)
	val unusedSenToks = senToks.filter(!_.used)
	val usedConvToks = convToks.filter(_.used)

	var res: Option[IntentMatch] = None

	import NCIdlIntentOptions._

	if (!opts.allowStmTokenOnly && usedSenToks.isEmpty && usedConvToks.nonEmpty)
	logger.info(
	s"Intent '$intentId' ${bo(r("did not match"))} because all its matched tokens came from STM $varStr. " +
	s"See intent '${c(JSON_ALLOW_STM_ONLY)}' option."
	)
	else if (!opts.ignoreUnusedFreeWords && unusedSenToks.exists(_.token.isFreeWord))
	NCTokenLogger.prepareTable(
	unusedSenToks.filter(_.token.isFreeWord).map(_.token)
	).
	info(
	logger,
	Some(
	s"Intent '$intentId' ${bo(r("did not match"))} because of unused free words $varStr. " +
	s"See intent '${c(JSON_UNUSED_FREE_WORDS)}' option. " +
	s"Unused free words:"
	)
	)
	else if (!opts.ignoreUnusedUserTokens && unusedSenToks.exists(_.token.isUserDefined))
	NCTokenLogger.prepareTable(
	unusedSenToks.filter(_.token.isUserDefined).map(_.token)
	).
	info(
	logger,
	Some(
	s"Intent '$intentId' ${bo(r("did not match"))} because of unused user tokens $varStr. " +
	s"See intent '${c(JSON_UNUSED_USR_TOKS)}' option. " +
	s"Unused user tokens:"
	)
	)
	else if (!opts.ignoreUnusedSystemTokens && unusedSenToks.exists(tok => !tok.token.isFreeWord && tok.token.isSystemDefined))
	NCTokenLogger.prepareTable(
	unusedSenToks.filter(tok => !tok.token.isFreeWord && tok.token.isSystemDefined).map(_.token)
	).
	info(
	logger,
	Some(
	s"Intent '$intentId' ${bo(r("did not match"))} because of unused system tokens $varStr. " +
	s"See intent '${c(JSON_UNUSED_SYS_TOKS)}' option. " +
	s"Unused system tokens:"
	)
	)
	else {
	if (usedSenToks.isEmpty && usedConvToks.isEmpty)
	logger.warn(s"Intent '$intentId' ${bo(y("matched"))} but no tokens were used $varStr.")

	// Number of remaining (unused) non-free words in the sentence is a measure of exactness of the match.
	// The match is exact when all non-free words are used in that match.
	// Negate to make sure the bigger (smaller negative number) is better.
	val nonFreeWordNum = -senToks.count(t => !t.used && !t.token.isFreeWord)

	intentW.prepend(nonFreeWordNum)

	res = Some(IntentMatch(
	tokenGroups = intentGrps.toList,
	weight = intentW,
	intent = intent
	))
	}

	res
	}
	}
	else
	None
	}

	/**
	* Solves term.
	*
	* @param term
	* @param ctx
	* @param convToks
	* @param senToks
	* @return
	*/
	@throws[NCE]
	private def solveTerm(
	term: NCIdlTerm,
	ctx: NCIdlContext,
	senToks: Seq[IntentToken],
	convToks: Seq[IntentToken]
	): Option[TermMatch] = {
	if (senToks.isEmpty && convToks.isEmpty)
	logger.warn(s"No tokens available to match on for term '${term.toAnsiString}'.")

	try
	solvePredicate(term.pred, ctx, term.min, term.max, senToks, convToks) match {
	case Some((usedToks, predWeight)) => Some(
	TermMatch(
	term.id,
	usedToks,
	// If term match is non-empty we add the following weights:
	// - min
	// - delta between specified max and normalized max (how close the actual quantity was to the specified one).
	// - normalized max
	// NOTE: 'usedToks' can be empty.
	predWeight
	.append(term.min)
	.append(-(term.max - usedToks.size))
	// Normalize max quantifier in case of unbound max.
	.append(if (term.max == Integer.MAX_VALUE) usedToks.size else term.max)
	)
	)

	// Term not found at all.
	case None => None
	}
	catch {
	case e: Exception => throw new NCE(s"Runtime error processing IDL term: ${term.toAnsiString}", e)
	}
	}

	/**
	* Solves term's predicate.
	*
	* @param pred
	* @param ctx
	* @param min
	* @param max
	* @param senToks
	* @param convToks
	* @return
	*/
	@throws[NCE]
	private def solvePredicate(
	pred: (NCToken, NCIdlContext) => Z,
	ctx: NCIdlContext,
	min: Int,
	max: Int,
	senToks: Seq[IntentToken],
	convToks: Seq[IntentToken]
	): Option[(List[IntentToken], Weight)] = {
	// Algorithm is "hungry", i.e. it will fetch all tokens satisfying item's predicate
	// in entire sentence even if these tokens are separated by other already used tokens
	// and conversation will be used only to get to the 'max' number of the item.

	var usedToks = List.empty[IntentToken]

	var matches = 0
	var tokUses = 0

	val allToks = Seq(senToks, convToks)

	// Collect to the 'max' from sentence & conversation, if possible.
	for (col <- allToks; tok <- col.filter(!_.used) if usedToks.lengthCompare(max) < 0) {
	val Z(res, uses) = pred.apply(tok.token, ctx)

	res match {
	case b: java.lang.Boolean =>
	if (b) {
	matches += 1

	if (uses > 0) {
	tokUses += uses
	usedToks :+= tok
	}
	}

	case _ =>
	throw new NCE(s"Predicate returned non-boolean result: $res")
	}
	}

	// We couldn't collect even 'min' matches.
	if (matches < min)
	None
	// Term is optional (min == 0) and no matches found (valid result).
	else if (matches == 0) {
	require(min == 0)
	require(usedToks.isEmpty)

	Some(usedToks -> new Weight(0, 0, 0))
	}
	// We've found some matches (and min > 0).
	else {
	require(matches >= min)

	val convSrvReqIds = convToks.map(_.token.getServerRequestId).distinct

	// Number of tokens from the current sentence.
	val senTokNum = usedToks.count(t => !convSrvReqIds.contains(t.token.getServerRequestId))

	// Sum of conversation depths for each token from the conversation.
	// Negated to make sure that bigger (smaller negative number) is better.
	val convDepthsSum = -usedToks.filter(t => convSrvReqIds.contains(t.token.getServerRequestId)).zipWithIndex.map(_._2 + 1).sum

	// Mark found tokens as used.
	usedToks.foreach(_.used = true)

	Some(usedToks -> new Weight(
	senTokNum,
	convDepthsSum,
	tokUses
	))
	}
	}
	}