ctakes-dictionary-lookup-fast/src/main/java/org/apache/ctakes/dictionary/cased/lookup/LookupToken.java - ctakes - Git at Google

 package org.apache.ctakes.dictionary.cased.lookup;


 import org.apache.ctakes.core.util.Pair;
 import org.apache.ctakes.typesystem.type.syntax.BaseToken;

 import javax.annotation.concurrent.Immutable;

 /**
  * A token of document text together with its character span and cached case information,
  * as used for lookup.
  * <p>
  * Equality and hashing are based solely on the text span, not on the text itself.
  *
  * @author SPF , chip-nlp
  * @version %I%
  * @since 8/13/2020
  */
 @Immutable
 public final class LookupToken {

    private final Pair<Integer> _textSpan;
    private final String _text;
    private final boolean _allCaps;
    private final boolean _allLower;
    private final boolean _isValidIndexToken;

    /**
     * Builds a lookup token from a base token, recording its span, its covered text and
     * whether that text is entirely upper case or entirely lower case.
     * <p>
     * Characters that are neither upper nor lower case (digits, punctuation, ...) are ignored
     * when deciding case, so text with no cased characters is neither all-caps nor all-lower.
     *
     * @param baseToken         token supplying the begin offset, end offset and covered text
     * @param isValidIndexToken flag stored as-is and returned by {@link #isValidIndexToken()}
     */
    public LookupToken( final BaseToken baseToken, final boolean isValidIndexToken ) {
       _textSpan = new Pair<>( baseToken.getBegin(), baseToken.getEnd() );
       // All case-sensitivity is handled here.  This is the text in the note.
       _text = baseToken.getCoveredText();
       boolean anyCaps = false;
       boolean anyLower = false;
       for ( int i = 0; i < _text.length(); i++ ) {
          final char c = _text.charAt( i );
          if ( Character.isUpperCase( c ) ) {
             anyCaps = true;
          } else if ( Character.isLowerCase( c ) ) {
             anyLower = true;
          }
          if ( anyCaps && anyLower ) {
             // Mixed case: neither flag can become true, so stop scanning.
             break;
          }
       }
       _allCaps = anyCaps && !anyLower;
       _allLower = anyLower && !anyCaps;
       _isValidIndexToken = isValidIndexToken;
    }

    /**
     * @return a span with the start and end indices used for this lookup token
     */
    public Pair<Integer> getTextSpan() {
       return _textSpan;
    }

    /**
     * @return the start index used for this lookup token
     */
    public int getBegin() {
       return _textSpan.getValue1();
    }

    /**
     * @return the end index used for this lookup token
     */
    public int getEnd() {
       return _textSpan.getValue2();
    }

    /**
     * @return the length of the token text in characters
     */
    public int getLength() {
       return _text.length();
    }

    /**
     * @return the actual text in the document for the lookup token, with its original case.
     */
    public String getText() {
       return _text;
    }

    /**
     * Lower-casing uses {@link java.util.Locale#ROOT} so that the result does not depend on the
     * default locale of the JVM (for example, a Turkish default locale would otherwise turn
     * "I" into a dotless "ı").
     *
     * @return the text in the document for the lookup token, converted to lower case.
     */
    public String getLowerText() {
       if ( _allLower ) {
          // Already lower case; no conversion needed.
          return _text;
       }
       return _text.toLowerCase( java.util.Locale.ROOT );
    }

    /**
     * @return true if the text has at least one upper case character and no lower case character.
     */
    public boolean isAllUpperCase() {
       return _allCaps;
    }

    /**
     * @return true if the text has at least one lower case character and no upper case character.
     */
    public boolean isAllLowerCase() {
       return _allLower;
    }

    /**
     * @return the valid-index-token flag that was supplied to the constructor
     */
    public boolean isValidIndexToken() {
       return _isValidIndexToken;
    }

    /**
     * Two lookup tokens are equal iff the spans are equal.
     *
     * @param value -
     * @return true if {@code value} is a {@code LookupToken} and has a span equal to this token's span
     */
    @Override
    public boolean equals( final Object value ) {
       return value instanceof LookupToken
              && _textSpan.equals( ((LookupToken)value).getTextSpan() );
    }

    /**
     * @return hashCode created from the Span
     */
    @Override
    public int hashCode() {
       return _textSpan.hashCode();
    }

 }
	package org.apache.ctakes.dictionary.cased.lookup;


	import org.apache.ctakes.core.util.Pair;
	import org.apache.ctakes.typesystem.type.syntax.BaseToken;

	import javax.annotation.concurrent.Immutable;

	/**
	 * A token of document text together with its character span and cached case information,
	 * as used for lookup.
	 * <p>
	 * Equality and hashing are based solely on the text span, not on the text itself.
	 *
	 * @author SPF , chip-nlp
	 * @version %I%
	 * @since 8/13/2020
	 */
	@Immutable
	public final class LookupToken {

	   private final Pair<Integer> _textSpan;
	   private final String _text;
	   private final boolean _allCaps;
	   private final boolean _allLower;
	   private final boolean _isValidIndexToken;

	   /**
	    * Builds a lookup token from a base token, recording its span, its covered text and
	    * whether that text is entirely upper case or entirely lower case.
	    * <p>
	    * Characters that are neither upper nor lower case (digits, punctuation, ...) are ignored
	    * when deciding case, so text with no cased characters is neither all-caps nor all-lower.
	    *
	    * @param baseToken         token supplying the begin offset, end offset and covered text
	    * @param isValidIndexToken flag stored as-is and returned by {@link #isValidIndexToken()}
	    */
	   public LookupToken( final BaseToken baseToken, final boolean isValidIndexToken ) {
	      _textSpan = new Pair<>( baseToken.getBegin(), baseToken.getEnd() );
	      // All case-sensitivity is handled here. This is the text in the note.
	      _text = baseToken.getCoveredText();
	      boolean anyCaps = false;
	      boolean anyLower = false;
	      for ( int i = 0; i < _text.length(); i++ ) {
	         final char c = _text.charAt( i );
	         if ( Character.isUpperCase( c ) ) {
	            anyCaps = true;
	         } else if ( Character.isLowerCase( c ) ) {
	            anyLower = true;
	         }
	         if ( anyCaps && anyLower ) {
	            // Mixed case: neither flag can become true, so stop scanning.
	            break;
	         }
	      }
	      _allCaps = anyCaps && !anyLower;
	      _allLower = anyLower && !anyCaps;
	      _isValidIndexToken = isValidIndexToken;
	   }

	   /**
	    * @return a span with the start and end indices used for this lookup token
	    */
	   public Pair<Integer> getTextSpan() {
	      return _textSpan;
	   }

	   /**
	    * @return the start index used for this lookup token
	    */
	   public int getBegin() {
	      return _textSpan.getValue1();
	   }

	   /**
	    * @return the end index used for this lookup token
	    */
	   public int getEnd() {
	      return _textSpan.getValue2();
	   }

	   /**
	    * @return the length of the token text in characters
	    */
	   public int getLength() {
	      return _text.length();
	   }

	   /**
	    * @return the actual text in the document for the lookup token, with its original case.
	    */
	   public String getText() {
	      return _text;
	   }

	   /**
	    * Lower-casing uses {@link java.util.Locale#ROOT} so that the result does not depend on the
	    * default locale of the JVM (for example, a Turkish default locale would otherwise turn
	    * "I" into a dotless "ı").
	    *
	    * @return the text in the document for the lookup token, converted to lower case.
	    */
	   public String getLowerText() {
	      if ( _allLower ) {
	         // Already lower case; no conversion needed.
	         return _text;
	      }
	      return _text.toLowerCase( java.util.Locale.ROOT );
	   }

	   /**
	    * @return true if the text has at least one upper case character and no lower case character.
	    */
	   public boolean isAllUpperCase() {
	      return _allCaps;
	   }

	   /**
	    * @return true if the text has at least one lower case character and no upper case character.
	    */
	   public boolean isAllLowerCase() {
	      return _allLower;
	   }

	   /**
	    * @return the valid-index-token flag that was supplied to the constructor
	    */
	   public boolean isValidIndexToken() {
	      return _isValidIndexToken;
	   }

	   /**
	    * Two lookup tokens are equal iff the spans are equal.
	    *
	    * @param value -
	    * @return true if {@code value} is a {@code LookupToken} and has a span equal to this token's span
	    */
	   @Override
	   public boolean equals( final Object value ) {
	      return value instanceof LookupToken
	             && _textSpan.equals( ((LookupToken)value).getTextSpan() );
	   }

	   /**
	    * @return hashCode created from the Span
	    */
	   @Override
	   public int hashCode() {
	      return _textSpan.hashCode();
	   }

	}