Package org.apache.lucene.util

Examples of org.apache.lucene.util.AttributeSource


      if (!processedTerms.contains(term)) {
        processedTerms.add(term);
        ScoreTermQueue variantsQ = new ScoreTermQueue(MAX_VARIANTS_PER_TERM); //maxNum variants considered for any one term
        float minScore = 0;
        Term startTerm = new Term(f.fieldName, term);
        AttributeSource atts = new AttributeSource();
        MaxNonCompetitiveBoostAttribute maxBoostAtt =
            atts.addAttribute(MaxNonCompetitiveBoostAttribute.class);
        SlowFuzzyTermsEnum fe = new SlowFuzzyTermsEnum(terms, atts, startTerm, f.minSimilarity, f.prefixLength);
        //store the df so all variants use same idf
        int df = reader.docFreq(startTerm);
        int numVariants = 0;
        int totalVariantDocFreqs = 0;
View Full Code Here


        copy( this, replacement.next() );
        return true;
      }

      // common case fast-path of first token not matching anything
      AttributeSource firstTok = nextTok();
      if ( firstTok == null ) {
        return false;
      }
      TermAttribute termAtt = firstTok.addAttribute( TermAttribute.class );
      SynonymMap result = map.submap != null ? map.submap
          .get( termAtt.termBuffer(), 0, termAtt.termLength() ) : null;
      if ( result == null ) {
        copy( this, firstTok );
        return true;
      }

      // fast-path failed, clone ourselves if needed
      if ( firstTok == this ) {
        firstTok = cloneAttributes();
      }
      // OK, we matched a token, so find the longest match.

      matched = new LinkedList<AttributeSource>();

      result = match( result );

      if ( result == null ) {
        // no match, simply return the first token read.
        copy( this, firstTok );
        return true;
      }

      // reuse, or create new one each time?
      ArrayList<AttributeSource> generated = new ArrayList<AttributeSource>( result.synonyms.length + matched.size() + 1 );

      //
      // there was a match... let's generate the new tokens, merging
      // in the matched tokens (position increments need adjusting)
      //
      AttributeSource lastTok = matched.isEmpty() ? firstTok : matched.getLast();
      boolean includeOrig = result.includeOrig();

      AttributeSource origTok = includeOrig ? firstTok : null;
      PositionIncrementAttribute firstPosIncAtt = firstTok.addAttribute( PositionIncrementAttribute.class );
      int origPos = firstPosIncAtt.getPositionIncrement()// position of origTok in the original stream
      int repPos = 0; // curr position in replacement token stream
      int pos = 0// current position in merged token stream

      for ( int i = 0; i < result.synonyms.length; i++ ) {
        Token repTok = result.synonyms[i];
        AttributeSource newTok = firstTok.cloneAttributes();
        TermAttribute newTermAtt = newTok.addAttribute( TermAttribute.class );
        OffsetAttribute newOffsetAtt = newTok.addAttribute( OffsetAttribute.class );
        PositionIncrementAttribute newPosIncAtt = newTok.addAttribute( PositionIncrementAttribute.class );

        OffsetAttribute lastOffsetAtt = lastTok.addAttribute( OffsetAttribute.class );

        newOffsetAtt.setOffset( newOffsetAtt.startOffset(), lastOffsetAtt.endOffset() );
        newTermAtt.setTermBuffer( repTok.termBuffer(), 0, repTok.termLength() );
View Full Code Here

  private SynonymMap match(SynonymMap map) throws IOException {
    SynonymMap result = null;

    if ( map.submap != null ) {
      AttributeSource tok = nextTok();
      if ( tok != null ) {
        // clone ourselves.
        if ( tok == this ) {
          tok = cloneAttributes();
        }
        // check for positionIncrement!=1?  if>1, should not match, if==0, check multiple at this level?
        TermAttribute termAtt = tok.getAttribute( TermAttribute.class );
        SynonymMap subMap = map.submap.get( termAtt.termBuffer(), 0, termAtt.termLength() );

        if ( subMap != null ) {
          // recurse
          result = match( subMap );
View Full Code Here

  /** Sole constructor (for invocation by subclass constructors only). */
  protected TermsEnum() {
  }

  /** Returns the related attributes. */
  public AttributeSource attributes() {
    if (atts == null) atts = new AttributeSource();
    return atts;
  }
View Full Code Here

   */
  private DocsEnum getOther(DocsEnum de) {
    if (de == null) {
      return null;
    } else {
      final AttributeSource atts = de.attributes();
      return atts.addAttribute(PulsingEnumAttribute.class).enums().get(this);
    }
  }
View Full Code Here

  /**
   * for a docsenum, sets the 'other' reused enum.
   * see getOther for an example.
   */
  private DocsEnum setOther(DocsEnum de, DocsEnum other) {
    final AttributeSource atts = de.attributes();
    return atts.addAttribute(PulsingEnumAttribute.class).enums().put(this, other);
  }
View Full Code Here

   * @throws IOException If I/O related errors occur
   */
  protected Collection<ScoreTerm> suggestSimilar(Term term, int numSug, IndexReader ir, int docfreq, int editDistance,
                                                 float accuracy, final CharsRef spare) throws IOException {
   
    AttributeSource atts = new AttributeSource();
    MaxNonCompetitiveBoostAttribute maxBoostAtt =
      atts.addAttribute(MaxNonCompetitiveBoostAttribute.class);
    Terms terms = MultiFields.getTerms(ir, term.field());
    if (terms == null) {
      return Collections.emptyList();
    }
    FuzzyTermsEnum e = new FuzzyTermsEnum(terms, atts, term, editDistance, Math.max(minPrefix, editDistance-1), true);
View Full Code Here

      if (!processedTerms.contains(term)) {
        processedTerms.add(term);
        ScoreTermQueue variantsQ = new ScoreTermQueue(MAX_VARIANTS_PER_TERM); //maxNum variants considered for any one term
        float minScore = 0;
        Term startTerm = new Term(f.fieldName, term);
        AttributeSource atts = new AttributeSource();
        MaxNonCompetitiveBoostAttribute maxBoostAtt =
            atts.addAttribute(MaxNonCompetitiveBoostAttribute.class);
        SlowFuzzyTermsEnum fe = new SlowFuzzyTermsEnum(terms, atts, startTerm, f.minSimilarity, f.prefixLength);
        //store the df so all variants use same idf
        int df = reader.docFreq(startTerm);
        int numVariants = 0;
        int totalVariantDocFreqs = 0;
View Full Code Here

        copy(this, replacement.next());
        return true;
      }

      // common case fast-path of first token not matching anything
      AttributeSource firstTok = nextTok();
      if (firstTok == null) return false;
      CharTermAttribute termAtt = firstTok.addAttribute(CharTermAttribute.class);
      SlowSynonymMap result = map.submap!=null ? map.submap.get(termAtt.buffer(), 0, termAtt.length()) : null;
      if (result == null) {
        copy(this, firstTok);
        return true;
      }

      // fast-path failed, clone ourselves if needed
      if (firstTok == this)
        firstTok = cloneAttributes();
      // OK, we matched a token, so find the longest match.

      matched = new LinkedList<>();

      result = match(result);

      if (result==null) {
        // no match, simply return the first token read.
        copy(this, firstTok);
        return true;
      }

      // reuse, or create new one each time?
      ArrayList<AttributeSource> generated = new ArrayList<>(result.synonyms.length + matched.size() + 1);

      //
      // there was a match... let's generate the new tokens, merging
      // in the matched tokens (position increments need adjusting)
      //
      AttributeSource lastTok = matched.isEmpty() ? firstTok : matched.getLast();
      boolean includeOrig = result.includeOrig();

      AttributeSource origTok = includeOrig ? firstTok : null;
      PositionIncrementAttribute firstPosIncAtt = firstTok.addAttribute(PositionIncrementAttribute.class);
      int origPos = firstPosIncAtt.getPositionIncrement()// position of origTok in the original stream
      int repPos=0; // curr position in replacement token stream
      int pos=0// current position in merged token stream

      for (int i=0; i<result.synonyms.length; i++) {
        Token repTok = result.synonyms[i];
        AttributeSource newTok = firstTok.cloneAttributes();
        CharTermAttribute newTermAtt = newTok.addAttribute(CharTermAttribute.class);
        OffsetAttribute newOffsetAtt = newTok.addAttribute(OffsetAttribute.class);
        PositionIncrementAttribute newPosIncAtt = newTok.addAttribute(PositionIncrementAttribute.class);

        OffsetAttribute lastOffsetAtt = lastTok.addAttribute(OffsetAttribute.class);

        newOffsetAtt.setOffset(newOffsetAtt.startOffset(), lastOffsetAtt.endOffset());
        newTermAtt.copyBuffer(repTok.buffer(), 0, repTok.length());
View Full Code Here

  private SlowSynonymMap match(SlowSynonymMap map) throws IOException {
    SlowSynonymMap result = null;

    if (map.submap != null) {
      AttributeSource tok = nextTok();
      if (tok != null) {
        // clone ourselves.
        if (tok == this)
          tok = cloneAttributes();
        // check for positionIncrement!=1?  if>1, should not match, if==0, check multiple at this level?
        CharTermAttribute termAtt = tok.getAttribute(CharTermAttribute.class);
        SlowSynonymMap subMap = map.submap.get(termAtt.buffer(), 0, termAtt.length());

        if (subMap != null) {
          // recurse
          result = match(subMap);
View Full Code Here

TOP

Related Classes of org.apache.lucene.util.AttributeSource

Copyright © 2018 www.massapi.com. All rights reserved.
All source code is the property of its respective owners. Java is a trademark of Sun Microsystems, Inc. and is owned by Oracle, Inc. Contact: coftware@gmail.com.