Package org.apache.lucene.index

Examples of org.apache.lucene.index.IndexReader.docFreq()


      Term t = textEnum.term();
      if("txt".equals(t.field())) {
        String text = t.text();
        if(TermSets.getClosedClass().contains(text)) continue;
        if(!text.matches(".*[A-Za-z].*")) continue;
        int docFreq = ir.docFreq(t);
        if(docFreq > 1) {
          docFreqs.put(text, ir.docFreq(t));
        }
      }     
    }
View Full Code Here


        String text = t.text();
        if(TermSets.getClosedClass().contains(text)) continue;
        if(!text.matches(".*[A-Za-z].*")) continue;
        int docFreq = ir.docFreq(t);
        if(docFreq > 1) {
          docFreqs.put(text, ir.docFreq(t));
        }
      }     
    }
    List<String> dfl = StringTools.getSortedList(docFreqs);
    Map<String,Integer> termMap = new HashMap<String,Integer>();
View Full Code Here

      Term t = textEnum.term();
      if("txt".equals(t.field())) {
        String text = t.text();
        if(TermSets.getClosedClass().contains(text)) continue;
        if(!text.matches(".*[A-Za-z].*")) continue;
        int docFreq = ir.docFreq(t);
        if(docFreq > 0) {
          docFreqs.put(text, ir.docFreq(t));
        }
      }     
    }
View Full Code Here

        String text = t.text();
        if(TermSets.getClosedClass().contains(text)) continue;
        if(!text.matches(".*[A-Za-z].*")) continue;
        int docFreq = ir.docFreq(t);
        if(docFreq > 0) {
          docFreqs.put(text, ir.docFreq(t));
        }
      }     
    }
    List<String> dfl = StringTools.getSortedList(docFreqs);
    int maxSize = 20000;
View Full Code Here

      Term t = textEnum.term();
      if("txt".equals(t.field())) {
        String text = t.text();
        if(TermSets.getClosedClass().contains(text)) continue;
        if(!text.matches(".*[A-Za-z].*")) continue;
        int docFreq = ir.docFreq(t);
        if(docFreq > 1) {
          docFreqs.put(text, ir.docFreq(t));
        }
      }     
    }
View Full Code Here

        String text = t.text();
        if(TermSets.getClosedClass().contains(text)) continue;
        if(!text.matches(".*[A-Za-z].*")) continue;
        int docFreq = ir.docFreq(t);
        if(docFreq > 1) {
          docFreqs.put(text, ir.docFreq(t));
        }
      }     
    }
    List<String> dfl = StringTools.getSortedList(docFreqs);
   
View Full Code Here

        for(int j=0;j<lm.getColumnDimension();j++) {
          squareLength += Math.pow(lm.get(i, j), 2);
        }
        double distance = Math.sqrt(squareLength);
        String term = dfl.get(i);
        int docFreq = ir.docFreq(new Term("txt", term));
        double score = Math.log(docFreq) * distance;
        if(score > 1.0) distances.put(dfl.get(i), score);
      }
      out.close();
     
View Full Code Here

      Term t = textEnum.term();
      if("txt".equals(t.field())) {
        String text = t.text();
        if(TermSets.getClosedClass().contains(text)) continue;
        if(!text.matches(".*[A-Za-z].*")) continue;
        int docFreq = ir.docFreq(t);
        if(docFreq > 1) {
          docFreqs.put(text, ir.docFreq(t));
        }
      }     
    }
View Full Code Here

        String text = t.text();
        if(TermSets.getClosedClass().contains(text)) continue;
        if(!text.matches(".*[A-Za-z].*")) continue;
        int docFreq = ir.docFreq(t);
        if(docFreq > 1) {
          docFreqs.put(text, ir.docFreq(t));
        }
      }     
    }
    List<String> dfl = StringTools.getSortedList(docFreqs);

View Full Code Here

    //evd.getD().print(6, 2);

    Map<String,Double> termTots = new HashMap<String,Double>();
    for(int i=0;i<evr.length;i++) {
      for(String term : vectors.get(i).keySet()) {
        if(ir.docFreq(new Term("txt", term)) < 10) continue;
        if(!termTots.containsKey(term)) termTots.put(term, 0.0);
        termTots.put(term, termTots.get(term) + (vectors.get(i).get(term)));
      }
    }
    //System.out.println("termTots: " + termTots.size());
View Full Code Here

TOP
Copyright © 2018 www.massapi.com. All rights reserved.
All source code is the property of its respective owners. Java is a trademark of Sun Microsystems, Inc. and is owned by ORACLE Inc. Contact coftware#gmail.com.