Examples of tokenize()


Examples of opennlp.tools.tokenize.Tokenizer.tokenize()

    return model.eval(mContextGenerator.getContext(text));
  }

  public double[] categorize(String documentText) {
    Tokenizer tokenizer = SimpleTokenizer.INSTANCE;
    return categorize(tokenizer.tokenize(documentText));
  }

  public String getBestCategory(double[] outcome) {
    return model.getBestOutcome(outcome);
  }
View Full Code Here

Examples of opennlp.tools.tokenize.Tokenizer.tokenize()

   */
  public SentencesToTree(String text, TokenizerModel model){
    /* Configure the tokenizer with preloaded model */
    Tokenizer tokenizer = new TokenizerME(model);
    /* tokens has an array of strings, where each string is a token */
    String s = spaces(tokenizer.tokenize(text));
    this.text = this.upperCase(s);
  }
 
  /**
   *
 
View Full Code Here

Examples of opennlp.tools.tokenize.Tokenizer.tokenize()

   * Categorizes the given text. The text is tokenized with the SimpleTokenizer before it
   * is passed to the feature generation.
   */
  public double[] categorize(String documentText) {
    Tokenizer tokenizer = SimpleTokenizer.INSTANCE;
    return categorize(tokenizer.tokenize(documentText));
  }

  public String getBestCategory(double[] outcome) {
    return model.getBestOutcome(outcome);
  }
View Full Code Here

Examples of opennlp.tools.tokenize.TokenizerME.tokenize()

   */
  public SentencesToTree(String text, TokenizerModel model){
    /* Configure the tokenizer with preloaded model */
    Tokenizer tokenizer = new TokenizerME(model);
    /* tokens has an array of strings, where each string is a token */
    String s = spaces(tokenizer.tokenize(text));
    this.text = this.upperCase(s);
  }
 
  /**
   *
 
View Full Code Here

Examples of org.antlr.v4.runtime.tree.pattern.ParseTreePatternMatcher.tokenize()

      rawGenerateAndBuildRecognizer("X1.g4", grammar, "X1Parser", "X1Lexer", false);
    assertTrue(ok);

    ParseTreePatternMatcher m = getPatternMatcher("X1");

    List<? extends Token> tokens = m.tokenize("<ID> = <expr> ;");
    String results = tokens.toString();
    String expected = "[ID:3, [@-1,1:1='=',<1>,1:1], expr:7, [@-1,1:1=';',<2>,1:1]]";
    assertEquals(expected, results);
  }
View Full Code Here

Examples of org.antlr.works.grammar.syntax.GrammarSyntaxLexer.tokenize()

            }

        }

        GrammarSyntaxLexer lexer = new GrammarSyntaxLexer();
        lexer.tokenize(content);

        ParseProperties parser = new ParseProperties();
        parser.parse(lexer.getTokens());
        return parser.propertiesTokens;
    }
View Full Code Here

Examples of org.apache.qpid.framing.AMQShortString.tokenize()

                List<AMQQueue> queueList2 = _wildCardBindingKey2queues.putIfAbsent(routingKey, new CopyOnWriteArrayList<AMQQueue>());

                if(queueList2 == null)
                {
                    queueList2 = _wildCardBindingKey2queues.get(routingKey);
                    AMQShortStringTokenizer keyTok = routingKey.tokenize(TOPIC_SEPARATOR);

                    ArrayList<AMQShortString> keyTokList = new ArrayList<AMQShortString>(keyTok.countTokens());

                    while (keyTok.hasMoreTokens())
                    {
View Full Code Here

Examples of org.apache.stanbol.enhancer.engines.entitylinking.LabelTokenizer.tokenize()

    public String[] tokenize(String label,String language){
        for(ServiceReference ref : getTokenizers(language)){
            LabelTokenizer tokenizer = (LabelTokenizer)labelTokenizerTracker.getService(ref);
            if(tokenizer != null){
                log.trace(" > use Tokenizer {} for language {}",tokenizer.getClass(),language);
                String[] tokens = tokenizer.tokenize(label, language);
                if(tokens != null){
                    if(log.isTraceEnabled()){
                        log.trace("   - tokenized {} -> {}",label, Arrays.toString(tokens));
                    }
                    return tokens;
View Full Code Here

Examples of org.eclipse.assemblyformatter.ir.Formatter.tokenize()

        MessageDialog.openError(shell, e.getClass().getCanonicalName(),
            e.getMessage());
      }

      final String directory = "E:\\assembly-formatter\\debug\\";
      formatter.tokenize();
      try {
        formatter.writeSectionList(directory
            + "section-list tokenize().xml");
      } catch (ParserConfigurationException e) {
        MessageDialog.openError(shell, e.getClass().getCanonicalName(),
View Full Code Here

Examples of org.folg.places.standardize.Normalizer.tokenize()

            StringBuilder reversedWord = new StringBuilder(nextLine);
            reversedWordsWriter.println(reversedWord.reverse());
         }

         if ( (useTokenizer) && (lineCount % TOKENIZE_EVERY_N == 0) ){
            List<List<String>> levels = normalizer.tokenize(nextLine);
            for (List<String> levelWords : levels) {
               tokenizerPlacesCountCC.addAll(levelWords);
               totalTokenizerPlacesCount += levelWords.size();
            }
         }
View Full Code Here
TOP
Copyright © 2018 www.massapi.com. All rights reserved.
All source code is the property of its respective owners. Java is a trademark of Sun Microsystems, Inc. and is owned by ORACLE Inc. Contact coftware#gmail.com.