package com.gentics.cr.lucene.search.highlight;
import java.io.IOException;
import org.apache.log4j.Logger;
import org.apache.lucene.index.IndexReader;
import org.apache.lucene.search.Query;
import org.apache.lucene.search.vectorhighlight.FastVectorHighlighter;
import org.apache.lucene.search.vectorhighlight.FieldQuery;
import org.apache.lucene.search.vectorhighlight.SimpleFragListBuilder;
import org.apache.lucene.search.vectorhighlight.WhitespaceFragmentsBuilder;
import com.gentics.cr.configuration.GenericConfiguration;
import com.gentics.cr.monitoring.MonitorFactory;
import com.gentics.cr.monitoring.UseCase;
/**
* WhitespaceVectorBolder.
* Last changed: $Date: 2009-06-26 15:48:16 +0200 (Fr, 26 Jun 2009) $
* @version $Revision: 105 $
* @author $Author: supnig@constantinopel.at $
*
*/
public class WhitespaceVectorBolder extends AdvancedContentHighlighter {
/**
* Log4j logger for error and debug messages.
*/
private static final Logger LOGGER = Logger.getLogger(WhitespaceVectorBolder.class);
/**
* default value for max frequents.
*/
private static final int DEFAULT_MAX_FRAGMENTS = 3;
/**
* default fragment size.
*/
private static final int DEFAULT_FRAGMENT_SIZE = 100;
/**
* Create new Instance of PhraseBolder.
* @param config config
*/
public WhitespaceVectorBolder(final GenericConfiguration config) {
super(config);
}
/**
* @param parsedQuery query.
* @param reader reader.
* @param docId docid.
* @param fieldName fieldname.
* @return string.
*/
public final String highlight(final Query parsedQuery, final IndexReader reader, final int docId,
final String fieldName) {
UseCase uc = MonitorFactory.startUseCase("Highlight.WhitespaceVectorBolder.highlight()");
StringBuilder result = new StringBuilder();
if (fieldName != null && parsedQuery != null) {
FastVectorHighlighter highlighter = new FastVectorHighlighter(true, true, new SimpleFragListBuilder(),
new WhitespaceFragmentsBuilder(new String[] { getHighlightPrefix() },
new String[] { getHighlightPostfix() }));
FieldQuery fieldQuery = highlighter.getFieldQuery(parsedQuery);
//highlighter.setTextFragmenter(new WordCountFragmenter(fragmentSize));
//TokenStream tokenStream = analyzer.tokenStream(
// this.getHighlightAttribute(), new StringReader(attribute));
try {
UseCase ucFragments = MonitorFactory
.startUseCase("Highlight.WhitespaceVectorBolder.highlight()#getFragments");
//TextFragment[] frags = highlighter.getBestTextFragments(tokenStream,
// attribute, true, numMaxFragments);
String[] frags = highlighter.getBestFragments(
fieldQuery,
reader,
docId,
fieldName,
getFragmentSize(),
getMaxFragments());
ucFragments.stop();
boolean first = true;
if (frags != null) {
for (String frag : frags) {
frag = frag.replaceAll(REMOVE_TEXT_FROM_FRAGMENT_REGEX, "");
if (!first) {
result.append(getFragmentSeperator());
} else {
first = false;
}
result.append(frag);
}
}
} catch (IOException e) {
LOGGER.error("Error getting fragments from highlighter.", e);
}
}
uc.stop();
return result.toString();
}
@Override
protected final int getDefaultFragmentSize() {
return DEFAULT_FRAGMENT_SIZE;
}
@Override
protected final int getDefaultMaxFragments() {
return DEFAULT_MAX_FRAGMENTS;
}
}