當前位置: 首頁>>代碼示例>>Java>>正文


Java AttributeSource.State方法代碼示例

本文整理匯總了Java中org.apache.lucene.util.AttributeSource.State方法的典型用法代碼示例。如果您正苦於以下問題:Java AttributeSource.State方法的具體用法?Java AttributeSource.State怎麽用?Java AttributeSource.State使用的例子?那麽, 這裏精選的方法代碼示例或許可以為您提供幫助。您也可以進一步了解該方法所在org.apache.lucene.util.AttributeSource的用法示例。


在下文中一共展示了AttributeSource.State方法的15個代碼示例,這些例子默認根據受歡迎程度排序。您可以為喜歡或者感覺有用的代碼點讚,您的評價將有助於係統推薦出更棒的Java代碼示例。

示例1: incrementToken

import org.apache.lucene.util.AttributeSource; //導入方法依賴的package包/類
@Override
public boolean incrementToken() throws IOException {
  if (input.incrementToken()) {
    // capture state lazily - maybe no SinkFilter accepts this state
    AttributeSource.State state = null;
    for (WeakReference<SinkTokenStream> ref : sinks) {
      final SinkTokenStream sink = ref.get();
      if (sink != null) {
        if (sink.accept(this)) {
          if (state == null) {
            state = this.captureState();
          }
          sink.addState(state);
        }
      }
    }
    return true;
  }
  
  return false;
}
 
開發者ID:lamsfoundation,項目名稱:lams,代碼行數:22,代碼來源:TeeSinkTokenFilter.java

示例2: incrementToken

import org.apache.lucene.util.AttributeSource; //導入方法依賴的package包/類
@Override
public final boolean incrementToken() throws IOException {
  if (cache == null) {
    // fill cache lazily
    cache = new LinkedList<AttributeSource.State>();
    fillCache();
    iterator = cache.iterator();
  }
  
  if (!iterator.hasNext()) {
    // the cache is exhausted, return false
    return false;
  }
  // Since the TokenFilter can be reset, the tokens need to be preserved as immutable.
  restoreState(iterator.next());
  return true;
}
 
開發者ID:gncloud,項目名稱:fastcatsearch3,代碼行數:18,代碼來源:CachingTokenFilter.java

示例3: end

import org.apache.lucene.util.AttributeSource; //導入方法依賴的package包/類
@Override
public final void end() throws IOException {
  super.end();
  AttributeSource.State finalState = captureState();
  for (WeakReference<SinkTokenStream> ref : sinks) {
    final SinkTokenStream sink = ref.get();
    if (sink != null) {
      sink.setFinalState(finalState);
    }
  }
}
 
開發者ID:lamsfoundation,項目名稱:lams,代碼行數:12,代碼來源:TeeSinkTokenFilter.java

示例4: incrementToken

import org.apache.lucene.util.AttributeSource; //導入方法依賴的package包/類
@Override
public final boolean incrementToken() throws IOException {
  if (tokens != null && tokens.hasNext()){
    AttributeSource.State state = tokens.next();
    restoreState(state);
    return true;
  }
  clearAttributes();
  int tokenType = scanner.getNextToken();

  if (tokenType == WikipediaTokenizerImpl.YYEOF) {
    return false;
  }
  String type = WikipediaTokenizerImpl.TOKEN_TYPES[tokenType];
  if (tokenOutput == TOKENS_ONLY || untokenizedTypes.contains(type) == false){
    setupToken();
  } else if (tokenOutput == UNTOKENIZED_ONLY && untokenizedTypes.contains(type) == true){
    collapseTokens(tokenType);

  }
  else if (tokenOutput == BOTH){
    //collapse into a single token, add it to tokens AND output the individual tokens
    //output the untokenized Token first
    collapseAndSaveTokens(tokenType, type);
  }
  int posinc = scanner.getPositionIncrement();
  if (first && posinc == 0) {
    posinc = 1; // don't emit posinc=0 for the first token!
  }
  posIncrAtt.setPositionIncrement(posinc);
  typeAtt.setType(type);
  first = false;
  return true;
}
 
開發者ID:lamsfoundation,項目名稱:lams,代碼行數:35,代碼來源:WikipediaTokenizer.java

示例5: collapseAndSaveTokens

import org.apache.lucene.util.AttributeSource; //導入方法依賴的package包/類
private void collapseAndSaveTokens(int tokenType, String type) throws IOException {
  //collapse
  StringBuilder buffer = new StringBuilder(32);
  int numAdded = scanner.setText(buffer);
  //TODO: how to know how much whitespace to add
  int theStart = scanner.yychar();
  int lastPos = theStart + numAdded;
  int tmpTokType;
  int numSeen = 0;
  List<AttributeSource.State> tmp = new ArrayList<>();
  setupSavedToken(0, type);
  tmp.add(captureState());
  //while we can get a token and that token is the same type and we have not transitioned to a new wiki-item of the same type
  while ((tmpTokType = scanner.getNextToken()) != WikipediaTokenizerImpl.YYEOF && tmpTokType == tokenType && scanner.getNumWikiTokensSeen() > numSeen){
    int currPos = scanner.yychar();
    //append whitespace
    for (int i = 0; i < (currPos - lastPos); i++){
      buffer.append(' ');
    }
    numAdded = scanner.setText(buffer);
    setupSavedToken(scanner.getPositionIncrement(), type);
    tmp.add(captureState());
    numSeen++;
    lastPos = currPos + numAdded;
  }
  //trim the buffer
  // TODO: this is inefficient
  String s = buffer.toString().trim();
  termAtt.setEmpty().append(s);
  offsetAtt.setOffset(correctOffset(theStart), correctOffset(theStart + s.length()));
  flagsAtt.setFlags(UNTOKENIZED_TOKEN_FLAG);
  //The way the loop is written, we will have proceeded to the next token.  We need to pushback the scanner to lastPos
  if (tmpTokType != WikipediaTokenizerImpl.YYEOF){
    scanner.yypushback(scanner.yylength());
  }
  tokens = tmp.iterator();
}
 
開發者ID:lamsfoundation,項目名稱:lams,代碼行數:38,代碼來源:WikipediaTokenizer.java

示例6: swap

import org.apache.lucene.util.AttributeSource; //導入方法依賴的package包/類
@Override
protected void swap(int i, int j) {
  AttributeSource.State tmp = buffered[i];
  buffered[i] = buffered[j];
  buffered[j] = tmp;
  
  int tmp2 = startOff[i];
  startOff[i] = startOff[j];
  startOff[j] = tmp2;
  
  tmp2 = posInc[i];
  posInc[i] = posInc[j];
  posInc[j] = tmp2;
}
 
開發者ID:lamsfoundation,項目名稱:lams,代碼行數:15,代碼來源:WordDelimiterFilter.java

示例7: incrementToken

import org.apache.lucene.util.AttributeSource; //導入方法依賴的package包/類
@Override
public final boolean incrementToken() {
  // lazy init the iterator
  if (it == null) {
    it = cachedStates.iterator();
  }

  if (!it.hasNext()) {
    return false;
  }
  
  AttributeSource.State state = (State) it.next();
  restoreState(state.clone());
  return true;
}
 
開發者ID:europeana,項目名稱:search,代碼行數:16,代碼來源:PreAnalyzedField.java

示例8: collapseAndSaveTokens

import org.apache.lucene.util.AttributeSource; //導入方法依賴的package包/類
private void collapseAndSaveTokens(int tokenType, String type) throws IOException {
  //collapse
  StringBuilder buffer = new StringBuilder(32);
  int numAdded = scanner.setText(buffer);
  //TODO: how to know how much whitespace to add
  int theStart = scanner.yychar();
  int lastPos = theStart + numAdded;
  int tmpTokType;
  int numSeen = 0;
  List<AttributeSource.State> tmp = new ArrayList<AttributeSource.State>();
  setupSavedToken(0, type);
  tmp.add(captureState());
  //while we can get a token and that token is the same type and we have not transitioned to a new wiki-item of the same type
  while ((tmpTokType = scanner.getNextToken()) != WikipediaTokenizerImpl.YYEOF && tmpTokType == tokenType && scanner.getNumWikiTokensSeen() > numSeen){
    int currPos = scanner.yychar();
    //append whitespace
    for (int i = 0; i < (currPos - lastPos); i++){
      buffer.append(' ');
    }
    numAdded = scanner.setText(buffer);
    setupSavedToken(scanner.getPositionIncrement(), type);
    tmp.add(captureState());
    numSeen++;
    lastPos = currPos + numAdded;
  }
  //trim the buffer
  // TODO: this is inefficient
  String s = buffer.toString().trim();
  termAtt.setEmpty().append(s);
  offsetAtt.setOffset(correctOffset(theStart), correctOffset(theStart + s.length()));
  flagsAtt.setFlags(UNTOKENIZED_TOKEN_FLAG);
  //The way the loop is written, we will have proceeded to the next token.  We need to pushback the scanner to lastPos
  if (tmpTokType != WikipediaTokenizerImpl.YYEOF){
    scanner.yypushback(scanner.yylength());
  }
  tokens = tmp.iterator();
}
 
開發者ID:yintaoxue,項目名稱:read-open-source-code,代碼行數:38,代碼來源:WikipediaTokenizer.java

示例9: incrementToken

import org.apache.lucene.util.AttributeSource; //導入方法依賴的package包/類
@Override
public final boolean incrementToken() {
  // lazy init the iterator
  if (it == null) {
    it = cachedStates.iterator();
  }

  if (!it.hasNext()) {
    return false;
  }
  
  AttributeSource.State state = it.next();
  restoreState(state);
  return true;
}
 
開發者ID:yintaoxue,項目名稱:read-open-source-code,代碼行數:16,代碼來源:TeeSinkTokenFilter.java

示例10: addState

import org.apache.lucene.util.AttributeSource; //導入方法依賴的package包/類
private void addState(AttributeSource.State state) {
  if (it != null) {
    throw new IllegalStateException("The tee must be consumed before sinks are consumed.");
  }
  cachedStates.add(state);
}
 
開發者ID:lamsfoundation,項目名稱:lams,代碼行數:7,代碼來源:TeeSinkTokenFilter.java

示例11: setFinalState

import org.apache.lucene.util.AttributeSource; //導入方法依賴的package包/類
private void setFinalState(AttributeSource.State finalState) {
  this.finalState = finalState;
}
 
開發者ID:lamsfoundation,項目名稱:lams,代碼行數:4,代碼來源:TeeSinkTokenFilter.java

示例12: add

import org.apache.lucene.util.AttributeSource; //導入方法依賴的package包/類
public void add(AttributeSource.State state) {
  inputTokens.add(state);
}
 
開發者ID:europeana,項目名稱:search,代碼行數:4,代碼來源:LookaheadTokenFilter.java

示例13: nextState

import org.apache.lucene.util.AttributeSource; //導入方法依賴的package包/類
public AttributeSource.State nextState() {
  assert nextRead < inputTokens.size();
  return inputTokens.get(nextRead++);
}
 
開發者ID:europeana,項目名稱:search,代碼行數:5,代碼來源:LookaheadTokenFilter.java

示例14: createState

import org.apache.lucene.util.AttributeSource; //導入方法依賴的package包/類
private static AttributeSource.State createState(AttributeSource a, Tok state, int tokenEnd) {
  a.clearAttributes();
  CharTermAttribute termAtt = a.addAttribute(CharTermAttribute.class);
  char[] tokChars = state.token.toString().toCharArray();
  termAtt.copyBuffer(tokChars, 0, tokChars.length);
  int tokenStart = tokenEnd - state.token.length();
  for (Entry<String, String> e : state.attr.entrySet()) {
    String k = e.getKey();
    if (k.equals("i")) {
      // position increment
      int incr = Integer.parseInt(e.getValue());
      PositionIncrementAttribute posIncr = a.addAttribute(PositionIncrementAttribute.class);
      posIncr.setPositionIncrement(incr);
    } else if (k.equals("s")) {
      tokenStart = Integer.parseInt(e.getValue());
    } else if (k.equals("e")) {
      tokenEnd = Integer.parseInt(e.getValue());
    } else if (k.equals("y")) {
      TypeAttribute type = a.addAttribute(TypeAttribute.class);
      type.setType(e.getValue());
    } else if (k.equals("f")) {
      FlagsAttribute flags = a.addAttribute(FlagsAttribute.class);
      int f = Integer.parseInt(e.getValue(), 16);
      flags.setFlags(f);
    } else if (k.equals("p")) {
      PayloadAttribute p = a.addAttribute(PayloadAttribute.class);
      byte[] data = hexToBytes(e.getValue());
      if (data != null && data.length > 0) {
        p.setPayload(new BytesRef(data));
      }
    } else {
      // unknown attribute
    }
  }
  // handle offset attr
  OffsetAttribute offset = a.addAttribute(OffsetAttribute.class);
  offset.setOffset(tokenStart, tokenEnd);
  State resState = a.captureState();
  a.clearAttributes();
  return resState;
}
 
開發者ID:europeana,項目名稱:search,代碼行數:42,代碼來源:SimplePreAnalyzedParser.java

示例15: nextState

import org.apache.lucene.util.AttributeSource; //導入方法依賴的package包/類
public AttributeSource.State nextState() {
	assert nextRead < inputTokens.size();
	return inputTokens.get(nextRead++);
}
 
開發者ID:easynet-cn,項目名稱:resource-query-parser,代碼行數:5,代碼來源:LookaheadTokenFilter.java


注:本文中的org.apache.lucene.util.AttributeSource.State方法示例由純淨天空整理自Github/MSDocs等開源代碼及文檔管理平台,相關代碼片段篩選自各路編程大神貢獻的開源項目,源碼版權歸原作者所有,傳播和使用請參考對應項目的License;未經允許,請勿轉載。