當前位置: 首頁>>代碼示例>>Java>>正文


Java Text.toString方法代碼示例

本文整理匯總了Java中org.apache.hadoop.io.Text.toString方法的典型用法代碼示例。如果您正苦於以下問題:Java Text.toString方法的具體用法?Java Text.toString怎麼用?Java Text.toString使用的例子?那麼, 這裏精選的方法代碼示例或許可以為您提供幫助。您也可以進一步了解該方法所在org.apache.hadoop.io.Text的用法示例。


在下文中一共展示了Text.toString方法的15個代碼示例,這些例子默認根據受歡迎程度排序。您可以為喜歡或者感覺有用的代碼點讚,您的評價將有助於系統推薦出更棒的Java代碼示例。

示例1: WritableSortable

import org.apache.hadoop.io.Text; //導入方法依賴的package包/類
/**
 * Creates {@code j} records and writes them back to back into one buffer.
 *
 * <p>The random source is re-seeded with a value drawn from itself and that
 * value is kept in {@code seed}. For every record the constructor stores its
 * position, the buffer offset at which it starts, and its string form
 * (in {@code check}).
 *
 * @param j number of records to generate
 * @throws IOException if writing a record into the buffer fails
 */
public WritableSortable(int j) throws IOException {
  seed = r.nextLong();
  r.setSeed(seed);

  indices = new int[j];
  offsets = new int[j];
  check = new String[j];

  final Text record = new Text();
  final StringBuilder scratch = new StringBuilder();
  final DataOutputBuffer buffer = new DataOutputBuffer();

  int slot = 0;
  while (slot < j) {
    indices[slot] = slot;
    // The record starts wherever the buffer currently ends.
    offsets[slot] = buffer.getLength();
    // Second argument is drawn from 1..15.
    genRandom(record, r.nextInt(15) + 1, scratch);
    record.write(buffer);
    check[slot] = record.toString();
    slot++;
  }

  eob = buffer.getLength();
  bytes = buffer.getData();
  comparator = WritableComparator.get(Text.class);
}
 
開發者ID:nucypher,項目名稱:hadoop-oss,代碼行數:21,代碼來源:TestIndexedSort.java

示例2: map

import org.apache.hadoop.io.Text; //導入方法依賴的package包/類
/**
 * Tokenizes the text section of one document and emits a record per token.
 *
 * <p>The text between {@code <text} and {@code </text>} is lower-cased, every
 * character outside {@code a..z} is replaced by a space, and the result is
 * split on whitespace. For each token the mapper writes the key
 * {@code id-token} with a two-element value: the total number of tokens in
 * the document and the constant 1.
 *
 * <p>Documents whose text section or id is empty are skipped.
 *
 * @param key     input key (unused)
 * @param value   the raw document
 * @param context sink for the emitted records
 */
@Override
protected void map(LongWritable key, Text value, Context context) throws IOException, InterruptedException {
	String doc = value.toString();

	String text = slice(doc, "<text", "</text>", true);
	if (text.length() < 1) return;

	// Lower-case with Locale.ROOT: the no-arg toLowerCase() follows the JVM's
	// default locale, and under e.g. a Turkish locale 'I' maps to dotless 'ı',
	// which the filter below would then wipe out.
	char[] txt = text.toLowerCase(java.util.Locale.ROOT).toCharArray();
	for (int i = 0; i < txt.length; ++i) {
		// Only lower-case ASCII letters can remain after lower-casing.
		if (txt[i] < 'a' || txt[i] > 'z') {
			txt[i] = ' ';
		}
	}

	String id = slice(doc, "<id>", "</id>", false);
	if (id.length() < 1) return;

	StringTokenizer itr = new StringTokenizer(String.valueOf(txt));
	// countTokens() must be read before iterating; it reports the tokens remaining.
	int sum = itr.countTokens();
	while (itr.hasMoreTokens()) {
		String s = itr.nextToken();
		word.set(id + '-' + s);
		IntWritable[] counts = {new IntWritable(sum), new IntWritable(1)};
		context.write(word, new IntArrayWritable(counts));
	}
}
 
開發者ID:lzmhhh123,項目名稱:Wikipedia-Index,代碼行數:26,代碼來源:TF.java

示例3: reduce

import org.apache.hadoop.io.Text; //導入方法依賴的package包/類
/**
 * Appends every incoming value as one line to the index stream and, each time
 * a batch of entries has been written, appends a summary line to the master
 * stream.
 *
 * <p>A summary line holds the start index, end index, start position and
 * current position of the index stream, separated by single spaces.
 *
 * @param key      key of the current group; its int value becomes the end index
 * @param values   values to append to the index stream
 * @param out      output collector (not used here)
 * @param reporter used to report status and progress after each batch
 * @throws IOException if writing to either stream fails
 */
public void reduce(IntWritable key, Iterator<Text> values,
    OutputCollector<Text, Text> out,
    Reporter reporter) throws IOException {
  keyVal = key.get();
  while (values.hasNext()) {
    final String indexLine = values.next().toString() + "\n";
    indexStream.write(indexLine.getBytes(Charsets.UTF_8));
    written++;

    if (written <= numIndexes - 1) {
      continue; // batch not full yet
    }

    // A full batch of numIndexes entries has been written: report and
    // record its extent in the master stream.
    reporter.setStatus("Creating index for archives");
    reporter.progress();
    endIndex = keyVal;
    final String masterLine = startIndex + " " + endIndex + " " + startPos
        + " " + indexStream.getPos() + " \n";
    outStream.write(masterLine.getBytes(Charsets.UTF_8));

    // The next batch begins where this one ended.
    startPos = indexStream.getPos();
    startIndex = endIndex;
    written = 0;
  }
}
 
開發者ID:naver,項目名稱:hadoop,代碼行數:24,代碼來源:HadoopArchives.java

示例4: map

import org.apache.hadoop.io.Text; //導入方法依賴的package包/類
/**
 * Extracts the year and air temperature from one fixed-width record and emits
 * them when the reading is usable.
 *
 * <p>The year is taken from columns 15-18, the signed temperature from
 * columns 87-91 and the quality code from column 92. A pair is written only
 * if the temperature differs from {@code MISSING} and the quality code is one
 * of 0, 1, 4, 5 or 9.
 *
 * @param key     input key (unused)
 * @param value   one input record
 * @param context sink for the (year, temperature) pair
 */
@Override
protected void map(LongWritable key, Text value, Context context) throws IOException, InterruptedException {
    final String record = value.toString();
    final String year = record.substring(15, 19);

    // Integer.parseInt is not handed a leading '+', so skip it when present.
    final int digitsFrom = (record.charAt(87) == '+') ? 88 : 87;
    final int airTemperature = Integer.parseInt(record.substring(digitsFrom, 92));

    final String quality = record.substring(92, 93);
    if (airTemperature == MISSING || !quality.matches("[01459]")) {
        return;
    }
    context.write(new Text(year), new IntWritable(airTemperature));
}
 
開發者ID:myziyue,項目名稱:learn-to-hadoop,代碼行數:18,代碼來源:MaxTemperatureMapper.java

示例5: map

import org.apache.hadoop.io.Text; //導入方法依賴的package包/類
/**
 * Emits three key-value pairs per whitespace-separated token: the token's
 * length under {@code LENGTH}, the square of its length under {@code SQUARE},
 * and {@code ONE} under {@code COUNT}.
 *
 * @param key
 *          Input key (unused).
 * @param value
 *          This will be a line of text coming in from our input file.
 * @param context
 *          Sink for the emitted pairs.
 */
public void map(Object key, Text value, Context context)
    throws IOException, InterruptedException {
  StringTokenizer itr = new StringTokenizer(value.toString());
  while (itr.hasMoreTokens()) {
    final int length = itr.nextToken().length();

    this.wordLen.set(length);

    // Square in long arithmetic: exact for every int length, and avoids the
    // round trip through double that Math.pow would take.
    this.wordLenSq.set((long) length * length);

    context.write(LENGTH, this.wordLen);
    context.write(SQUARE, this.wordLenSq);
    context.write(COUNT, ONE);
  }
}
 
開發者ID:naver,項目名稱:hadoop,代碼行數:24,代碼來源:WordStandardDeviation.java

示例6: setRenewer

import org.apache.hadoop.io.Text; //導入方法依賴的package包/類
/**
 * Sets the renewer, storing the short name derived from the given value.
 *
 * <p>A {@code null} argument stores an empty {@code Text}. Otherwise the
 * argument is wrapped in a {@code HadoopKerberosName} and the result of
 * {@code getShortName()} is stored.
 *
 * @param renewer the renewer name, or {@code null}
 * @throws RuntimeException wrapping the {@code IOException} raised while
 *         resolving the short name
 */
public void setRenewer(Text renewer) {
  if (renewer == null) {
    this.renewer = new Text();
    return;
  }

  final HadoopKerberosName kerberosName = new HadoopKerberosName(renewer.toString());
  try {
    this.renewer = new Text(kerberosName.getShortName());
  } catch (IOException e) {
    throw new RuntimeException(e);
  }
}
 
開發者ID:naver,項目名稱:hadoop,代碼行數:13,代碼來源:AbstractDelegationTokenIdentifier.java

示例7: reduce

import org.apache.hadoop.io.Text; //導入方法依賴的package包/類
/**
 * For each value in the group, builds an output key/value pair with a
 * {@code FieldSelectionHelper} and collects it.
 *
 * <p>The helper receives the key followed by the field separator, the value
 * as a string, and the configured reduce-side key and value field lists.
 *
 * @param key      key of the current group
 * @param values   values belonging to {@code key}
 * @param output   collector receiving the selected key/value pairs
 * @param reporter progress reporter (not used here)
 * @throws IOException if collecting a pair fails
 */
public void reduce(Text key, Iterator<Text> values,
                   OutputCollector<Text, Text> output, Reporter reporter)
  throws IOException {
  final String keyPrefix = key.toString() + this.fieldSeparator;
  while (values.hasNext()) {
    final String valueStr = values.next().toString();
    // A fresh helper per value.
    final FieldSelectionHelper selector = new FieldSelectionHelper();
    selector.extractOutputKeyValue(keyPrefix, valueStr,
        fieldSeparator, reduceOutputKeyFieldList,
        reduceOutputValueFieldList, allReduceValueFieldsFrom, false, false);
    output.collect(selector.getKey(), selector.getValue());
  }
}
 
開發者ID:naver,項目名稱:hadoop,代碼行數:13,代碼來源:FieldSelectionMapReduce.java

示例8: map

import org.apache.hadoop.io.Text; //導入方法依賴的package包/類
/**
 * Splits the input value on whitespace and writes {@code (token, one)} for
 * every token.
 *
 * @param key     input key (unused)
 * @param value   text to tokenize
 * @param context sink for the emitted pairs
 */
public void map(Object key, Text value, Context context
    ) throws IOException, InterruptedException {
  final String line = value.toString();
  for (StringTokenizer tokens = new StringTokenizer(line); tokens.hasMoreTokens(); ) {
    final String token = tokens.nextToken();
    // The shared 'word' instance is overwritten for each token before the write.
    word.set(token);
    context.write(word, one);
  }
}
 
開發者ID:naver,項目名稱:hadoop,代碼行數:9,代碼來源:TestLocalModeWithNewApis.java

示例9: map

import org.apache.hadoop.io.Text; //導入方法依賴的package包/類
/**
 * Writes one {@code (length, ONE)} pair for every whitespace-separated token
 * of the input, where {@code length} holds the token's character count.
 *
 * @param key
 *          Input key (unused).
 * @param value
 *          This will be a line of text coming in from our input file.
 * @param context
 *          Sink for the emitted pairs.
 */
public void map(Object key, Text value, Context context)
    throws IOException, InterruptedException {
  final StringTokenizer tokens = new StringTokenizer(value.toString());
  while (tokens.hasMoreTokens()) {
    final int tokenLength = tokens.nextToken().length();
    length.set(tokenLength);
    context.write(length, ONE);
  }
}
 
開發者ID:naver,項目名稱:hadoop,代碼行數:17,代碼來源:WordMedian.java

示例10: map

import org.apache.hadoop.io.Text; //導入方法依賴的package包/類
/**
 * Emits {@code (token, one)} for each whitespace-delimited token found in
 * the input value.
 *
 * @param key     input key (unused)
 * @param value   text to split into tokens
 * @param context sink for the emitted pairs
 */
public void map(Object key, Text value, Context context)
    throws IOException, InterruptedException {
  final StringTokenizer tokenizer = new StringTokenizer(value.toString());
  while (tokenizer.hasMoreTokens()) {
    final String next = tokenizer.nextToken();
    word.set(next);
    context.write(word, one);
  }
}
 
開發者ID:naver,項目名稱:hadoop,代碼行數:9,代碼來源:TestJobCounters.java

示例11: map

import org.apache.hadoop.io.Text; //導入方法依賴的package包/類
/**
 * Finds every match of {@code pattern} in the input value and collects the
 * configured capture group of each match together with a count of 1.
 *
 * @param key      input key (unused)
 * @param value    text to search
 * @param output   collector receiving {@code (matched text, 1)} pairs
 * @param reporter progress reporter (not used here)
 * @throws IOException if collecting a pair fails
 */
public void map(K key, Text value,
                OutputCollector<Text, LongWritable> output,
                Reporter reporter)
  throws IOException {
  final Matcher hits = pattern.matcher(value.toString());
  while (hits.find()) {
    final Text matched = new Text(hits.group(group));
    output.collect(matched, new LongWritable(1));
  }
}
 
開發者ID:naver,項目名稱:hadoop,代碼行數:11,代碼來源:RegexMapper.java

示例12: map

import org.apache.hadoop.io.Text; //導入方法依賴的package包/類
/**
 * Re-keys a record on the part of the incoming key that precedes its first
 * comma.
 *
 * <p>The output key is the text before the first comma of the input key. The
 * output value is the remainder of the input key, a comma, and the input
 * value.
 *
 * <p>NOTE(review): when the key has no comma, {@code indexOf} returns -1 and
 * the first {@code substring} call throws — confirm that input always
 * contains one.
 *
 * @param key     input key, expected to contain a comma
 * @param value   input value, appended to the tail of the key
 * @param context sink for the re-keyed record
 */
@Override
public void map(Text key, Text value, Context context) throws IOException, InterruptedException{
    final String keyLine = key.toString();
    final String valueText = value.toString();
    final int comma = keyLine.indexOf(",");

    final Text outKey = new Text(keyLine.substring(0, comma));
    final Text outValue = new Text(keyLine.substring(comma + 1) + "," + valueText);
    context.write(outKey, outValue);
}
 
開發者ID:dhruvmalik007,項目名稱:Deep_learning_using_Java,代碼行數:8,代碼來源:Recommendation_program.java

示例13: testConvertText

import org.apache.hadoop.io.Text; //導入方法依賴的package包/類
/**
 * Checks that a {@code Text} built from bytes equals a {@code Text} rebuilt
 * from its own string form.
 */
@Test
public void testConvertText() {
  // Encode explicitly as UTF-8 rather than with the platform default charset,
  // so the bytes handed to Text do not depend on the JVM's configuration.
  Text t = new Text("abc".getBytes(java.nio.charset.StandardCharsets.UTF_8));
  String s = t.toString();
  Text t1 = new Text(s);
  assertEquals(t, t1);
}
 
開發者ID:naver,項目名稱:hadoop,代碼行數:8,代碼來源:TestPBHelper.java

示例14: map

import org.apache.hadoop.io.Text; //導入方法依賴的package包/類
/**
 * Tokenizes the input value on whitespace and writes {@code (token, one)}
 * once per token.
 *
 * @param key     input key (unused)
 * @param value   text to tokenize
 * @param context sink for the emitted pairs
 */
@Override
public void map(Object key, Text value, Context context
                ) throws IOException, InterruptedException {
  final String text = value.toString();
  final StringTokenizer pieces = new StringTokenizer(text);
  while (pieces.hasMoreTokens()) {
    final String piece = pieces.nextToken();
    word.set(piece);
    context.write(word, one);
  }
}
 
開發者ID:naver,項目名稱:hadoop,代碼行數:10,代碼來源:TokenCounterMapper.java

示例15: map

import org.apache.hadoop.io.Text; //導入方法依賴的package包/類
/**
 * Re-samples the topic assigned to one word occurrence and emits the updated
 * assignment.
 *
 * <p>Steps, in order: remove the occurrence's current topic from the
 * {@code docToTopic} and {@code topicToWord} counts, compute an unnormalised
 * weight for each of the {@code K} topics, turn the weights into a cumulative
 * sum, draw a new topic from it, add the occurrence back under the new topic,
 * and write the key (now carrying the new topic) with the unchanged value.
 *
 * @param key     carries the index {@code m} and the current topic; mutated in place
 * @param value   the word
 * @param context sink for the updated (key, value) pair
 */
@Override
protected void map(twoDimensionIndexWritable key, Text value, Context context) throws IOException, InterruptedException {
    int m = key.getM();
    int oldTopic = key.getTopic();
    String word = value.toString();
    // NOTE(review): if wordToIndex.get returns null for an unknown word, the
    // unboxing into int would throw — confirm every word is present.
    int index = wordToIndex.get(word);

    // Take this occurrence out of the counts before computing the weights.
    docToTopic.getValue(m).setValue(oldTopic,docToTopic.getValue(m).getValue(oldTopic)-1);
    topicToWord.getValue(oldTopic).setValue(index,topicToWord.getValue(oldTopic).getValue(index)-1);

    // p[k]: (docToTopic[m][k] + alpha) / (row sum of docToTopic at m + K*alpha)
    //     * (topicToWord[k][index] + beta) / (row sum of topicToWord at k + V*beta)
    double[] p = new double[K];
    for(int k = 0; k < K; k++) {
        p[k] = (docToTopic.getValue(m).getValue(k)+alpha)/(MatrixOperations.sumByRow(docToTopic).getValue(m)+K*alpha)
                *(topicToWord.getValue(k).getValue(index)+beta)/(MatrixOperations.sumByRow(topicToWord).getValue(k)+V*beta);
    }
    // Convert the weights into a running (cumulative) sum.
    for(int k = 1; k < K; k++){
        p[k] += p[k - 1];
    }
    double u = Math.random() * p[K - 1]; //p[] is unnormalised
    int newTopic;
    // With the distribution of the current word over all topics in hand, sample a
    // new topic for the word from it: pick the first topic whose cumulative weight exceeds u.
    // NOTE(review): if no cumulative weight exceeds u the loop ends with
    // newTopic == K — confirm that cannot happen for the expected inputs.
    for(newTopic = 0; newTopic < K; newTopic++){
        if(u < p[newTopic]){
            break;
        }
    }

    // Add the occurrence back under the newly drawn topic.
    docToTopic.getValue(m).setValue(newTopic,docToTopic.getValue(m).getValue(newTopic)+1);
    topicToWord.getValue(newTopic).setValue(index,topicToWord.getValue(newTopic).getValue(index)+1);
    key.setMatrixKind(MatrixKind.Corpus);
    key.setTopic(newTopic);

    context.write(key, value);

}
 
開發者ID:huyang1,項目名稱:LDA,代碼行數:36,代碼來源:LDAMapper.java


注:本文中的org.apache.hadoop.io.Text.toString方法示例由純淨天空整理自Github/MSDocs等開源代碼及文檔管理平台,相關代碼片段篩選自各路編程大神貢獻的開源項目,源碼版權歸原作者所有,傳播和使用請參考對應項目的License;未經允許,請勿轉載。