本文整理汇总了Java中org.apache.storm.hdfs.bolt.format.DefaultFileNameFormat类的典型用法代码示例。如果您正苦于以下问题:Java DefaultFileNameFormat类的具体用法?Java DefaultFileNameFormat怎么用?Java DefaultFileNameFormat使用的例子?那么,这里精选的类代码示例或许可以为您提供帮助。
DefaultFileNameFormat类属于org.apache.storm.hdfs.bolt.format包,下文共展示了DefaultFileNameFormat类的15个代码示例,这些示例默认按受欢迎程度排序。您可以为喜欢或者觉得有用的代码点赞,您的评价将有助于系统推荐出更好的Java代码示例。
示例1: createHdfsBolt
import org.apache.storm.hdfs.bolt.format.DefaultFileNameFormat; //导入依赖的package包/类
/**
 * Builds the bolt that persists ticks to HDFS.
 *
 * @return an {@link HdfsBolt} targeting {@code hdfs://localhost:8020} that writes
 *         "|"-delimited records below the {@code stock-ticks/} path
 */
private static HdfsBolt createHdfsBolt() {
    return new HdfsBolt()
        .withFsUrl("hdfs://localhost:8020")
        // Relative output path; presumably resolved against the HDFS user's home
        // directory (i.e. <user>/stock-ticks/) -- confirm against the cluster setup.
        .withFileNameFormat(new DefaultFileNameFormat().withPath("stock-ticks/"))
        // Separate record fields with "|".
        .withRecordFormat(new DelimitedRecordFormat().withFieldDelimiter("|"))
        // Start a new file once the current one reaches 5 MB.
        .withRotationPolicy(new FileSizeRotationPolicy(5.0f, Units.MB))
        // Sync the filesystem after every 100 tuples.
        .withSyncPolicy(new CountSyncPolicy(100));
}
示例2: createHdfsBolt
import org.apache.storm.hdfs.bolt.format.DefaultFileNameFormat; //导入依赖的package包/类
/**
 * Builds an {@link HdfsBolt} whose output path and filesystem URL are read from
 * {@code Properties} under the keys {@code sa.storm.hdfs_output_file} and
 * {@code sa.storm.hdfs_url}.
 *
 * @return the configured bolt
 */
private static HdfsBolt createHdfsBolt() {
    // Where the output files go.
    final String outputPath = Properties.getString("sa.storm.hdfs_output_file");
    final FileNameFormat nameFormat = new DefaultFileNameFormat().withPath(outputPath);

    // Which filesystem to write to.
    final String fsUrl = Properties.getString("sa.storm.hdfs_url");

    HdfsBolt bolt = new HdfsBolt()
        .withFsUrl(fsUrl)
        .withFileNameFormat(nameFormat)
        // "|" is the field delimiter
        .withRecordFormat(new DelimitedRecordFormat().withFieldDelimiter("|"))
        // roll over to a new file at 5 MB
        .withRotationPolicy(new FileSizeRotationPolicy(5.0f, FileSizeRotationPolicy.Units.MB))
        // sync the filesystem after every 1000 tuples
        .withSyncPolicy(new CountSyncPolicy(1000));
    return bolt;
}
示例3: getHdfsBolt
import org.apache.storm.hdfs.bolt.format.DefaultFileNameFormat; //导入依赖的package包/类
/**
 * Assembles an {@link HdfsBolt} from this object's settings: {@code hdfsDefaultFs},
 * {@code outputLocation}, {@code fieldDelimiter}, {@code fileRotationPolicy} and
 * {@code syncCount}.
 *
 * @return the configured bolt
 */
public HdfsBolt getHdfsBolt() {
    LOG.info("HDFSBOLT: Configuring the HdfsBolt");

    return new HdfsBolt()
        .withFsUrl(hdfsDefaultFs)
        // Files are written under the configured output location.
        .withFileNameFormat(new DefaultFileNameFormat().withPath(outputLocation))
        // Records are delimited with the configured field delimiter.
        .withRecordFormat(new DelimitedRecordFormat().withFieldDelimiter(fieldDelimiter))
        .withRotationPolicy(fileRotationPolicy)
        // Sync policy is count-based, driven by syncCount.
        .withSyncPolicy(new CountSyncPolicy(syncCount));
}
示例4: getHdfsBolt
import org.apache.storm.hdfs.bolt.format.DefaultFileNameFormat; //导入依赖的package包/类
/**
 * Builds an {@link HdfsBolt} that writes comma-delimited {@code .txt} files into
 * {@code srcDir} and registers a {@code MoveFileAction} targeting {@code rotationDir}
 * as a rotation action.
 *
 * @param fsUrl       filesystem URL handed to the bolt
 * @param srcDir      path the bolt writes its files to
 * @param rotationDir destination configured on the move-file rotation action
 * @return the configured bolt
 */
public static HdfsBolt getHdfsBolt(String fsUrl, String srcDir, String rotationDir) {
    FileNameFormat txtFilesInSrcDir = new DefaultFileNameFormat()
        .withExtension(".txt")
        .withPath(srcDir);

    return new HdfsBolt()
        .withFsUrl(fsUrl)
        .withFileNameFormat(txtFilesInSrcDir)
        .withRecordFormat(new DelimitedRecordFormat().withFieldDelimiter(","))
        // sync the filesystem after every single tuple
        .withSyncPolicy(new CountSyncPolicy(1))
        // rotate at a file size of 1 KB
        .withRotationPolicy(new FileSizeRotationPolicy(1f, FileSizeRotationPolicy.Units.KB))
        .addRotationAction(new MoveFileAction().toDestination(rotationDir));
}
示例5: configureHdfsBolt
import org.apache.storm.hdfs.bolt.format.DefaultFileNameFormat; //导入依赖的package包/类
/**
 * Creates an {@link HdfsBolt} and registers it on the given topology builder,
 * shuffle-grouped on the named spout.
 *
 * @param builder         topology builder the bolt is added to
 * @param delimiter       field delimiter for the written records
 * @param outputPath      path the bolt writes its files to
 * @param hdfsUri         filesystem URL handed to the bolt
 * @param hdfsBoltName    component id under which the bolt is registered
 * @param spoutName       component id of the spout the bolt subscribes to
 * @param parallelismHint parallelism hint passed to {@code setBolt}
 * @param rotationPolicy  file rotation policy for the bolt
 * @param syncCount       count passed to the {@code CountSyncPolicy}
 */
public static void configureHdfsBolt(TopologyBuilder builder,
                                     String delimiter,
                                     String outputPath,
                                     String hdfsUri,
                                     String hdfsBoltName,
                                     String spoutName,
                                     int parallelismHint,
                                     FileRotationPolicy rotationPolicy,
                                     int syncCount) {
    LOG.info("HDFSBOLT: Configuring the HdfsBolt");

    // Assemble the bolt in one chain: target filesystem, file naming,
    // record layout, rotation and sync behaviour.
    HdfsBolt hdfsBolt = new HdfsBolt()
        .withFsUrl(hdfsUri)
        .withFileNameFormat(new DefaultFileNameFormat().withPath(outputPath))
        .withRecordFormat(new DelimitedRecordFormat().withFieldDelimiter(delimiter))
        .withRotationPolicy(rotationPolicy)
        .withSyncPolicy(new CountSyncPolicy(syncCount));

    // Wire the bolt into the topology.
    builder.setBolt(hdfsBoltName, hdfsBolt, parallelismHint).shuffleGrouping(spoutName);
}
示例6: setup
import org.apache.storm.hdfs.bolt.format.DefaultFileNameFormat; //导入依赖的package包/类
/**
 * Prepares a fresh temporary folder and a file name format pointing at it
 * before each test.
 *
 * @throws IOException if the temporary folder cannot be created
 */
@Before
public void setup() throws IOException {
    // A new folder per test keeps the tests from seeing each other's output.
    folder = tempFolder.newFolder();
    final String basePath = folder.toString();
    testFormat = new DefaultFileNameFormat()
        .withPrefix("prefix-")
        .withExtension(".json")
        .withPath(basePath);
}
示例7: testWriteSingleFileWithNull
import org.apache.storm.hdfs.bolt.format.DefaultFileNameFormat; //导入依赖的package包/类
/**
 * Writes a single message that lacks the field referenced by the output path
 * function and checks that it ends up in exactly one file under
 * {@code test-null/null/}.
 */
@Test
@SuppressWarnings("unchecked")
public void testWriteSingleFileWithNull() throws Exception {
    WriterConfiguration config =
        buildWriterConfiguration("FORMAT('test-%s/%s', test.key, test.key)");
    HdfsWriter writer = new HdfsWriter().withFileNameFormat(
        new DefaultFileNameFormat()
            .withPath(folder.toString())
            .withExtension(".json")
            .withPrefix("prefix-"));
    writer.init(new HashMap<String, String>(), createTopologyContext(), config);

    // The only message written does not contain test.key, so the path function
    // is evaluated without a value for it.
    JSONObject message = new JSONObject();
    message.put("test.key2", "test.value2");
    ArrayList<JSONObject> messages = new ArrayList<>();
    messages.add(message);

    writer.write(SENSOR_NAME, config, new ArrayList<Tuple>(), messages);
    writer.close();

    List<String> expected = new ArrayList<>();
    expected.add(message.toJSONString());
    Collections.sort(expected);

    File outputFolder = new File(folder.getAbsolutePath() + "/test-null/null/");
    Assert.assertTrue(outputFolder.exists() && outputFolder.isDirectory());

    File[] written = outputFolder.listFiles();
    Assert.assertEquals(1, written.length);
    for (File file : written) {
        // Compare sorted content so line order in the file does not matter.
        List<String> lines = Files.readAllLines(file.toPath());
        Collections.sort(lines);
        Assert.assertEquals(expected, lines);
    }
}
示例8: testGetPath
import org.apache.storm.hdfs.bolt.format.DefaultFileNameFormat; //导入依赖的package包/类
/**
 * Checks that {@code PathExtensionFileNameFormat#getPath()} yields the delegate's
 * path followed by "/" and the path extension.
 */
@Test
public void testGetPath() {
    FileNameFormat wrapped = new PathExtensionFileNameFormat(
        PATH_EXTENSION,
        new DefaultFileNameFormat().withExtension(EXTENSION).withPath(PATH));

    Assert.assertEquals(PATH + "/" + PATH_EXTENSION, wrapped.getPath());
}
示例9: testGetPathEmptyPathExtension
import org.apache.storm.hdfs.bolt.format.DefaultFileNameFormat; //导入依赖的package包/类
/**
 * Checks that an empty path extension makes {@code getPath()} return the
 * delegate's path with a trailing "/".
 */
@Test
public void testGetPathEmptyPathExtension() {
    FileNameFormat wrapped = new PathExtensionFileNameFormat(
        "",
        new DefaultFileNameFormat().withExtension(EXTENSION).withPath(PATH));

    String expected = PATH + "/";
    Assert.assertEquals(expected, wrapped.getPath());
}
示例10: configureHdfsBolt
import org.apache.storm.hdfs.bolt.format.DefaultFileNameFormat; //导入依赖的package包/类
/**
 * Creates an {@link HdfsBolt} and registers it on the builder as {@code "hdfsbolt"}
 * with parallelism 1, shuffle-grouped on the {@code "kafkaspout"} component.
 *
 * @param builder    topology builder the bolt is added to
 * @param delimiter  field delimiter for the written records
 * @param outputPath path the bolt writes its files to
 * @param hdfsUri    filesystem URL handed to the bolt
 */
public static void configureHdfsBolt(TopologyBuilder builder, String delimiter, String outputPath, String hdfsUri) {
    // Size-based rotation at 1 KB. A time-based alternative was previously tried here:
    //   new TimedRotationPolicy(300, TimedRotationPolicy.TimeUnit.SECONDS)
    FileRotationPolicy sizeRotation = new FileSizeRotationPolicy(1, FileSizeRotationPolicy.Units.KB);

    HdfsBolt hdfsBolt = new HdfsBolt()
        .withFsUrl(hdfsUri)
        .withFileNameFormat(new DefaultFileNameFormat().withPath(outputPath))
        .withRecordFormat(new DelimitedRecordFormat().withFieldDelimiter(delimiter))
        .withRotationPolicy(sizeRotation)
        // sync the filesystem after every 1000 tuples
        .withSyncPolicy(new CountSyncPolicy(1000));

    builder.setBolt("hdfsbolt", hdfsBolt, 1).shuffleGrouping("kafkaspout");
}
示例11: main
import org.apache.storm.hdfs.bolt.format.DefaultFileNameFormat; //导入依赖的package包/类
/**
 * Builds a Kafka -> check -> counter -> HDFS topology and runs it.
 *
 * <p>With at least one argument the topology is submitted to the cluster under
 * the name {@code args[0]}; without arguments it runs in a {@code LocalCluster}
 * for 500 seconds and is then shut down.
 *
 * <p>Any exception is printed to standard error rather than propagated.
 *
 * @param args optional; {@code args[0]} is the topology name for cluster submission
 */
public static void main(String[] args) {
    try {
        String zkhost = "wxb-1:2181,wxb-2:2181,wxb-3:2181";
        String topic = "order";
        String groupId = "id";
        int spoutNum = 3;
        int boltNum = 1;
        // ZooKeeper ensemble used by Kafka
        ZkHosts zkHosts = new ZkHosts(zkhost);
        // ZooKeeper root "/order" and consumer id "id"
        SpoutConfig spoutConfig = new SpoutConfig(zkHosts, topic, "/order", groupId);
        spoutConfig.scheme = new SchemeAsMultiScheme(new StringScheme());
        KafkaSpout kafkaSpout = new KafkaSpout(spoutConfig);

        // HDFS bolt
        // use "|" instead of "," for field delimiter
        RecordFormat format = new DelimitedRecordFormat()
            .withFieldDelimiter("|");
        // sync the filesystem after every 1k tuples
        SyncPolicy syncPolicy = new CountSyncPolicy(1000);
        // rotate files when they reach 5MB
        // (time-based alternative: new TimedRotationPolicy(1.0f, TimedRotationPolicy.TimeUnit.MINUTES))
        FileRotationPolicy rotationPolicy =
            new FileSizeRotationPolicy(5.0f, FileSizeRotationPolicy.Units.MB);
        FileNameFormat fileNameFormat = new DefaultFileNameFormat()
            .withPath("/tmp/").withPrefix("order_").withExtension(".log");
        HdfsBolt hdfsBolt = new HdfsBolt()
            .withFsUrl("hdfs://wxb-1:8020")
            .withFileNameFormat(fileNameFormat)
            .withRecordFormat(format)
            .withRotationPolicy(rotationPolicy)
            .withSyncPolicy(syncPolicy);

        TopologyBuilder builder = new TopologyBuilder();
        builder.setSpout("spout", kafkaSpout, spoutNum);
        builder.setBolt("check", new CheckOrderBolt(), boltNum).shuffleGrouping("spout");
        builder.setBolt("counter", new CounterBolt(), boltNum).shuffleGrouping("check");
        builder.setBolt("hdfs", hdfsBolt, boltNum).shuffleGrouping("counter");

        Config config = new Config();
        config.setDebug(true);
        if (args != null && args.length > 0) {
            config.setNumWorkers(2);
            StormSubmitter.submitTopology(args[0], config, builder.createTopology());
        } else {
            config.setMaxTaskParallelism(2);
            LocalCluster cluster = new LocalCluster();
            try {
                cluster.submitTopology("Wordcount-Topology", config, builder.createTopology());
                Thread.sleep(500000);
            } finally {
                // Always stop the in-process cluster, even if submission fails
                // or the sleep is interrupted.
                cluster.shutdown();
            }
        }
    } catch (InterruptedException e) {
        // Restore the interrupt flag so callers/runtime can still observe it.
        Thread.currentThread().interrupt();
        e.printStackTrace();
    } catch (Exception e) {
        e.printStackTrace();
    }
}
示例12: configureHDFSBolt
import org.apache.storm.hdfs.bolt.format.DefaultFileNameFormat; //导入依赖的package包/类
/**
 * Creates an {@link HdfsBolt} from {@code topologyConfig} and registers it on the
 * builder as {@code "hdfs_bolt"}, shuffle-grouped on {@code "kafkaSpout"}.
 *
 * <p>Properties read: {@code hdfs.path}, {@code hdfs.file.prefix}, {@code hdfs.url},
 * {@code hive.metastore.url}, {@code hive.staging.table.name},
 * {@code hive.database.name}, {@code hdfs.file.rotation.time.minutes} and
 * {@code hdfsbolt.thread.count}.
 *
 * @param builder topology builder the bolt is added to
 */
public void configureHDFSBolt(TopologyBuilder builder) {
    final String rootPath = topologyConfig.getProperty("hdfs.path");
    final String prefix = topologyConfig.getProperty("hdfs.file.prefix");
    final String fsUrl = topologyConfig.getProperty("hdfs.url");
    final String sourceMetastoreUrl = topologyConfig.getProperty("hive.metastore.url");
    final String hiveStagingTableName = topologyConfig.getProperty("hive.staging.table.name");
    final String databaseName = topologyConfig.getProperty("hive.database.name");
    final float rotationMinutes =
        Float.parseFloat(topologyConfig.getProperty("hdfs.file.rotation.time.minutes"));

    // Rotation is time-based (every rotationMinutes minutes). A size-based policy
    // (FileSizeRotationPolicy(5.0f, Units.MB)) was used here previously.
    FileTimeRotationPolicy timeRotation =
        new FileTimeRotationPolicy(rotationMinutes, FileTimeRotationPolicy.Units.MINUTES);

    // Rotation action that receives the Hive metastore URL, staging table,
    // database name and filesystem URL. A MoveFileAction to rootPath + "/working"
    // was used here previously.
    HiveTablePartitionAction partitionAction = new HiveTablePartitionAction(
        sourceMetastoreUrl, hiveStagingTableName, databaseName, fsUrl);

    HdfsBolt hdfsBolt = new HdfsBolt()
        .withFsUrl(fsUrl)
        // Files go to <rootPath>/staging with the configured prefix.
        .withFileNameFormat(new DefaultFileNameFormat()
            .withPath(rootPath + "/staging")
            .withPrefix(prefix))
        // Fields are comma-delimited.
        .withRecordFormat(new DelimitedRecordFormat().withFieldDelimiter(","))
        .withRotationPolicy(timeRotation)
        // Synchronize the data buffer with the filesystem every 1000 tuples.
        .withSyncPolicy(new CountSyncPolicy(1000))
        .addRotationAction(partitionAction);

    final int hdfsBoltCount = Integer.parseInt(topologyConfig.getProperty("hdfsbolt.thread.count"));
    builder.setBolt("hdfs_bolt", hdfsBolt, hdfsBoltCount).shuffleGrouping("kafkaSpout");
}
示例13: main
import org.apache.storm.hdfs.bolt.format.DefaultFileNameFormat; //导入依赖的package包/类
/**
 * Builds the weather-events topology (Kafka spout feeding {@code FilterAirportsBolt})
 * and either submits it under the name {@code args[0]} or, without arguments, runs it
 * in a {@code LocalCluster} as {@code "weather-topology"}.
 *
 * @param args optional; {@code args[0]} is the topology name for cluster submission
 */
public static void main(String[] args) throws AlreadyAliveException, InvalidTopologyException {
    String zkIp = "localhost";
    // NOTE(review): nimbusHost is never read in this method.
    String nimbusHost = "sandbox.hortonworks.com";

    List<String> zkServers = new ArrayList<String>();
    zkServers.add(zkIp);

    // Kafka spout reading "spertus-weather-events" from the earliest offset.
    SpoutConfig spoutSettings = new SpoutConfig(
        new ZkHosts(zkIp + ":2181"),
        "spertus-weather-events",
        "/spertus-weather-events",
        "test_id");
    spoutSettings.scheme = new SchemeAsMultiScheme(new StringScheme());
    spoutSettings.startOffsetTime = kafka.api.OffsetRequest.EarliestTime();
    spoutSettings.zkServers = zkServers;
    spoutSettings.zkRoot = "/spertus-weather-events";
    spoutSettings.zkPort = 2181;
    spoutSettings.forceFromStart = true;
    KafkaSpout weatherSpout = new KafkaSpout(spoutSettings);

    // HDFS bolt: "|"-delimited records under /tmp/test, sync every 10 tuples,
    // rotate at 5 MB. It is constructed but currently not wired into the topology
    // (see the disabled setBolt lines below).
    HdfsBolt hdfsBolt = new HdfsBolt()
        .withFsUrl("hdfs://sandbox.hortonworks.com:8020")
        .withFileNameFormat(new DefaultFileNameFormat().withPath("/tmp/test"))
        .withRecordFormat(new DelimitedRecordFormat().withFieldDelimiter("|"))
        .withSyncPolicy(new CountSyncPolicy(10))
        .withRotationPolicy(new FileSizeRotationPolicy(5.0f, Units.MB));

    TopologyBuilder topology = new TopologyBuilder();
    topology.setSpout("raw-weather-events", weatherSpout, 1);
    topology.setBolt("filter-airports", new FilterAirportsBolt(), 1).shuffleGrouping("raw-weather-events");
    // topology.setBolt("test-bolt", new TestBolt(), 1).shuffleGrouping("raw-weather-events");
    // topology.setBolt("hdfs-bolt", hdfsBolt, 1).shuffleGrouping("raw-weather-events");

    Map stormConf = new HashMap();
    stormConf.put(backtype.storm.Config.TOPOLOGY_WORKERS, 4);
    stormConf.put(backtype.storm.Config.TOPOLOGY_DEBUG, true);

    boolean submitToCluster = args != null && args.length > 0;
    if (!submitToCluster) {
        LocalCluster cluster = new LocalCluster();
        cluster.submitTopology("weather-topology", stormConf, topology.createTopology());
        return;
    }
    StormSubmitter.submitTopology(args[0], stormConf, topology.createTopology());
}
示例14: testWriteNoOutputFunction
import org.apache.storm.hdfs.bolt.format.DefaultFileNameFormat; //导入依赖的package包/类
/**
 * Writes two messages with a writer configuration that defines no output path
 * function and checks that both land in a single file under
 * {@code <folder>/<SENSOR_NAME>}.
 */
@Test
@SuppressWarnings("unchecked")
public void testWriteNoOutputFunction() throws Exception {
    HdfsWriter writer = new HdfsWriter().withFileNameFormat(
        new DefaultFileNameFormat()
            .withPath(folder.toString())
            .withExtension(".json")
            .withPrefix("prefix-"));
    WriterConfiguration config =
        new IndexingWriterConfiguration(WRITER_NAME, new IndexingConfigurations());
    writer.init(new HashMap<String, String>(), createTopologyContext(), config);

    JSONObject first = new JSONObject();
    first.put("test.key", "test.value");
    first.put("test.key2", "test.value2");
    JSONObject second = new JSONObject();
    second.put("test.key", "test.value3");
    second.put("test.key2", "test.value2");

    ArrayList<JSONObject> messages = new ArrayList<>();
    messages.add(first);
    messages.add(second);

    writer.write(SENSOR_NAME, config, new ArrayList<Tuple>(), messages);
    writer.close();

    List<String> expected = new ArrayList<>();
    expected.add(first.toJSONString());
    expected.add(second.toJSONString());
    Collections.sort(expected);

    // Without an output function, output goes to the base folder + the sensor name.
    File outputFolder = new File(folder.getAbsolutePath() + "/" + SENSOR_NAME);
    Assert.assertTrue(outputFolder.exists() && outputFolder.isDirectory());

    File[] written = outputFolder.listFiles();
    Assert.assertEquals(1, written.length);
    for (File file : written) {
        // Compare sorted content so line order in the file does not matter.
        List<String> lines = Files.readAllLines(file.toPath());
        Collections.sort(lines);
        Assert.assertEquals(expected, lines);
    }
}
示例15: testWriteSingleFile
import org.apache.storm.hdfs.bolt.format.DefaultFileNameFormat; //导入依赖的package包/类
/**
 * Writes two messages sharing the same {@code test.key} value and checks that
 * both end up in a single file under {@code test-test.value/test.value/}.
 */
@Test
@SuppressWarnings("unchecked")
public void testWriteSingleFile() throws Exception {
    WriterConfiguration config =
        buildWriterConfiguration("FORMAT('test-%s/%s', test.key, test.key)");
    HdfsWriter writer = new HdfsWriter().withFileNameFormat(
        new DefaultFileNameFormat()
            .withPath(folder.toString())
            .withExtension(".json")
            .withPrefix("prefix-"));
    writer.init(new HashMap<String, String>(), createTopologyContext(), config);

    // Both messages carry the same test.key, so they are routed to the same folder.
    JSONObject first = new JSONObject();
    first.put("test.key", "test.value");
    first.put("test.key2", "test.value2");
    JSONObject second = new JSONObject();
    second.put("test.key", "test.value");
    second.put("test.key3", "test.value2");

    ArrayList<JSONObject> messages = new ArrayList<>();
    messages.add(first);
    messages.add(second);

    writer.write(SENSOR_NAME, config, new ArrayList<Tuple>(), messages);
    writer.close();

    List<String> expected = new ArrayList<>();
    expected.add(first.toJSONString());
    expected.add(second.toJSONString());
    Collections.sort(expected);

    File outputFolder = new File(folder.getAbsolutePath() + "/test-test.value/test.value/");
    Assert.assertTrue(outputFolder.exists() && outputFolder.isDirectory());

    File[] written = outputFolder.listFiles();
    Assert.assertEquals(1, written.length);
    for (File file : written) {
        // Compare sorted content so line order in the file does not matter.
        List<String> lines = Files.readAllLines(file.toPath());
        Collections.sort(lines);
        Assert.assertEquals(expected, lines);
    }
}