当前位置: 首页>>代码示例>>Java>>正文


Java CrawljaxConfigurationBuilder.addPlugin方法代码示例

本文整理汇总了Java中com.crawljax.core.configuration.CrawljaxConfiguration.CrawljaxConfigurationBuilder.addPlugin方法的典型用法代码示例。如果您正苦于以下问题:Java CrawljaxConfigurationBuilder.addPlugin方法的具体用法?Java CrawljaxConfigurationBuilder.addPlugin怎么用?Java CrawljaxConfigurationBuilder.addPlugin使用的例子?那么恭喜您, 这里精选的方法代码示例或许可以为您提供帮助。您也可以进一步了解该方法所在com.crawljax.core.configuration.CrawljaxConfiguration.CrawljaxConfigurationBuilder的用法示例。


在下文中一共展示了CrawljaxConfigurationBuilder.addPlugin方法的9个代码示例,这些例子默认根据受欢迎程度排序。您可以为喜欢或者感觉有用的代码点赞,您的评价将有助于系统推荐出更棒的Java代码示例。

示例1: main

import com.crawljax.core.configuration.CrawljaxConfiguration.CrawljaxConfigurationBuilder; //导入方法依赖的package包/类
public static void main(String[] args) {

		CrawljaxConfigurationBuilder builder =
		        CrawljaxConfiguration.builderFor("http://demo.crawljax.com/");
		builder.addPlugin(new OnNewStatePlugin() {

			@Override
			public void onNewState(CrawlerContext context, StateVertex newState) {
				// This will print the DOM when a new state is detected. You should see it in your
				// console.
				LOG.info("Found a new dom! Here it is:\n{}", context.getBrowser().getStrippedDom());
			}

			@Override
			public String toString() {
				return "Our example plugin";
			}
		});
		CrawljaxRunner crawljax = new CrawljaxRunner(builder.build());
		crawljax.call();
	}
 
开发者ID:aminmf,项目名称:crawljax,代码行数:22,代码来源:PluginExample.java

示例2: main

import com.crawljax.core.configuration.CrawljaxConfiguration.CrawljaxConfigurationBuilder; //导入方法依赖的package包/类
/**
 * Run this method to start the crawl.
 */
public static void main(String[] args) {
	CrawljaxConfigurationBuilder builder =
	        CrawljaxConfiguration.builderFor("http://demo.crawljax.com/");

	// Add the invariant that checks that the string isn't present.
	builder.crawlRules().addInvariant(
	        "Detect a string",
	        new NotRegexCondition(
	                "Invariants can be used to perform tests on the current state"));

	// This plugin will just print the error.
	builder.addPlugin(new OnInvariantViolationPlugin() {

		@Override
		public void onInvariantViolation(Invariant invariant, CrawlerContext context) {
			LOG.error("\n\n!!! Invariant {} violated !!!\n", invariant);
		}

	});

	CrawljaxRunner crawljax = new CrawljaxRunner(builder.build());
	crawljax.call();
}
 
开发者ID:aminmf,项目名称:crawljax,代码行数:27,代码来源:InvariantExample.java

示例3: main

import com.crawljax.core.configuration.CrawljaxConfiguration.CrawljaxConfigurationBuilder; //导入方法依赖的package包/类
/**
 * Entry point
 */
public static void main(String[] args) {
	CrawljaxConfigurationBuilder builder = CrawljaxConfiguration.builderFor(URL);
	builder.crawlRules().insertRandomDataInInputForms(false);

	builder.crawlRules().click("a");
	builder.crawlRules().click("button");

	// except these
	builder.crawlRules().dontClick("a").underXPath("//DIV[@id='guser']");
	builder.crawlRules().dontClick("a").withText("Language Tools");

	// limit the crawling scope
	builder.setMaximumStates(MAX_NUMBER_STATES);
	builder.setMaximumDepth(MAX_DEPTH);

	builder.addPlugin(new SamplePlugin());

	builder.crawlRules().setInputSpec(getInputSpecification());

	CrawljaxRunner crawljax = new CrawljaxRunner(builder.build());
	crawljax.call();
}
 
开发者ID:aminmf,项目名称:crawljax,代码行数:26,代码来源:Runner.java

示例4: addPlugins

import com.crawljax.core.configuration.CrawljaxConfiguration.CrawljaxConfigurationBuilder; //导入方法依赖的package包/类
/**
 * Add the plugins to the given crawljaxConfiguration.
 * 
 * @param crawljaxConfiguration
 *            the configuration to add the plugins to.
 */
protected static void addPlugins(CrawljaxConfigurationBuilder crawljaxConfiguration) {
	crawljaxConfiguration.addPlugin(new PostCrawlStateGraphChecker());

	crawljaxConfiguration.addPlugin(new OnInvariantViolationPlugin() {

		@Override
		public void onInvariantViolation(Invariant invariant, CrawlerContext context) {
			LargeTestBase.violatedInvariants.add(invariant);
			if (context.getBrowser().getStrippedDom().contains(INVARIANT_TEXT)) {
				violatedInvariantStateIsCorrect = true;
				LOG.warn("Invariant violated: " + invariant.getDescription());
			}
		}

	});
}
 
开发者ID:aminmf,项目名称:crawljax,代码行数:23,代码来源:LargeTestBase.java

示例5: newCrawlConfigurationBuilder

import com.crawljax.core.configuration.CrawljaxConfiguration.CrawljaxConfigurationBuilder; //导入方法依赖的package包/类
/**
 * Override this method to specify a different configuration.
 * 
 * @return a new {@link CrawljaxConfiguration} to crawl with.
 */
protected CrawljaxConfigurationBuilder newCrawlConfigurationBuilder() {
	CrawljaxConfigurationBuilder builder = CrawljaxConfiguration.builderFor(getUrl());
	builder.crawlRules().clickDefaultElements();
	builder.setUnlimitedRuntime();
	builder.setUnlimitedCrawlDepth();
	builder.addPlugin(new PostCrawlStateGraphChecker());
	return builder;
}
 
开发者ID:aminmf,项目名称:crawljax,代码行数:14,代码来源:BaseCrawler.java

示例6: setup

import com.crawljax.core.configuration.CrawljaxConfiguration.CrawljaxConfigurationBuilder; //导入方法依赖的package包/类
@Before
public void setup() {

	CrawljaxConfigurationBuilder builder = SERVER.newConfigBuilder("crawler/index.html");
	builder.addPlugin(new PreStateCrawlingPlugin() {

		@Override
		public void preStateCrawling(CrawlerContext session,
		        ImmutableList<CandidateElement> candidateElements, StateVertex state) {
			for (CandidateElement candidate : candidateElements) {
				HTMLAnchorElementImpl impl = (HTMLAnchorElementImpl) candidate.getElement();
				impl.setName("fail");
				impl.setId("eventually");
				impl.setHref("will");
				impl.setTextContent("This");
				candidate.getIdentification().setValue("/HTML[1]/BODY[1]/FAILED[1]/A[1]");
			}
		}
	});
	builder.addPlugin(new OnFireEventFailedPlugin() {
		@Override
		public void onFireEventFailed(CrawlerContext context, Eventable eventable,
		        List<Eventable> pathToFailure) {
			hits.incrementAndGet();
		}
	});

	controller = new CrawljaxRunner(builder.build());
}
 
开发者ID:aminmf,项目名称:crawljax,代码行数:30,代码来源:OnFireEventFailedPluginTest.java

示例7: configureCrawljax

import com.crawljax.core.configuration.CrawljaxConfiguration.CrawljaxConfigurationBuilder; //导入方法依赖的package包/类
/**
 * Set Crawljax configuration here
 * @param builder
 */
private void configureCrawljax(CrawljaxConfigurationBuilder builder) {
	
	CSSCatcher cssCatcher = new CSSCatcher();
	cssCatcher.setOutputFolder(outputFolder + "css/");
	
	builder.addPlugin(new CrawlOverview());
	builder.addPlugin(cssCatcher);
	
	//builder.addPlugin(new LoginPlugin());
	
	//builder.crawlRules().clickDefaultElements();
	//builder.crawlRules().dontClick("input").withAttribute("value", "I don't recognize");
	//builder.crawlRules().click("input").withAttribute("type", "submit");
	//builder.crawlRules().dontClick("a").underXPath("//*[@id='pageFooter']");
	//builder.crawlRules().dontClick("a").underXPath("//*[@id='content']/div/div[2]");
	//System.getProperties().setProperty("webdriver.chrome.driver", "chromedriver.exe");
	//builder.setBrowserConfig(new BrowserConfiguration(BrowserType.CHROME, 2));
	builder.setBrowserConfig(new BrowserConfiguration(BrowserType.FIREFOX, 1));
	builder.crawlRules().insertRandomDataInInputForms(false);
	builder.crawlRules().clickElementsInRandomOrder(false);
	builder.crawlRules().crawlFrames(true);
	builder.crawlRules().dontClick("*");
	
	//com.crawljax.browser.WebDriverBackedEmbeddedBrowser s;
	
	builder.setOutputDirectory(new File(outputFolder + "/crawljax"));
					
	builder.setMaximumDepth(1);
	builder.setMaximumStates(2);
	
	builder.crawlRules().waitAfterReloadUrl(20, TimeUnit.MILLISECONDS);
	builder.crawlRules().waitAfterEvent(200, TimeUnit.MILLISECONDS);
	
}
 
开发者ID:dmazinanian,项目名称:css-analyser,代码行数:39,代码来源:Crawler.java

示例8: main

import com.crawljax.core.configuration.CrawljaxConfiguration.CrawljaxConfigurationBuilder; //导入方法依赖的package包/类
/**
 * Run this method to start the crawl.
 * 
 * @throws IOException
 *             when the output folder cannot be created or emptied.
 */
public static void main(String[] args) throws IOException {
	CrawljaxConfigurationBuilder builder = CrawljaxConfiguration.builderFor(URL);
	builder.crawlRules().insertRandomDataInInputForms(false);
	builder.setMaximumRunTime(100, TimeUnit.SECONDS);


	// click these elements
	builder.crawlRules().clickDefaultElements();
	builder.crawlRules().click("div").withAttribute("class", "clickable");

	// but don't click these
	builder.crawlRules().dontClick("a").withAttribute("class", "ignore");
	builder.crawlRules().dontClick("a").underXPath("//DIV[@id='footer']");

	// Set timeouts
	builder.crawlRules().waitAfterReloadUrl(WAIT_TIME_AFTER_RELOAD, TimeUnit.MILLISECONDS);
	builder.crawlRules().waitAfterEvent(WAIT_TIME_AFTER_EVENT, TimeUnit.MILLISECONDS);

	// Add a condition that this XPath doesn't exits
	builder.crawlRules().addCrawlCondition("No spans with foo as class",
	        new NotXPathCondition("//*[@class='foo']"));

	// Set some input for fields
	builder.crawlRules().setInputSpec(getInputSpecification());

	// This will generate a nice output in the output directory.
	File outFolder = new File("output");
	if (outFolder.exists()) {
		FileUtils.deleteDirectory(outFolder);
	}
	builder.setOutputDirectory(outFolder);
	builder.addPlugin(new CrawlOverview());

	// We want to use two browsers simultaneously.
	builder.setBrowserConfig(new BrowserConfiguration(BrowserType.FIREFOX, 1));

	CrawljaxRunner crawljax = new CrawljaxRunner(builder.build());
	crawljax.call();

}
 
开发者ID:aminmf,项目名称:crawljax,代码行数:47,代码来源:AdvancedExample.java

示例9: readConfig

import com.crawljax.core.configuration.CrawljaxConfiguration.CrawljaxConfigurationBuilder; //导入方法依赖的package包/类
private CrawljaxConfiguration readConfig(String urlValue, String outputDir) {
	CrawljaxConfigurationBuilder builder = CrawljaxConfiguration.builderFor(urlValue);

	builder.setOutputDirectory(new File(outputDir));

	BrowserType browser = BrowserType.FIREFOX;
	if (options.specifiesBrowser()) {
		browser = options.getSpecifiedBrowser();
	}

	int browsers = 1;
	if (options.specifiesParallelBrowsers()) {
		browsers = options.getSpecifiedNumberOfBrowsers();
	}
	if (browser == BrowserType.REMOTE) {
		String remoteUrl = options.getSpecifiedRemoteBrowser();
		builder.setBrowserConfig(BrowserConfiguration.remoteConfig(browsers, remoteUrl));
	} else {
		builder.setBrowserConfig(new BrowserConfiguration(browser, browsers));
	}

	if (options.specifiesDepth()) {
		builder.setMaximumDepth(options.getSpecifiedDepth());
	}

	if (options.specifiesMaxStates()) {
		builder.setMaximumStates(options.getMaxStates());
	}

	if (options.requestsCrawlHiddenAnchors()) {
		builder.crawlRules().crawlHiddenAnchors(true);
	}

	configureTimers(builder);

	builder.addPlugin(new CrawlOverview());

	if (options.specifiesClickElements()) {
		builder.crawlRules().click(options.getSpecifiedClickElements());
	} else {
		builder.crawlRules().clickDefaultElements();
	}

	return builder.build();
}
 
开发者ID:aminmf,项目名称:crawljax,代码行数:46,代码来源:JarRunner.java


注:本文中的com.crawljax.core.configuration.CrawljaxConfiguration.CrawljaxConfigurationBuilder.addPlugin方法示例由纯净天空整理自Github/MSDocs等开源代码及文档管理平台,相关代码片段筛选自各路编程大神贡献的开源项目,源码版权归原作者所有,传播和使用请参考对应项目的License;未经允许,请勿转载。