ScreenCaptureHtmlUnitDriver.java

https://github.com/apache/incubator-zeppelin/blob/master/zeppelin-server/src/test/java/com/webautomation/ScreenCaptureHtmlUnitDriver.java

http://stackoverflow.com/questions/36254656/not-able-to-take-screenshot-using-htmlunitdriver-selenium-webdriver-java

/*
	* Licensed to the Apache Software Foundation (ASF) under one or more
	* contributor license agreements. See the NOTICE file distributed with
	* this work for additional information regarding copyright ownership.
	* The ASF licenses this file to You under the Apache License, Version 2.0
	* (the "License"); you may not use this file except in compliance with
	* the License. You may obtain a copy of the License at
	*
	* http://www.apache.org/licenses/LICENSE-2.0
	*
	* Unless required by applicable law or agreed to in writing, software
	* distributed under the License is distributed on an "AS IS" BASIS,
	* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
	* See the License for the specific language governing permissions and
	* limitations under the License.
	*/

	package com.webautomation;

	import java.io.ByteArrayOutputStream;
	import java.io.File;
	import java.io.FileOutputStream;
	import java.io.IOException;
	import java.net.URL;
	import java.util.Collections;
	import java.util.HashMap;
	import java.util.Iterator;
	import java.util.LinkedList;
	import java.util.List;
	import java.util.Map;
	import java.util.regex.Matcher;
	import java.util.regex.Pattern;
	import java.util.zip.ZipEntry;
	import java.util.zip.ZipOutputStream;

	import org.apache.commons.io.FilenameUtils;
	import org.apache.commons.io.IOUtils;
	import org.openqa.selenium.Capabilities;
	import org.openqa.selenium.OutputType;
	import org.openqa.selenium.TakesScreenshot;
	import org.openqa.selenium.WebDriverException;
	import org.openqa.selenium.htmlunit.HtmlUnitDriver;
	import org.openqa.selenium.internal.Base64Encoder;
	import org.openqa.selenium.remote.CapabilityType;
	import org.openqa.selenium.remote.DesiredCapabilities;

	import com.gargoylesoftware.htmlunit.BrowserVersion;
	import com.gargoylesoftware.htmlunit.WebClient;
	import com.gargoylesoftware.htmlunit.WebRequest;
	import com.gargoylesoftware.htmlunit.WebWindow;
	import com.gargoylesoftware.htmlunit.html.HtmlElement;
	import com.gargoylesoftware.htmlunit.html.HtmlPage;
	import org.slf4j.Logger;
	import org.slf4j.LoggerFactory;

	/**
	* from https://code.google.com/p/selenium/issues/detail?id=1361
	*/
	public class ScreenCaptureHtmlUnitDriver extends HtmlUnitDriver implements TakesScreenshot {

	private static Map<String, byte[]> imagesCache = Collections.synchronizedMap(new HashMap<String, byte[]>());

	private static Map<String, String> cssjsCache = Collections.synchronizedMap(new HashMap<String, String>());

	// http://stackoverflow.com/questions/4652777/java-regex-to-get-the-urls-from-css
	private final static Pattern cssUrlPattern = Pattern.compile("background(-image)?[\\s]:[^url]url[\\s]\\([\\s]([^\\)])[\\s]\\)[\\s]*");// ?<url>

	static Logger LOGGER = LoggerFactory.getLogger(ScreenCaptureHtmlUnitDriver.class);

	public ScreenCaptureHtmlUnitDriver() {
	super();
	}

	public ScreenCaptureHtmlUnitDriver(boolean enableJavascript) {
	super(enableJavascript);
	}

	public ScreenCaptureHtmlUnitDriver(Capabilities capabilities) {
	super(capabilities);
	}

	public ScreenCaptureHtmlUnitDriver(BrowserVersion version) {
	super(version);
	DesiredCapabilities var = ((DesiredCapabilities) getCapabilities());
	var.setCapability(CapabilityType.TAKES_SCREENSHOT, true);
	}

	@Override
	@SuppressWarnings("unchecked")
	public <X> X getScreenshotAs(OutputType<X> target) throws WebDriverException {
	byte[] archive = new byte[0];
	try {
	archive = downloadCssAndImages(getWebClient(), (HtmlPage) getCurrentWindow().getEnclosedPage());
	} catch (Exception e) {
	LOGGER.error("Exception in ScreenCaptureHtmlUnitDriver while getScreenshotAs ", e);
	}
	if(target.equals(OutputType.BASE64)){
	return target.convertFromBase64Png(new Base64Encoder().encode(archive));
	}
	if(target.equals(OutputType.FILE)){
	File f = new File("screen.tmp");
	try {
	FileOutputStream scr = new FileOutputStream(f);
	scr.write(archive);
	scr.close();
	} catch (IOException e) {
	throw new WebDriverException(e);
	}
	return (X) f;
	}
	return (X) archive;
	}

	// http://stackoverflow.com/questions/2244272/how-can-i-tell-htmlunits-webclient-to-download-images-and-css
	protected byte[] downloadCssAndImages(WebClient webClient, HtmlPage page) throws Exception {
	WebWindow currentWindow = webClient.getCurrentWindow();
	Map<String, String> urlMapping = new HashMap<String, String>();
	Map<String, byte[]> files = new HashMap<String, byte[]>();
	WebWindow window = null;
	try {
	window = webClient.getWebWindowByName(page.getUrl().toString()+"_screenshot");
	webClient.getPage(window, new WebRequest(page.getUrl()));
	} catch (Exception e) {
	LOGGER.error("Exception in ScreenCaptureHtmlUnitDriver while downloadCssAndImages ", e);
	window = webClient.openWindow(page.getUrl(), page.getUrl().toString()+"_screenshot");
	}

	String xPathExpression = "//*[name() = 'img' or name() = 'link' and (@type = 'text/css' or @type = 'image/x-icon') or @type = 'text/javascript']";
	List<?> resultList = page.getByXPath(xPathExpression);

	Iterator<?> i = resultList.iterator();
	while (i.hasNext()) {
	try {
	HtmlElement el = (HtmlElement) i.next();
	String resourceSourcePath = el.getAttribute("src").equals("") ? el.getAttribute("href") : el
	.getAttribute("src");
	if (resourceSourcePath == null \|\| resourceSourcePath.equals(""))
	continue;
	URL resourceRemoteLink = page.getFullyQualifiedUrl(resourceSourcePath);
	String resourceLocalPath = mapLocalUrl(page, resourceRemoteLink, resourceSourcePath, urlMapping);
	urlMapping.put(resourceSourcePath, resourceLocalPath);
	if (!resourceRemoteLink.toString().endsWith(".css")) {
	byte[] image = downloadImage(webClient, window, resourceRemoteLink);
	files.put(resourceLocalPath, image);
	} else {
	String css = downloadCss(webClient, window, resourceRemoteLink);
	for (String cssImagePath : getLinksFromCss(css)) {
	URL cssImagelink = page.getFullyQualifiedUrl(cssImagePath.replace("\"", "").replace("\'", "")
	.replace(" ", ""));
	String cssImageLocalPath = mapLocalUrl(page, cssImagelink, cssImagePath, urlMapping);
	files.put(cssImageLocalPath, downloadImage(webClient, window, cssImagelink));
	}
	files.put(resourceLocalPath, replaceRemoteUrlsWithLocal(css, urlMapping)
	.replace("resources/", "./").getBytes());
	}
	} catch (Exception e) {
	LOGGER.error("Exception in ScreenCaptureHtmlUnitDriver while resultList.iterator ", e);
	}
	}
	String pagesrc = replaceRemoteUrlsWithLocal(page.getWebResponse().getContentAsString(), urlMapping);
	files.put("page.html", pagesrc.getBytes());
	webClient.setCurrentWindow(currentWindow);
	return createZip(files);
	}

	String downloadCss(WebClient webClient, WebWindow window, URL resourceUrl) throws Exception {
	if (cssjsCache.get(resourceUrl.toString()) == null) {
	cssjsCache.put(resourceUrl.toString(), webClient.getPage(window, new WebRequest(resourceUrl))
	.getWebResponse().getContentAsString());

	}
	return cssjsCache.get(resourceUrl.toString());
	}

	byte[] downloadImage(WebClient webClient, WebWindow window, URL resourceUrl) throws Exception {
	if (imagesCache.get(resourceUrl.toString()) == null) {
	imagesCache.put(
	resourceUrl.toString(),
	IOUtils.toByteArray(webClient.getPage(window, new WebRequest(resourceUrl)).getWebResponse()
	.getContentAsStream()));
	}
	return imagesCache.get(resourceUrl.toString());
	}

	public static byte[] createZip(Map<String, byte[]> files) throws IOException {
	ByteArrayOutputStream bos = new ByteArrayOutputStream();
	ZipOutputStream zipfile = new ZipOutputStream(bos);
	Iterator<String> i = files.keySet().iterator();
	String fileName = null;
	ZipEntry zipentry = null;
	while (i.hasNext()) {
	fileName = i.next();
	zipentry = new ZipEntry(fileName);
	zipfile.putNextEntry(zipentry);
	zipfile.write(files.get(fileName));
	}
	zipfile.close();
	return bos.toByteArray();
	}

	List<String> getLinksFromCss(String css) {
	List<String> result = new LinkedList<String>();
	Matcher m = cssUrlPattern.matcher(css);
	while (m.find()) { // find next match
	result.add( m.group(2));
	}
	return result;
	}

	String replaceRemoteUrlsWithLocal(String source, Map<String, String> replacement) {
	for (String object : replacement.keySet()) {
	// background:url(http://org.com/images/image.gif)
	source = source.replace(object, replacement.get(object));
	}
	return source;
	}

	String mapLocalUrl(HtmlPage page, URL link, String path, Map<String, String> replacementToAdd) throws Exception {
	String resultingFileName = "resources/" + FilenameUtils.getName(link.getFile());
	replacementToAdd.put(path, resultingFileName);
	return resultingFileName;
	}

	}

ScreenCaptureHtmlUnitDriver.java的更多相关文章

Spark案例分析
一.需求:计算网页访问量前三名 import org.apache.spark.rdd.RDD import org.apache.spark.{SparkConf, SparkContext} /* ...
故障重现(内存篇2)，JAVA内存不足导致频繁回收和swap引起的性能问题
背景起因: 记起以前的另一次也是关于内存的调优分享下有个系统平时运行非常稳定运行(没经历过大并发考验),然而在一次活动后,人数并发一上来后,系统开始卡. 我按经验开始调优,在每个关键步骤的加入如 ...
Elasticsearch之java的基本操作一
摘要接触ElasticSearch已经有一段了.在这期间,遇到很多问题,但在最后自己的不断探索下解决了这些问题.看到网上或多或少的都有一些介绍ElasticSearch相关知识的文档,但个人觉得 ...
论：开发者信仰之“天下IT是一家“(Java .NET篇)
比尔盖茨公认的IT界领军人物,打造了辉煌一时的PC时代. 2008年,史蒂夫鲍尔默接替了盖茨的工作,成为微软公司的总裁. 2013年他与微软做了最后的道别. 2013年以后,我才真正看到了微软的变化. ...
故障重现, JAVA进程内存不够时突然挂掉模拟
背景,服务器上的一个JAVA服务进程突然挂掉,查看产生了崩溃日志,如下: # Set larger code cache with -XX:ReservedCodeCacheSize= # This ...
死磕内存篇 --- JAVA进程和linux内存间的大小关系
运行个JAVA 用sleep去hold住 package org.hjb.test; public class TestOnly { public static void main(String[] ...
【小程序分享篇一】开发了个JAVA小程序，用于清除内存卡或者U盘里的垃圾文件非常有用
有一种场景, 手机内存卡空间被用光了,但又不知道哪个文件占用了太大,一个个文件夹去找又太麻烦,所以我开发了个小程序把手机所有文件(包括路径下所有层次子文件夹下的文件)进行一个排序,这样你就可以找出哪个 ...
Java多线程基础学习（二）
9. 线程安全/共享变量——同步当多个线程用到同一个变量时,在修改值时存在同时修改的可能性,而此时该变量只能被赋值一次.这就会导致出现“线程安全”问题,这个被多个线程共用的变量称之为“共享变量”. ...
Java多线程基础学习（一）
1. 创建线程 1.1 通过构造函数:public Thread(Runnable target, String name){} 或:public Thread(Runnable target ...

随机推荐

hdu_2243_考研路茫茫——单词情结(AC自动机+矩阵)
题目链接:hdu_2243_考研路茫茫——单词情结题意: 让你求包含这些模式串并且长度不小于L的单词种类题解: 这题是poj2788的升级版,没做过的强烈建议先做那题. 我们用poj2778的方法 ...
开源日志系统比较：scribe、chukwa、kafka、flume
1. 背景介绍许多公司的平台每天会产生大量的日志(一般为流式数据,如,搜索引擎的pv,查询等),处理这些日志需要特定的日志系统,一般而言,这些系统需要具有以下特征: (1) 构建应用系统和分析系统的 ...
find the closest sum to a target value
problem: given an array of integers including positive and negative, a target value. find 2 numbers ...
解决Xcode 9.2系统真机测试时出现 could not find developer disk image问题
解决Xcode在ipad/iphone 9.2 系统真机测试时出现could not find developer disk image问题第一种方法:拷贝这个文件(http://download. ...
JS-如何把字符串转换成数组
var a = "1,22,33,44"; // 字符串 var b = a.split(","); // 将字符串按照","分割,存入数组 ...
【最短路】 poj 2387
#include <iostream> #include <stdlib.h> #include <limits.h> #include <string.h& ...
JS动态引入js、CSS动态创建script/link/style标签
一.动态创建link方式我们可以使用link的方式.如下代码所示. function addCssByLink(url){ var doc=document; var link=doc.create ...
Android开发 R cannot be resolved to a variable问题的分析
R文件是系统自动生成的,如果没出现的话,你的XML文件是不是有错误?是否之前修改过res文件夹下面.xml文件 R文件没有生成的情况有几种: 1.项目没有自动编译:这种时候只需要简单的编译一下工程就会 ...
Linux -- 统计文件的行数
统计单个文件有多少行方法1: awk '{print NR}' test1.sh|tail -n1 方法2: awk 'END{print NR}' test1.sh 方法3: grep -n &q ...
Android平台设计规范整理(尺寸+组成元素+字体+滑块)
转自:http://www.ui.cn/project.php?id=12394

ScreenCaptureHtmlUnitDriver.java

ScreenCaptureHtmlUnitDriver.java的更多相关文章

随机推荐

热门专题