基于phantomjs的截图优化JS信息

星期三, 2023-04-05 | Author: Lee | computer, JAVA-and-J2EE, linux | 411 views

phantomjs是比较老的一种模拟抓取及截图,这个是以前处理截图的一种优化js信息做个留档

以后应该是不用了

img.js和rasterize.js两个文件

1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
var page = require('webpage').create(), system = require('system'), address, output, size;
 
if (system.args.length < 3 || system.args.length > 5) {
    phantom.exit(1);
} else {
    address = system.args[1];
    output = system.args[2];
    //定义宽高
   /* page.viewportSize = {
        width : 1024,
        height : 768
    };*/
    page.open(address, function(status) {
        var bb = page.evaluate(function() {
            return document.getElementsByTagName('html')[0].getBoundingClientRect();
        });
        page.clipRect = {
            top : bb.top,
            left : bb.left,
            width : bb.width,
            height : bb.height
        };
        window.setTimeout(function() {
            page.render(output);
            page.close();
            console.log('渲染成功...');
            console.log(address);
            phantom.exit();
        }, 1000);
    });
}


rasterize.js

1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
var page = require('webpage').create();
var system = require('system');
var address, output, size;
 
if (system.args.length < 3 || system.args.length > 7) {
	console.log('Usage: rasterize.js URL filename paperwidth*paperheight|paperformat portrait|landscape margin zoomfactor');
	console.log('  paperwidth*paperheight|paperformat examples: "5in*7.5in", "10cm*20cm", "A4", "Letter"');
	console.log('  margin examples: "1cm", "2in"');
	phantom.exit(1);
} else {
	address = system.args[1];
	output = system.args[2];
	page.viewportSize = { width: 800, height: 800 };
	//size
	size = system.args[3].split('*');
	page.paperSize =
		size.length === 2 ?
		{ width: size[0], height: size[1], orientation: system.args[4], margin: system.args[5] } :
		{ format: system.args[3], orientation: system.args[4], margin: system.args[5] };
    page.zoomFactor = Number(system.args[6]);
	var statusCode;
 
	page.onResourceReceived = function (resource) {
		if (resource.url === address) {
			statusCode = resource.status;
		}
	};
	page.open(address, function (status) {
 
		if (status !== 'success') {
			console.error('Unable to load the address (' + statusCode + '): ' + address, status);
			return phantom.exit(100);
		} else {
			if (page.evaluate(function () {
				return typeof html2pdf === 'object';
			})) {
				var paperSize = page.paperSize;
				setUpHeaderOrFooter('header');
				setUpHeaderOrFooter('footer');
				page.paperSize = paperSize;
			}
			return window.setTimeout(function () {
				page.render(output);
				phantom.exit();
			}, 1000);
		}
 
		function setUpHeaderOrFooter(headerOrFooter) {
			var hasHeaderOrFooter = page.evaluate(function (headerOrFooter) {
				return typeof html2pdf[headerOrFooter] === 'object';
			}, headerOrFooter);
			if (hasHeaderOrFooter) {
				var height, contents;
				var typeOfHeight = page.evaluate(function (headerOrFooter) {
					return html2pdf[headerOrFooter].height && typeof html2pdf[headerOrFooter].height;
				}, headerOrFooter);
				if (typeOfHeight === 'string') {
					height = page.evaluate(function (headerOrFooter) {
						return html2pdf[headerOrFooter].height;
					}, headerOrFooter);
				} else {
					console.error('html2pdf.' + headerOrFooter + '.height has wrong type: ' + typeOfHeight);
					return phantom.exit(100);
				}
				var typeOfContent = page.evaluate(function (headerOrFooter) {
					return html2pdf[headerOrFooter].contents && typeof html2pdf[headerOrFooter].contents;
				}, headerOrFooter);
				if (typeOfContent === 'string' || typeOfContent === 'function') {
					contents = phantom.callback(function (pageNum, numPages) {
						return getHtmlWithStyles(headerOrFooter, pageNum, numPages);
					});
				} else {
					console.error('html2pdf.' + headerOrFooter + '.contents has wrong type: ' + typeOfContent);
					return phantom.exit(100);
				}
				paperSize[headerOrFooter] = {
					height: height,
					contents: contents
				};
				return null;
			}
		}
 
		function getHtmlWithStyles(headerOrFooter, pageNumber, totalPages) {
			return page.evaluate(function (headerOrFooter, pageNumber, totalPages) {
				var contents = html2pdf[headerOrFooter].contents;
				var html = typeof contents === 'string' ?
					contents :
					html2pdf[headerOrFooter].contents(pageNumber, totalPages);
				html = html
					.replace(/\{\{pagenumber\}\}/gi, pageNumber)
					.replace(/\{\{totalpages\}\}/gi, totalPages);
 
				//Style/footer/Header super-container
				var superHost = document.createElement('div');
				superHost.innerHTML = html;
 
				// Styles will be placed before this element. First styles, then foorter/header elements
				var stylesGoesBefore = superHost.firstChild;
 
				var addStyle = function (styleStr) {
					var newStyle = document.createElement('style');
					newStyle.setAttribute('type', 'text/css');
					newStyle.innerHTML = styleStr;
					stylesGoesBefore.insertBefore( newStyle );
				};
 
				// https://developer.mozilla.org/en-US/docs/Web/API/document.styleSheets
				// https://developer.mozilla.org/en-US/docs/Web/API/StyleSheet.ownerNode
				for (var i = 0; i < document.styleSheets.length; i++) {
					var styleSheet = document.styleSheets[i];
 
					// CSS from style html element
					if (styleSheet.ownerNode.nodeName.toLowerCase() === 'style') {
						var cssStr = styleSheet.ownerNode.innerHTML;
						addStyle( cssStr );
 
					// CSS from link html element
					} else if (styleSheet.ownerNode.nodeName.toLowerCase() === 'link') {
						var xhReq = new XMLHttpRequest();
						xhReq.open('GET', styleSheet.href, false);
						xhReq.send(null);
						var serverResponse = xhReq.responseText;
						addStyle( serverResponse );
					}
				}
 
				return superHost.outerHTML;
			}, headerOrFooter, pageNumber, totalPages);
		}
	});
}

Tags:

文章作者: Lee

本文地址: https://www.pomelolee.com/2349.html

除非注明,Pomelo Lee文章均为原创,转载请以链接形式标明本文地址

No comments yet.

Leave a comment

Search

文章分类

Links

Meta