-
Notifications
You must be signed in to change notification settings - Fork 4
/
Copy pathreport-mixed-content.js
executable file
·121 lines (94 loc) · 3.56 KB
/
report-mixed-content.js
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
#!/usr/bin/env phantomjs --disk-cache=true --ignore-ssl-errors=false --load-images=true --output-encoding=utf-8
'use strict';
var system = require('system'),
webpage = require('webpage');
var args = system.args,
URLs = [];
args.slice(1).forEach(function(url) {
if (url.substr(0, 8) !== 'https://') {
console.debug('Rewriting HTTP URL to use HTTPS:', url);
url = url.replace('http:', 'https:');
}
URLs.push(url);
});
if (URLs.length < 1) {
console.log('Usage:', args[0], 'URL [URL2]');
phantom.exit(1);
}
function initPage() {
var page = new WebPage();
page.onResourceRequested = function(requestData, networkRequest) {
var originalURL = currentURL = requestData.url;
var currentPageURL = page.url || page.originalURL;
if (originalURL.match(/^http:\/\/cdn\.loc\.gov/)) {
currentURL = originalURL.replace('http://cdn.loc.gov', 'https://cdn.loc.gov');
console.log('🔸 ', currentPageURL, 'rewrote insecure CDN resource to:', currentURL);
networkRequest.changeUrl(newURL);
}
if (currentURL.substr(0, 8) !== 'https://' && currentURL.substr(0, 5) !== 'data:') {
console.log('❗️ ', currentPageURL, 'loaded an insecure resource:', originalURL);
}
};
page.onError = function (msg, trace) {
logError('🌋 Page error:', msg);
trace.forEach(function(item) {
logError(' ', item.file, ':', item.line);
});
};
page.onConsoleMessage = function(msg) {
if (msg == 'GOTO_NEXT_PAGE') {
page.close();
crawlNextPage();
} else if (msg.indexOf('insecure content from') >= 0) {
// We can format WebKit's native error messages nicely:
console.log('❕ ', msg.trim().replace('The page at ', ''));
} else {
console.log('\t💻', msg);
}
};
return page;
}
function crawlNextPage() {
if (URLs.length < 1) {
console.log('… done!');
phantom.exit();
}
var url = URLs.shift();
var page = initPage();
console.log('Opening', url, '(' + URLs.length + ' remaining)');
page.onInitialized = function() {
page.evaluate(function(startTime) {
/* global window */
// This can happen with things like error pages which have no linked resources to load by the
// time that our JavaScript starts executing:
if (document.readyState == 'complete') {
console.log('GOTO_NEXT_PAGE');
}
document.addEventListener('DOMContentLoaded', function() {
console.log('DOMContentLoaded', ((Date.now() - startTime) / 1000).toFixed(3) + 's');
});
window.addEventListener('load', function() {
console.log('load', ((Date.now() - startTime) / 1000).toFixed(3) + 's');
window.setTimeout(function () {
console.log('GOTO_NEXT_PAGE');
}, 500);
});
window.setTimeout(function () {
console.log('👎 Aborting page load after one minute');
console.log('GOTO_NEXT_PAGE');
}, 60 * 1000);
}, Date.now());
};
page.originalURL = url;
page.open(url, function (status) {
if (status === 'success') {
console.log('✅ ', url);
// Do nothing at this point until the load event fires
} else {
console.log('❌ ', url);
page.close();
crawlNext();
}
});
}
crawlNextPage();