summaryrefslogtreecommitdiff
path: root/crocoite/data/extract-links.js
blob: 5a4f9f02f6766287ecfb5f031ed767309e83c493 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
/*	Extract links from a page
 */

(function () {
/* --- copy&paste from click.js --- */
/*	Element is visible if itself and all of its parents are
 */
function isVisible (o) {
	if (o === null || !(o instanceof Element)) {
		return true;
	}
	let style = window.getComputedStyle (o);
	if ('parentNode' in o) {
		return style.display !== 'none' && isVisible (o.parentNode);
	} else {
		return style.display !== 'none';
	}
}

/*	Elements are considered clickable if they are a) visible and b) not
 *	disabled
 */
function isClickable (o) {
	return !o.hasAttribute ('disabled') && isVisible (o);
}
/* --- end copy&paste */

let ret = [];
['a[href]', 'area[href]'].forEach (function (s) {
	let x = document.querySelectorAll(s);
	for (let i=0; i < x.length; i++) {
		if (isClickable (x[i])) {
			ret.push (x[i].href);
		}
	}
});

/* If Chrome loads plain-text documents it’ll wrap them into <pre>. Check those
 * for links as well, assuming the whole line is a link (i.e. list of links). */
let x = document.querySelectorAll ('body > pre');
for (let i=0; i < x.length; i++) {
	if (isVisible (x[i])) {
		x[i].innerText.split ('\n').forEach (function (s) {
			if (s.match ('^https?://')) {
				ret.push (s);
			}
		});
	}
}
return ret; /* immediately return results, for use with Runtime.evaluate() */
})();