Revision 96efcc33
Added by koszko over 1 year ago
| content/policy_enforcing.js | ||
|---|---|---|
| 45 | 45 |
|
| 46 | 46 |
#FROM common/misc.js IMPORT gen_nonce, csp_header_regex |
| 47 | 47 |
|
| 48 |
const html_ns = "http://www.w3.org/1999/xhtml"; |
|
| 49 |
const svg_ns = "http://www.w3.org/2000/svg"; |
|
| 50 |
|
|
| 48 | 51 |
document.content_loaded = document.readyState === "complete"; |
| 49 | 52 |
const wait_loaded = e => e.content_loaded ? Promise.resolve() : |
| 50 | 53 |
new Promise(c => e.addEventListener("DOMContentLoaded", c, {once: true}));
|
| ... | ... | |
| 203 | 206 |
*/ |
| 204 | 207 |
if (some_attr_blocked) {
|
| 205 | 208 |
const replacement_elem = document.createElement("a");
|
| 209 |
|
|
| 210 |
/* Prevent this node from being processed by our observer. */ |
|
| 211 |
replacement_elem.haketilo_trusted_node = true; |
|
| 212 |
|
|
| 206 | 213 |
element.replaceWith(replacement_elem); |
| 207 | 214 |
replacement_elem.replaceWith(element); |
| 208 | 215 |
} |
| ... | ... | |
| 221 | 228 |
element.haketilo_sanitized_onevent = true; |
| 222 | 229 |
|
| 223 | 230 |
for (const attribute_node of [...(element.attributes || [])]) {
|
| 224 |
const attr = attribute_node.localName, attr_lo = attr.toLowerCase();;
|
|
| 225 |
if (!/^on/.test(attr_lo) || !(attr_lo in element.wrappedJSObject))
|
|
| 231 |
const attr = attribute_node.localName, attr_lo = attr.toLowerCase(); |
|
| 232 |
if (!/^on/.test(attr_lo) || !(attr_lo in element)) |
|
| 226 | 233 |
continue; |
| 227 | 234 |
|
| 228 | 235 |
/* |
| ... | ... | |
| 246 | 253 |
} |
| 247 | 254 |
#ENDIF |
| 248 | 255 |
|
| 249 |
function start_mo_sanitizing(doc) {
|
|
| 250 |
if (!doc.content_loaded) {
|
|
| 251 |
function mutation_handler(mutation) {
|
|
| 252 |
mutation.addedNodes.forEach(sanitize_element_urls); |
|
| 256 |
/* |
|
| 257 |
* Sanitize elements on-the-fly as they appear using MutationObserver. |
|
| 258 |
* |
|
| 259 |
* Under Abrowser 97 it was observed that MutationObserver does not always work |
|
| 260 |
* as is should. When trying to observe nodes of an XMLDocument the behavior was |
|
| 261 |
* as if the "subtree" option to MutationObserver.observe() was ignored. To work |
|
| 262 |
* around this we avoid using the "subtree" option altogether and have the same |
|
| 263 |
* code work in all scenarios. |
|
| 264 |
*/ |
|
| 265 |
function MOSanitizer(root) {
|
|
| 266 |
this.root = root; |
|
| 267 |
|
|
| 268 |
this.recursively_sanitize(root); |
|
| 269 |
|
|
| 270 |
this.mo = new MutationObserver(ms => this.handle_mutations(ms)); |
|
| 271 |
} |
|
| 272 |
|
|
| 273 |
MOSanitizer.prototype.observe = function() {
|
|
| 274 |
let elem = this.root; |
|
| 275 |
while (elem && !elem.haketilo_trusted_node) {
|
|
| 276 |
this.mo.observe(elem, {childList: true});
|
|
| 277 |
elem = elem.lastElementChild; |
|
| 278 |
} |
|
| 279 |
} |
|
| 280 |
|
|
| 281 |
MOSanitizer.prototype.handle_mutations = function(mutations) {
|
|
| 282 |
for (const mut of mutations) {
|
|
| 283 |
for (const new_node of mut.addedNodes) |
|
| 284 |
this.recursively_sanitize(new_node); |
|
| 285 |
} |
|
| 286 |
|
|
| 287 |
this.mo.disconnect(); |
|
| 288 |
this.observe(); |
|
| 289 |
} |
|
| 290 |
|
|
| 291 |
MOSanitizer.prototype.recursively_sanitize = function(elem) {
|
|
| 292 |
const to_process = [elem]; |
|
| 293 |
|
|
| 294 |
while (to_process.length > 0) {
|
|
| 295 |
const current_elem = to_process.pop(); |
|
| 296 |
|
|
| 297 |
if (current_elem.haketilo_trusted_node || |
|
| 298 |
current_elem.nodeType !== this.root.ELEMENT_NODE) |
|
| 299 |
continue; |
|
| 300 |
|
|
| 301 |
to_process.push(...current_elem.children); |
|
| 302 |
|
|
| 303 |
sanitize_element_urls(current_elem); |
|
| 253 | 304 |
#IF MOZILLA |
| 254 |
mutation.addedNodes.forEach(sanitize_element_onevent);
|
|
| 305 |
sanitize_element_onevent(current_elem);
|
|
| 255 | 306 |
#ENDIF |
| 256 |
} |
|
| 257 |
const mo = new MutationObserver(ms => ms.forEach(mutation_handler)); |
|
| 258 |
mo.observe(doc, {childList: true, subtree: true});
|
|
| 259 |
wait_loaded(doc).then(() => mo.disconnect()); |
|
| 260 | 307 |
} |
| 261 | 308 |
} |
| 262 | 309 |
|
| 310 |
MOSanitizer.prototype.start = function() {
|
|
| 311 |
this.recursively_sanitize(this.root); |
|
| 312 |
this.observe(); |
|
| 313 |
} |
|
| 314 |
|
|
| 315 |
MOSanitizer.prototype.stop = function() {
|
|
| 316 |
this.mo.disconnect(); |
|
| 317 |
} |
|
| 318 |
|
|
| 263 | 319 |
#IF MOZILLA |
| 264 | 320 |
/* |
| 265 | 321 |
* Normally, we block scripts with CSP. However, Mozilla does optimizations that |
| ... | ... | |
| 270 | 326 |
* applying this CSP to non-inline `<scripts>' in certain scenarios. |
| 271 | 327 |
*/ |
| 272 | 328 |
function prevent_script_execution(event) {
|
| 273 |
if (!event.target.haketilo_payload) |
|
| 274 |
event.preventDefault(); |
|
| 329 |
event.preventDefault(); |
|
| 275 | 330 |
} |
| 276 | 331 |
#ENDIF |
| 277 | 332 |
|
| ... | ... | |
| 285 | 340 |
* javascript execution. |
| 286 | 341 |
*/ |
| 287 | 342 |
async function sanitize_document(doc, policy) {
|
| 343 |
const root = doc.documentElement; |
|
| 344 |
const substitute_doc = |
|
| 345 |
new DOMParser().parseFromString("<!DOCTYPE html>", "text/html");
|
|
| 346 |
|
|
| 288 | 347 |
#IF MOZILLA |
| 289 | 348 |
/* |
| 290 | 349 |
* Blocking of scripts that are in the DOM from the beginning. Needed for |
| 291 | 350 |
* Mozilla. |
| 292 | 351 |
*/ |
| 293 | 352 |
const listener_args = ["beforescriptexecute", prevent_script_execution]; |
| 353 |
|
|
| 294 | 354 |
doc.addEventListener(...listener_args); |
| 355 |
substitute_doc.addEventListener(...listener_args); |
|
| 356 |
|
|
| 295 | 357 |
wait_loaded(doc).then(() => doc.removeEventListener(...listener_args)); |
| 296 | 358 |
|
| 297 | 359 |
sanitize_tree_urls(doc.documentElement); |
| 298 | 360 |
sanitize_tree_onevent(doc.documentElement); |
| 299 | 361 |
#ENDIF |
| 300 | 362 |
|
| 363 |
if (!doc.content_loaded) {
|
|
| 364 |
const sanitizer = new MOSanitizer(doc.documentElement); |
|
| 365 |
sanitizer.start(); |
|
| 366 |
wait_loaded(doc).then(() => sanitizer.stop()); |
|
| 367 |
} |
|
| 368 |
|
|
| 301 | 369 |
/* |
| 302 | 370 |
* Ensure our CSP rules are employed from the beginning. This CSP injection |
| 303 | 371 |
* method is, when possible, going to be applied together with CSP rules |
| ... | ... | |
| 322 | 390 |
* Root node gets hijacked now, to be re-attached after <head> is loaded |
| 323 | 391 |
* and sanitized. |
| 324 | 392 |
*/ |
| 325 |
const root = doc.documentElement; |
|
| 326 | 393 |
root.replaceWith(temporary_html); |
| 394 |
#IF MOZILLA |
|
| 395 |
/* |
|
| 396 |
* To be able to handle the onbeforescriptexecute event for scripts that |
|
| 397 |
* appear under detached document. |
|
| 398 |
*/ |
|
| 399 |
substitute_doc.documentElement.replaceWith(root); |
|
| 400 |
#ENDIF |
|
| 327 | 401 |
|
| 328 | 402 |
/* |
| 329 | 403 |
* When we don't inject payload, we neither block document's CSP `<meta>' |
| ... | ... | |
| 336 | 410 |
.forEach(m => sanitize_meta(m, policy)); |
| 337 | 411 |
} |
| 338 | 412 |
|
| 339 |
sanitize_tree_urls(root); |
|
| 340 |
root.querySelectorAll("script").forEach(s => sanitize_script(s, policy));
|
|
| 413 |
const scripts = [...root.getElementsByTagNameNS(html_ns, "script"), |
|
| 414 |
...root.getElementsByTagNameNS(svg_ns, "svg")]; |
|
| 415 |
scripts.forEach(s => sanitize_script(s, policy)); |
|
| 341 | 416 |
temporary_html.replaceWith(root); |
| 342 |
root.querySelectorAll("script").forEach(s => desanitize_script(s, policy));
|
|
| 343 |
#IF MOZILLA |
|
| 344 |
sanitize_tree_onevent(root); |
|
| 345 |
#ENDIF |
|
| 346 |
|
|
| 347 |
start_mo_sanitizing(doc); |
|
| 417 |
scripts.forEach(s => desanitize_script(s, policy)); |
|
| 348 | 418 |
} |
| 349 | 419 |
|
| 350 | 420 |
async function _disable_service_workers() {
|
| test/haketilo_test/data/pages/scripts_to_block_1.html | ||
|---|---|---|
| 29 | 29 |
</script> |
| 30 | 30 |
</head> |
| 31 | 31 |
<body> |
| 32 |
<button id="clickme1" |
|
| 33 |
onclick="window.__run = [...(window.__run || []), 'on'];" |
|
| 34 |
blocked-onclick="some useful data"> |
|
| 35 |
Click Meee! |
|
| 36 |
</button> |
|
| 37 |
<a id="clickme2" |
|
| 38 |
href="javascript:window.__run = [...(window.__run || []), 'href'];void(0);"> |
|
| 39 |
Click Meee! |
|
| 40 |
</a> |
|
| 41 |
<iframe src="javascript:void(window.parent.__run = [...(window.parent.__run || []), 'src']);"> |
|
| 42 |
</iframe> |
|
| 43 |
<object data="javascript:window.__run = [...(window.__run || []), 'data'];"> |
|
| 44 |
</object> |
|
| 32 |
<!-- |
|
| 33 |
Put all objects under a <div> to make sure the Mutation Observer does |
|
| 34 |
indeed correctly report changes in subtrees (there are problems with |
|
| 35 |
this in XML documents). |
|
| 36 |
--> |
|
| 37 |
<div> |
|
| 38 |
<button id="clickme1" |
|
| 39 |
onclick="window.__run = [...(window.__run || []), 'on'];" |
|
| 40 |
blocked-onclick="some useful data"> |
|
| 41 |
Click Meee! |
|
| 42 |
</button> |
|
| 43 |
<a id="clickme2" |
|
| 44 |
href="javascript:window.__run = [...(window.__run || []), 'href'];void(0);"> |
|
| 45 |
Click Meee! |
|
| 46 |
</a> |
|
| 47 |
<iframe src="javascript:void(window.parent.__run = [...(window.parent.__run || []), 'src']);"> |
|
| 48 |
</iframe> |
|
| 49 |
<object data="javascript:window.__run = [...(window.__run || []), 'data'];"> |
|
| 50 |
</object> |
|
| 51 |
</div> |
|
| 45 | 52 |
</body> |
| 46 | 53 |
</html> |
| test/haketilo_test/data/pages/scripts_to_block_2.xml | ||
|---|---|---|
| 1 |
<?xml version="1.0" encoding="UTF-8"?> |
|
| 2 |
<!-- |
|
| 3 |
SPDX-License-Identifier: CC0-1.0 |
|
| 4 |
|
|
| 5 |
A testing XML document with various scripts that need to get blocked. |
|
| 6 |
|
|
| 7 |
This file is part of Haketilo. |
|
| 8 |
|
|
| 9 |
Copyright (C) 2021, 2022 Wojtek Kosior <koszko@koszko.org> |
|
| 10 |
|
|
| 11 |
This program is free software: you can redistribute it and/or modify |
|
| 12 |
it under the terms of the CC0 1.0 Universal License as published by |
|
| 13 |
the Creative Commons Corporation. |
|
| 14 |
|
|
| 15 |
This program is distributed in the hope that it will be useful, |
|
| 16 |
but WITHOUT ANY WARRANTY; without even the implied warranty of |
|
| 17 |
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the |
|
| 18 |
CC0 1.0 Universal License for more details. |
|
| 19 |
--> |
|
| 20 |
|
|
| 21 |
<fruits> |
|
| 22 |
|
|
| 23 |
<!-- |
|
| 24 |
The following will not execute since it is not recognized as either HTML |
|
| 25 |
or SVG script. |
|
| 26 |
--> |
|
| 27 |
<script> |
|
| 28 |
window.__run = [...(window.__run || []), 'banana']; |
|
| 29 |
</script> |
|
| 30 |
|
|
| 31 |
<html:img xmlns:html="http://www.w3.org/1999/xhtml" |
|
| 32 |
src="" |
|
| 33 |
onload="window.__run = [...(window.__run || []), 'melon'];console.log('delme melon')">
|
|
| 34 |
</html:img> |
|
| 35 |
|
|
| 36 |
<!-- Will execute --> |
|
| 37 |
<html:script xmlns:html="http://www.w3.org/1999/xhtml"> |
|
| 38 |
window.__run = [...(window.__run || []), 'grape']; |
|
| 39 |
</html:script> |
|
| 40 |
|
|
| 41 |
<!-- Will also execute --> |
|
| 42 |
<vector-graphics:script xmlns:vector-graphics="http://www.w3.org/2000/svg"> |
|
| 43 |
window.__run = [...(window.__run || []), 'raspberry']; |
|
| 44 |
</vector-graphics:script> |
|
| 45 |
|
|
| 46 |
<apple> |
|
| 47 |
<svg viewBox="0 0 10 14" xmlns="http://www.w3.org/2000/svg"> |
|
| 48 |
<!-- Will run when clicked --> |
|
| 49 |
<circle id="idaret_circle" cx="5" cy="5" r="4" |
|
| 50 |
onclick="window.__run = [...(window.__run || []), 'idaret'];" /> |
|
| 51 |
<!-- Will *NOT* run when clicked --> |
|
| 52 |
<circle id="nowamak_circle" cx="5" cy="13" r="4" |
|
| 53 |
some-unknown:onclick="window.__run = [...(window.__run || []), 'nowamak'];" |
|
| 54 |
xmlns:some-unknown="https://example.org/blah/blah" /> |
|
| 55 |
</svg> |
|
| 56 |
</apple> |
|
| 57 |
<!-- |
|
| 58 |
In case of wrong namespace URI (or lack thereof), svg subtree will not |
|
| 59 |
be recognized as SVG at all |
|
| 60 |
--> |
|
| 61 |
<svg> |
|
| 62 |
<!-- Will neither run nor be drawn by the browser --> |
|
| 63 |
<circle id="mango_circle" cx="5" cy="5" r="4" |
|
| 64 |
onclick="window.__run = [...(window.__run || []), 'mango'];" /> |
|
| 65 |
</svg> |
|
| 66 |
<svg viewBox="0 0 10" xmlns="http://www.w3.org/2000/sv"> |
|
| 67 |
<!-- Will neither run nor be drawn by the browser --> |
|
| 68 |
<circle id="annoying_circle" cx="5" cy="5" r="4" |
|
| 69 |
onclick="window.__run = [...(window.__run || []), 'orange'];" /> |
|
| 70 |
</svg> |
|
| 71 |
</fruits> |
|
| test/haketilo_test/unit/test_policy_enforcing.py | ||
|---|---|---|
| 73 | 73 |
@pytest.mark.parametrize('csp_off_setting', [{}, {'csp_off': True}])
|
| 74 | 74 |
def test_policy_enforcing_html(driver, execute_in_page, csp_off_setting): |
| 75 | 75 |
""" |
| 76 |
A test case of sanitizing <script>s and intrinsic javascript in pages.
|
|
| 76 |
A test case of sanitizing <script>s and intrinsic JavaScript in HTML pages.
|
|
| 77 | 77 |
""" |
| 78 |
def assert_properly_blocked():
|
|
| 78 |
def click_all():
|
|
| 79 | 79 |
for i in range(1, 3): |
| 80 | 80 |
driver.find_element_by_id(f'clickme{i}').click()
|
| 81 | 81 |
|
| 82 |
def assert_properly_blocked(): |
|
| 83 |
click_all() |
|
| 84 |
|
|
| 82 | 85 |
assert set(driver.execute_script('return window.__run || [];')) == set()
|
| 83 | 86 |
assert bool(csp_off_setting) == are_scripts_allowed(driver) |
| 84 | 87 |
|
| ... | ... | |
| 98 | 101 |
**csp_off_setting |
| 99 | 102 |
}) |
| 100 | 103 |
|
| 101 |
for i in range(1, 3): |
|
| 102 |
driver.find_element_by_id(f'clickme{i}').click()
|
|
| 104 |
click_all() |
|
| 103 | 105 |
|
| 104 | 106 |
assert set(driver.execute_script('return window.__run || [];')) == \
|
| 105 | 107 |
{'inline', 'on', 'href', 'src', 'data'}
|
| ... | ... | |
| 121 | 123 |
|
| 122 | 124 |
assert_properly_blocked() |
| 123 | 125 |
assert are_scripts_allowed(driver, nonce) |
| 126 |
|
|
| 127 |
# Test function analogous to that for HTML page. |
|
| 128 |
@pytest.mark.ext_data({'content_script': content_script})
|
|
| 129 |
@pytest.mark.usefixtures('webextension')
|
|
| 130 |
@pytest.mark.parametrize('csp_off_setting', [{}, {'csp_off': True}])
|
|
| 131 |
def test_policy_enforcing_xml(driver, execute_in_page, csp_off_setting): |
|
| 132 |
""" |
|
| 133 |
A test case of sanitizing <script>s and intrinsic JavaScript in XML |
|
| 134 |
documents. |
|
| 135 |
""" |
|
| 136 |
def click_all(): |
|
| 137 |
for name in ('idaret', 'nowamak', 'mango', 'annoying'):
|
|
| 138 |
elem = driver.find_element_by_id(f'{name}_circle')
|
|
| 139 |
try: |
|
| 140 |
elem.click() |
|
| 141 |
except: |
|
| 142 |
pass |
|
| 143 |
|
|
| 144 |
def assert_properly_blocked(): |
|
| 145 |
click_all() |
|
| 146 |
|
|
| 147 |
try: |
|
| 148 |
assert set(driver.execute_script('return window.__run || [];')) == set()
|
|
| 149 |
except: |
|
| 150 |
from time import sleep |
|
| 151 |
sleep(100000) |
|
| 152 |
assert bool(csp_off_setting) == are_scripts_allowed(driver) |
|
| 153 |
|
|
| 154 |
# First, see if scripts run when not blocked. |
|
| 155 |
get(driver, 'https://gotmyowndoma.in/scripts_to_block_2.xml', {
|
|
| 156 |
'policy': allow_policy, |
|
| 157 |
**csp_off_setting |
|
| 158 |
}) |
|
| 159 |
|
|
| 160 |
click_all() |
|
| 161 |
|
|
| 162 |
assert set(driver.execute_script('return window.__run || [];')) == \
|
|
| 163 |
{'grape', 'raspberry', 'idaret', 'melon'}
|
|
| 164 |
assert are_scripts_allowed(driver) |
|
| 165 |
|
|
| 166 |
# Now, verify scripts don't run when blocked. |
|
| 167 |
get(driver, 'https://gotmyowndoma.in/scripts_to_block_2.xml', {
|
|
| 168 |
'policy': block_policy, |
|
| 169 |
**csp_off_setting |
|
| 170 |
}) |
|
| 171 |
|
|
| 172 |
assert_properly_blocked() |
|
| 173 |
|
|
| 174 |
# Now, verify only scripts with nonce can run when payload is injected. |
|
| 175 |
get(driver, 'https://gotmyowndoma.in/scripts_to_block_2.xml', {
|
|
| 176 |
'policy': payload_policy, |
|
| 177 |
**csp_off_setting |
|
| 178 |
}) |
|
| 179 |
|
|
| 180 |
assert_properly_blocked() |
|
| 181 |
assert are_scripts_allowed(driver, nonce) |
|
| test/haketilo_test/unit/utils.py | ||
|---|---|---|
| 228 | 228 |
return driver.execute_script( |
| 229 | 229 |
''' |
| 230 | 230 |
document.haketilo_scripts_allowed = false; |
| 231 |
const script = document.createElement("script");
|
|
| 231 |
const html_ns = "http://www.w3.org/1999/xhtml"; |
|
| 232 |
const script = document.createElementNS(html_ns, "script"); |
|
| 232 | 233 |
script.innerHTML = "document.haketilo_scripts_allowed = true;"; |
| 233 | 234 |
if (arguments[0]) |
| 234 | 235 |
script.setAttribute("nonce", arguments[0]);
|
| 235 |
document.head.append(script);
|
|
| 236 |
(document.head || document.documentElement).append(script);
|
|
| 236 | 237 |
return document.haketilo_scripts_allowed; |
| 237 | 238 |
''', |
| 238 | 239 |
nonce) |
| test/haketilo_test/world_wide_library.py | ||
|---|---|---|
| 234 | 234 |
|
| 235 | 235 |
'https://gotmyowndoma.in/scripts_to_block_1.html': |
| 236 | 236 |
(200, {}, here / 'data' / 'pages' / 'scripts_to_block_1.html'),
|
| 237 |
'https://gotmyowndoma.in/scripts_to_block_2.xml': |
|
| 238 |
(200, {}, here / 'data' / 'pages' / 'scripts_to_block_2.xml'),
|
|
| 237 | 239 |
|
| 238 | 240 |
'https://anotherdoma.in/resource/blocked/by/CORS.json': |
| 239 | 241 |
lambda command, get_params, post_params: (200, {}, some_data),
|
Also available in: Unified diff
improve script blocking in non-HTML documents (XML)