mirror of
https://github.com/gorhill/uBlock.git
synced 2024-11-17 16:02:33 +01:00
02b4d149e3
Related issue: - https://github.com/uBlockOrigin/uBlock-issues/issues/1341
1128 lines
37 KiB
JavaScript
1128 lines
37 KiB
JavaScript
/*******************************************************************************
|
|
|
|
uBlock Origin - a browser extension to block requests.
|
|
Copyright (C) 2014-present Raymond Hill
|
|
|
|
This program is free software: you can redistribute it and/or modify
|
|
it under the terms of the GNU General Public License as published by
|
|
the Free Software Foundation, either version 3 of the License, or
|
|
(at your option) any later version.
|
|
|
|
This program is distributed in the hope that it will be useful,
|
|
but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
GNU General Public License for more details.
|
|
|
|
You should have received a copy of the GNU General Public License
|
|
along with this program. If not, see {http://www.gnu.org/licenses/}.
|
|
|
|
Home: https://github.com/gorhill/uBlock
|
|
*/
|
|
|
|
'use strict';
|
|
|
|
/******************************************************************************/
|
|
|
|
// Start isolation from global scope
|
|
|
|
µBlock.webRequest = (( ) => {
|
|
|
|
/******************************************************************************/
|
|
|
|
// Platform-specific behavior.

// https://github.com/uBlockOrigin/uBlock-issues/issues/42
// https://bugzilla.mozilla.org/show_bug.cgi?id=1376932
//   Add proper version number detection once issue is fixed in Firefox.
//
// When true, documents whose body or response headers were modified get
// their `Cache-Control` header overridden (see onHeadersReceived).
let dontCacheResponseHeaders = false;

// https://github.com/gorhill/uMatrix/issues/967#issuecomment-373002011
//   This can be removed once Firefox 60 ESR is released.
//
// When true, an existing CSP header is merged by hand with the injected
// one rather than adding a separate header (see injectCSP).
let cantMergeCSPHeaders = false;

// Derive both flags from the current value of `vAPI.webextFlavor`. Used for
// the initial computation and again when the flavor is reported as changed,
// so that both code paths cannot drift apart.
const updatePlatformFlags = function() {
    const isFirefox = vAPI.webextFlavor.soup.has('firefox');
    dontCacheResponseHeaders = isFirefox;
    cantMergeCSPHeaders = isFirefox && vAPI.webextFlavor.major < 59;
};

updatePlatformFlags();

// The real actual webextFlavor value may not be set in stone, so listen
// for possible future changes. The listener is registered with `once`, so
// only the first `webextFlavor` event is acted upon.
window.addEventListener('webextFlavor', updatePlatformFlags, { once: true });
|
|
|
|
/******************************************************************************/
|
|
|
|
// Intercept and filter web requests.
//
// `details` is the webRequest details object handed to the listener. The
// return value is one of:
//   - { redirectUrl }   the filtering context carries a redirect URL
//   - { cancel: true }  the page store returned 1 (blocked)
//   - { cancel: false } the page store returned 2
//   - undefined         otherwise
// Root document requests and behind-the-scene requests are delegated to
// their dedicated handlers.

const onBeforeRequest = function(details) {
    const fctxt = µBlock.filteringContext.fromWebrequestDetails(details);

    // Special handling for root document.
    // https://github.com/chrisaljoudi/uBlock/issues/1001
    // This must be executed regardless of whether the request is
    // behind-the-scene
    if ( fctxt.itype === fctxt.MAIN_FRAME ) {
        return onBeforeRootFrameRequest(fctxt);
    }

    // Special treatment: behind-the-scene requests
    const tabId = details.tabId;
    if ( tabId < 0 ) {
        return onBeforeBehindTheSceneRequest(fctxt);
    }

    // Lookup the page store associated with this tab id.
    const µb = µBlock;
    let pageStore = µb.pageStoreFromTabId(tabId);
    if ( pageStore === null ) {
        const tabContext = µb.tabContextManager.mustLookup(tabId);
        if ( tabContext.tabId < 0 ) {
            return onBeforeBehindTheSceneRequest(fctxt);
        }
        // No page store yet for this tab: signal a navigation event using
        // the URL known to the tab context, then look the page store up
        // again.
        // NOTE(review): the second lookup is assumed to succeed -- confirm
        // that onNavigation() always results in a page store for the tab.
        vAPI.tabs.onNavigation({ tabId, frameId: 0, url: tabContext.rawURL });
        pageStore = µb.pageStoreFromTabId(tabId);
    }

    const result = pageStore.filterRequest(fctxt);

    pageStore.journalAddRequest(fctxt.getHostname(), result);

    if ( µb.logger.enabled ) {
        fctxt.setRealm('network').toLogger();
    }

    // Redirected

    if ( fctxt.redirectURL !== undefined ) {
        return { redirectUrl: fctxt.redirectURL };
    }

    // Not redirected

    // Blocked
    if ( result === 1 ) {
        return { cancel: true };
    }

    // Not blocked: remember the URL of non-root sub-frames, unless the
    // request details carry an alias URL.
    if (
        fctxt.itype === fctxt.SUB_FRAME &&
        details.parentFrameId !== -1 &&
        details.aliasURL === undefined
    ) {
        pageStore.setFrameURL(details.frameId, details.url);
    }

    if ( result === 2 ) {
        return { cancel: false };
    }
};
|
|
|
|
/******************************************************************************/
|
|
|
|
// Handle a request for a root document (strict blocking).
//
// `fctxt` is the filtering context of the request. In order, the request is
// exempted from strict blocking when: net filtering is off for the URL,
// the `no-strict-blocking` switch evaluates truthy for the hostname, or the
// hostname is temporarily bypassed. Otherwise the static network filtering
// engine is consulted, first with the request's own type, then with the
// type `no_type`.
//
// Returns:
//   - { redirectUrl }  the filtering context carries a redirect URL
//   - { cancel: true } the document is blocked; the tab is then pointed at
//                      the `document-blocked.html` page
//   - undefined        otherwise
const onBeforeRootFrameRequest = function(fctxt) {
    const µb = µBlock;
    const requestURL = fctxt.url;
    const requestHostname = fctxt.getHostname();
    const loggerEnabled = µb.logger.enabled;
    let result = 0;
    let logData;

    // If the site is whitelisted, disregard strict blocking
    const trusted = µb.getNetFilteringSwitch(requestURL) === false;
    if ( trusted ) {
        result = 2;
        if ( loggerEnabled ) {
            logData = { engine: 'u', result: 2, raw: 'whitelisted' };
        }
    }

    // Permanently unrestricted?
    if (
        result === 0 &&
        µb.sessionSwitches.evaluateZ('no-strict-blocking', requestHostname)
    ) {
        result = 2;
        if ( loggerEnabled ) {
            logData = {
                engine: 'u',
                result: 2,
                raw: `no-strict-blocking: ${µb.sessionSwitches.z} true`
            };
        }
    }

    // Temporarily whitelisted?
    if ( result === 0 && strictBlockBypasser.isBypassed(requestHostname) ) {
        result = 2;
        if ( loggerEnabled ) {
            logData = {
                engine: 'u',
                result: 2,
                raw: 'no-strict-blocking: true (temporary)'
            };
        }
    }

    // Static filtering: We always need the long-form result here.
    const snfe = µb.staticNetFilteringEngine;

    // Check for specific block
    if ( result === 0 ) {
        result = snfe.matchString(fctxt, 0b0001);
        if ( result !== 0 || loggerEnabled ) {
            logData = snfe.toLogData();
        }
    }

    // Check for generic block
    if ( result === 0 ) {
        // The type is overridden only for the duration of this lookup and
        // restored to `main_frame` at the end of the branch.
        fctxt.type = 'no_type';
        result = snfe.matchString(fctxt, 0b0001);
        if ( result !== 0 || loggerEnabled ) {
            logData = snfe.toLogData();
        }
        // https://github.com/chrisaljoudi/uBlock/issues/1128
        //   Do not block if the match begins after the hostname, except when
        //   the filter is specifically of type `other`.
        // https://github.com/gorhill/uBlock/issues/490
        //   Removing this for the time being, will need a new, dedicated type.
        if (
            result === 1 &&
            toBlockDocResult(requestURL, requestHostname, logData) === false
        ) {
            result = 0;
            logData = undefined;
        }
        fctxt.type = 'main_frame';
    }

    const pageStore = µb.bindTabToPageStats(fctxt.tabId, 'beforeRequest');
    if ( pageStore !== null ) {
        pageStore.journalAddRootFrame('uncommitted', requestURL);
        pageStore.journalAddRequest(requestHostname, result);
    }

    if ( loggerEnabled ) {
        fctxt.setFilter(logData);
    }

    // https://github.com/uBlockOrigin/uBlock-issues/issues/760
    //   Redirect non-blocked request?
    if (
        result !== 1 &&
        trusted === false &&
        pageStore !== null &&
        snfe.hasQuery(fctxt)
    ) {
        pageStore.redirectNonBlockedRequest(fctxt);
    }

    if ( loggerEnabled ) {
        fctxt.setRealm('network').toLogger();
    }

    // Redirected

    if ( fctxt.redirectURL !== undefined ) {
        return { redirectUrl: fctxt.redirectURL };
    }

    // Not blocked

    if ( result !== 1 ) { return; }

    // No log data means no strict blocking (because we need to report why
    // the blocking occurs).
    if ( logData === undefined ) { return; }

    // Blocked: the details shown by the document-blocked page are passed as
    // a URI-encoded JSON string.

    const query = encodeURIComponent(JSON.stringify({
        url: requestURL,
        hn: requestHostname,
        dn: fctxt.getDomain() || requestHostname,
        fs: logData.raw
    }));

    vAPI.tabs.replace(
        fctxt.tabId,
        vAPI.getURL('document-blocked.html?details=') + query
    );

    return { cancel: true };
};
|
|
|
|
/******************************************************************************/
|
|
|
|
// https://github.com/gorhill/uBlock/issues/3208
//   Mind case insensitivity.
// https://github.com/uBlockOrigin/uBlock-issues/issues/1147
//   Do not strict-block if the filter pattern does not contain at least one
//   token character.
//
// Decide whether a matched filter qualifies for blocking a whole document.
//   url      - URL of the root document request
//   hostname - hostname of that URL
//   logData  - log data of the matching filter; `regex` (string) is
//              required, `raw` (string) is optional
// Returns true only when the part of the URL matched by the filter ends at
// (or right after) the end of the hostname.
const toBlockDocResult = function(url, hostname, logData) {
    if ( typeof logData.regex !== 'string' ) { return false; }
    if ( typeof logData.raw === 'string' && /\w/.test(logData.raw) === false ) {
        return false;
    }
    const re = new RegExp(logData.regex, 'i');
    const match = re.exec(url.toLowerCase());
    if ( match === null ) { return false; }

    // https://github.com/chrisaljoudi/uBlock/issues/1128
    // https://github.com/chrisaljoudi/uBlock/issues/1212
    //   Verify that the end of the match is anchored to the end of the
    //   hostname.
    // https://github.com/uBlockOrigin/uAssets/issues/7619#issuecomment-653010310
    //   Also match FQDN.
    const hnpos = url.indexOf(hostname);
    const hnlen = hostname.length;
    // Distance between the end of the match and the end of the hostname.
    const end = match.index + match[0].length - hnpos - hnlen;
    // 0: match ends exactly at the end of the hostname.
    // 1: match ends one character past the hostname.
    // 2: accepted only when the hostname is immediately followed by a dot
    //    (FQDN form).
    return end === 0 || end === 1 ||
           (end === 2 && url.charCodeAt(hnpos + hnlen) === 0x2E /* '.' */);
};
|
|
|
|
/******************************************************************************/
|
|
|
|
// Intercept and filter behind-the-scene requests.

// https://github.com/gorhill/uBlock/issues/870
//   Finally, Chromium 49+ gained the ability to report network request of
//   type `beacon`, so now we can block them according to the state of the
//   "Disable hyperlink auditing/beacon" setting.
//
// Returns { redirectUrl }, { cancel: true } or undefined. Nothing is done
// when no page store is associated with the request's tab id.

const onBeforeBehindTheSceneRequest = function(fctxt) {
    const µb = µBlock;
    const pageStore = µb.pageStoreFromTabId(fctxt.tabId);
    if ( pageStore === null ) { return; }

    // https://bugs.chromium.org/p/chromium/issues/detail?id=637577#c15
    //   Do not filter behind-the-scene network request of type `beacon`:
    //   there is no point. In any case, this will become a non-issue once
    //   <https://bugs.chromium.org/p/chromium/issues/detail?id=522129> is
    //   fixed.

    // Blocking behind-the-scene requests can break a lot of stuff: prevent
    // browser updates, prevent extension updates, prevent extensions from
    // working properly, etc.
    // So we filter if and only if the "advanced user" mode is selected.
    // https://github.com/gorhill/uBlock/issues/3150
    //   Ability to globally block CSP reports MUST also apply to
    //   behind-the-scene network requests.

    // 2018-03-30:
    //   Filter all behind-the-scene network requests like any other network
    //   requests. Hopefully this will not break stuff as it used to be the
    //   case.

    let result = 0;

    // https://github.com/uBlockOrigin/uBlock-issues/issues/339
    //   Need to also test against `-scheme` since tabOrigin is normalized.
    //   Not especially elegant but for now this accomplishes the purpose of
    //   not dealing with network requests fired from a synthetic scope,
    //   that is unless advanced user mode is enabled.

    if (
        (
            fctxt.tabOrigin.endsWith('-scheme') === false &&
            µb.URI.isNetworkURI(fctxt.tabOrigin)
        ) ||
        µb.userSettings.advancedUserEnabled ||
        fctxt.itype === fctxt.CSP_REPORT
    ) {
        result = pageStore.filterRequest(fctxt);

        // The "any-tab" scope is not whitelist-able, and in such case we must
        // use the origin URL as the scope. Most such requests aren't going to
        // be blocked, so we further test for whitelisting and modify the
        // result only when the request is being blocked.
        if (
            result === 1 &&
            µb.getNetFilteringSwitch(fctxt.tabOrigin) === false
        ) {
            result = 2;
            fctxt.filter = { engine: 'u', result: 2, raw: 'whitelisted' };
        }
    }

    if ( µb.logger.enabled ) {
        fctxt.setRealm('network').toLogger();
    }

    // Redirected

    if ( fctxt.redirectURL !== undefined ) {
        return { redirectUrl: fctxt.redirectURL };
    }

    // Blocked?

    if ( result === 1 ) {
        return { cancel: true };
    }
};
|
|
|
|
/******************************************************************************/
|
|
|
|
// https://github.com/gorhill/uBlock/issues/3140
//
// Cancel CSP reports which may have been caused by uBO itself. A report is
// let through (undefined is returned) when the request is behind-the-scene,
// when there is no page store for the tab, when net filtering is off for
// the page, when the page had no internal redirection, or when the report
// could be parsed and none of its blocked URI / source file starts with
// `data`. In all other cases { cancel: true } is returned.

const onBeforeMaybeSpuriousCSPReport = (function() {
    // Created on first use, and only if the platform provides TextDecoder.
    let textDecoder;

    return function(details) {
        const fctxt = µBlock.filteringContext.fromWebrequestDetails(details);

        // Ignore behind-the-scene requests.
        if ( fctxt.tabId < 0 ) { return; }

        // Lookup the page store associated with this tab id.
        const pageStore = µBlock.pageStoreFromTabId(fctxt.tabId);
        if ( pageStore === null ) { return; }

        // If uBO is disabled for the page, it can't possibly cause CSP
        // reports to be triggered.
        if ( pageStore.getNetFilteringSwitch() === false ) { return; }

        // A resource was redirected to a neutered one?
        // TODO: mind injected scripts/styles as well.
        if ( pageStore.internalRedirectionCount === 0 ) { return; }

        if (
            textDecoder === undefined &&
            typeof self.TextDecoder === 'function'
        ) {
            textDecoder = new TextDecoder();
        }

        // Find out whether the CSP report is a potentially spurious CSP
        // report. If from this point on we are unable to parse the CSP
        // report data, the safest assumption to protect users is to assume
        // the CSP report is spurious.
        if (
            textDecoder !== undefined &&
            details.method === 'POST'
        ) {
            const raw = details.requestBody && details.requestBody.raw;
            if (
                Array.isArray(raw) &&
                raw.length !== 0 &&
                raw[0] instanceof Object &&
                raw[0].bytes instanceof ArrayBuffer
            ) {
                let data;
                try {
                    data = JSON.parse(textDecoder.decode(raw[0].bytes));
                } catch (ex) {
                    // Deliberately ignored: `data` stays undefined and the
                    // report is then treated as spurious below.
                }
                if ( data instanceof Object ) {
                    const report = data['csp-report'];
                    if ( report instanceof Object ) {
                        const blocked =
                            report['blocked-uri'] || report['blockedURI'];
                        const validBlocked = typeof blocked === 'string';
                        const source =
                            report['source-file'] || report['sourceFile'];
                        const validSource = typeof source === 'string';
                        // Legitimate report: at least one of the two
                        // fields is a string, and no string field starts
                        // with `data`.
                        if (
                            (validBlocked || validSource) &&
                            (!validBlocked || !blocked.startsWith('data')) &&
                            (!validSource || !source.startsWith('data'))
                        ) {
                            return;
                        }
                    }
                }
            }
        }

        // At this point, we have a potentially spurious CSP report.

        if ( µBlock.logger.enabled ) {
            fctxt.setRealm('network')
                 .setType('csp_report')
                 .setFilter({ result: 1, source: 'global', raw: 'no-spurious-csp-report' })
                 .toLogger();
        }

        return { cancel: true };
    };
})();
|
|
|
|
/******************************************************************************/
|
|
|
|
// To handle:
// - Media elements larger than n kB
// - Scriptlet injection (requires ability to modify response body)
// - HTML filtering (requires ability to modify response body)
// - CSP injection
//
// Returns { cancel: true } when a large media element is foiled,
// { responseHeaders } when the response headers were modified, and
// undefined otherwise.

const onHeadersReceived = function(details) {
    // https://github.com/uBlockOrigin/uBlock-issues/issues/610
    //   Process behind-the-scene requests in a special way.
    if (
        details.tabId < 0 &&
        normalizeBehindTheSceneResponseHeaders(details) === false
    ) {
        return;
    }

    const µb = µBlock;
    const fctxt = µb.filteringContext.fromWebrequestDetails(details);
    const isRootDoc = fctxt.itype === fctxt.MAIN_FRAME;

    let pageStore = µb.pageStoreFromTabId(fctxt.tabId);
    if ( pageStore === null ) {
        if ( isRootDoc === false ) { return; }
        pageStore = µb.bindTabToPageStats(fctxt.tabId, 'beforeRequest');
        // bindTabToPageStats() may itself yield no page store (its result
        // is null-checked in onBeforeRootFrameRequest): nothing can be
        // done for this response in such case.
        if ( pageStore === null ) { return; }
    }
    if ( pageStore.getNetFilteringSwitch(fctxt) === false ) { return; }

    if ( fctxt.itype === fctxt.IMAGE || fctxt.itype === fctxt.MEDIA ) {
        return foilLargeMediaElement(details, fctxt, pageStore);
    }

    if ( isRootDoc === false && fctxt.itype !== fctxt.SUB_FRAME ) { return; }

    // Keep in mind response headers will be modified in-place if needed, so
    // `details.responseHeaders` will always point to the modified response
    // headers.
    const responseHeaders = details.responseHeaders;

    // https://github.com/gorhill/uBlock/issues/2813
    //   Disable the blocking of large media elements if the document is
    //   itself a media element: the resource was not prevented from loading
    //   so no point to further block large media elements for the current
    //   document.
    if ( isRootDoc ) {
        const contentType = headerValueFromName('content-type', responseHeaders);
        if ( reMediaContentTypes.test(contentType) ) {
            pageStore.allowLargeMediaElementsUntil = 0;
            return;
        }
    }

    // At this point we have a HTML document.

    const filteredHTML = µb.canFilterResponseData &&
                         filterDocument(pageStore, fctxt, details) === true;

    let modifiedHeaders = injectCSP(fctxt, pageStore, responseHeaders) === true;

    // https://bugzilla.mozilla.org/show_bug.cgi?id=1376932
    //   Prevent document from being cached by the browser if we modified it,
    //   either through HTML filtering and/or modified response headers.
    // https://github.com/uBlockOrigin/uBlock-issues/issues/229
    //   Use `no-cache` instead of `no-cache, no-store, must-revalidate`, this
    //   allows Firefox's offline mode to work as expected.
    if ( (filteredHTML || modifiedHeaders) && dontCacheResponseHeaders ) {
        const cacheControl = µb.hiddenSettings.cacheControlForFirefox1376932;
        if ( cacheControl !== 'unset' ) {
            const i = headerIndexFromName('cache-control', responseHeaders);
            if ( i !== -1 ) {
                responseHeaders[i].value = cacheControl;
            } else {
                responseHeaders.push({ name: 'Cache-Control', value: cacheControl });
            }
            modifiedHeaders = true;
        }
    }

    if ( modifiedHeaders ) {
        return { responseHeaders: responseHeaders };
    }
};

// Matches the start of a `Content-Type` value denoting audio, image or
// video content.
const reMediaContentTypes = /^(?:audio|image|video)\//;
|
|
|
|
/******************************************************************************/
|
|
|
|
// https://github.com/uBlockOrigin/uBlock-issues/issues/610
//
// Reclassify a behind-the-scene `xmlhttprequest` response according to its
// `Content-Type` header. When the header denotes audio, image or video
// content, `details.type` is changed in place to `image` or `media` and
// true is returned. In all other cases `details` is left untouched and
// false is returned.

const normalizeBehindTheSceneResponseHeaders = function(details) {
    if ( details.type !== 'xmlhttprequest' ) { return false; }
    const headers = details.responseHeaders;
    if ( Array.isArray(headers) === false ) { return false; }
    const contentType = headerValueFromName('content-type', headers);
    if ( contentType === '' ) { return false; }
    if ( reMediaContentTypes.test(contentType) === false ) { return false; }
    if ( contentType.startsWith('image') ) {
        details.type = 'image';
    } else {
        // Audio or video.
        details.type = 'media';
    }
    return true;
};
|
|
|
|
/*******************************************************************************
|
|
|
|
The response body filterer is responsible for:
|
|
|
|
- HTML filtering
|
|
|
|
In the spirit of efficiency, the response body filterer works this way:
|
|
|
|
If:
|
|
- HTML filtering: no.
|
|
Then:
|
|
No response body filtering is initiated.
|
|
|
|
If:
|
|
- HTML filtering: yes.
|
|
Then:
|
|
Assemble all response body data into a single buffer. Once all the
|
|
response data has been received, create a document from it. Then:
|
|
- Remove all DOM elements matching HTML filters.
|
|
Then serialize the resulting modified document as the new response
|
|
body.
|
|
|
|
**/
|
|
|
|
// Set up HTML filtering of a document response body.
//
// filterDocument(pageStore, fctxt, extras):
//   fctxt  - filtering context of the document request
//   extras - webRequest details; `statusCode`, `responseHeaders` and
//            `requestId` are read
// Returns true when a response body filter was attached to the request,
// undefined when the response is not to be filtered.
const filterDocument = (function() {
    const µb = µBlock;
    // Maps a stream filter object to the request descriptor it serves.
    const filterers = new Map();
    // All instantiated lazily, on first need.
    let domParser, xmlSerializer,
        utf8TextDecoder, textDecoder, textEncoder;

    // Decode `buffer` using `encoding`. The decoder instance is reused for
    // as long as the requested encoding does not change.
    const textDecode = function(encoding, buffer) {
        if (
            textDecoder !== undefined &&
            textDecoder.encoding !== encoding
        ) {
            textDecoder = undefined;
        }
        if ( textDecoder === undefined ) {
            textDecoder = new TextDecoder(encoding);
        }
        return textDecoder.decode(buffer);
    };

    const reContentTypeDocument = /^(?:text\/html|application\/xhtml\+xml)/i;
    const reContentTypeCharset = /charset=['"]?([^'" ]+)/i;

    // Returns the lower-cased document mime type found at the start of
    // `contentType`, or undefined if it is not HTML/XHTML.
    const mimeFromContentType = function(contentType) {
        const match = reContentTypeDocument.exec(contentType);
        if ( match !== null ) {
            return match[0].toLowerCase();
        }
    };

    // Returns the lower-cased charset found in `contentType`, or undefined.
    const charsetFromContentType = function(contentType) {
        const match = reContentTypeCharset.exec(contentType);
        if ( match !== null ) {
            return match[1].toLowerCase();
        }
    };

    // Returns the charset declared through a `meta` element of `doc`, or
    // undefined if none is found.
    const charsetFromDoc = function(doc) {
        let meta = doc.querySelector('meta[charset]');
        if ( meta !== null ) {
            return meta.getAttribute('charset').toLowerCase();
        }
        meta = doc.querySelector(
            'meta[http-equiv="content-type" i][content]'
        );
        if ( meta !== null ) {
            return charsetFromContentType(meta.getAttribute('content'));
        }
    };

    // Write `buffer` to the stream -- or, when not provided, the data
    // accumulated so far -- then close the stream.
    const streamClose = function(filterer, buffer) {
        if ( buffer !== undefined ) {
            filterer.stream.write(buffer);
        } else if ( filterer.buffer !== undefined ) {
            filterer.stream.write(filterer.buffer);
        }
        filterer.stream.close();
    };

    // Stream `ondata` handler (`this` is the stream): accumulate incoming
    // chunks into a single buffer.
    const onStreamData = function(ev) {
        const filterer = filterers.get(this);
        if ( filterer === undefined ) {
            // Unknown stream: pass the data through and step aside.
            this.write(ev.data);
            this.disconnect();
            return;
        }
        if (
            this.status !== 'transferringdata' &&
            this.status !== 'finishedtransferringdata'
        ) {
            filterers.delete(this);
            this.disconnect();
            return;
        }
        // TODO:
        // - Possibly improve buffer growth, if benchmarking shows it's worth
        //   it.
        // - Also evaluate whether keeping a list of buffers and then decoding
        //   them in sequence using TextDecoder's "stream" option is more
        //   efficient. Can the data buffers be safely kept around for later
        //   use?
        // - Informal, quick benchmarks seem to show most of the overhead is
        //   from calling TextDecoder.decode() and TextEncoder.encode(), and if
        //   confirmed, there is nothing which can be done uBO-side to reduce
        //   overhead.
        if ( filterer.buffer === null ) {
            filterer.buffer = new Uint8Array(ev.data);
            return;
        }
        const buffer = new Uint8Array(
            filterer.buffer.byteLength +
            ev.data.byteLength
        );
        buffer.set(filterer.buffer);
        buffer.set(new Uint8Array(ev.data), filterer.buffer.byteLength);
        filterer.buffer = buffer;
    };

    // Stream `onstop` handler (`this` is the stream): parse the accumulated
    // data, apply the HTML filters, and write back either the modified
    // document or the original data.
    const onStreamStop = function() {
        const filterer = filterers.get(this);
        filterers.delete(this);
        if ( filterer === undefined || filterer.buffer === null ) {
            this.close();
            return;
        }
        if ( this.status !== 'finishedtransferringdata' ) { return; }

        if ( domParser === undefined ) {
            domParser = new DOMParser();
            xmlSerializer = new XMLSerializer();
        }
        if ( textEncoder === undefined ) {
            textEncoder = new TextEncoder();
        }

        let doc;

        // If stream encoding is still unknown, try to extract from document.
        let charsetFound = filterer.charset,
            charsetUsed = charsetFound;
        if ( charsetFound === undefined ) {
            if ( utf8TextDecoder === undefined ) {
                utf8TextDecoder = new TextDecoder();
            }
            // Only the first 1024 bytes are inspected at this stage.
            doc = domParser.parseFromString(
                utf8TextDecoder.decode(filterer.buffer.slice(0, 1024)),
                filterer.mime
            );
            charsetFound = charsetFromDoc(doc);
            charsetUsed = µb.textEncode.normalizeCharset(charsetFound);
            if ( charsetUsed === undefined ) {
                return streamClose(filterer);
            }
        }

        doc = domParser.parseFromString(
            textDecode(charsetUsed, filterer.buffer),
            filterer.mime
        );

        // https://github.com/gorhill/uBlock/issues/3507
        //   In case of no explicit charset found, try to find one again, but
        //   this time with the whole document parsed.
        if ( charsetFound === undefined ) {
            charsetFound = µb.textEncode.normalizeCharset(charsetFromDoc(doc));
            if ( charsetFound !== charsetUsed ) {
                if ( charsetFound === undefined ) {
                    return streamClose(filterer);
                }
                charsetUsed = charsetFound;
                doc = domParser.parseFromString(
                    textDecode(charsetFound, filterer.buffer),
                    filterer.mime
                );
            }
        }

        let modified = false;
        if ( filterer.selectors !== undefined ) {
            if ( µb.htmlFilteringEngine.apply(doc, filterer) ) {
                modified = true;
            }
        }

        // Nothing was removed: send the original data unchanged.
        if ( modified === false ) {
            return streamClose(filterer);
        }

        // https://stackoverflow.com/questions/6088972/get-doctype-of-an-html-as-string-with-javascript/10162353#10162353
        const doctypeStr = doc.doctype instanceof Object ?
                xmlSerializer.serializeToString(doc.doctype) + '\n' :
                '';

        // https://github.com/gorhill/uBlock/issues/3391
        let encodedStream = textEncoder.encode(
            doctypeStr +
            doc.documentElement.outerHTML
        );
        if ( charsetUsed !== 'utf-8' ) {
            encodedStream = µb.textEncode.encode(
                charsetUsed,
                encodedStream
            );
        }

        streamClose(filterer, encodedStream);
    };

    // Stream `onerror` handler (`this` is the stream).
    const onStreamError = function() {
        filterers.delete(this);
    };

    return function(pageStore, fctxt, extras) {
        // https://github.com/gorhill/uBlock/issues/3478
        const statusCode = extras.statusCode || 0;
        if ( statusCode !== 0 && (statusCode < 200 || statusCode >= 300) ) {
            return;
        }

        const hostname = fctxt.getHostname();
        if ( hostname === '' ) { return; }

        const domain = fctxt.getDomain();

        const request = {
            stream: undefined,
            tabId: fctxt.tabId,
            url: fctxt.url,
            hostname: hostname,
            domain: domain,
            entity: µb.URI.entityFromDomain(domain),
            selectors: undefined,
            buffer: null,
            mime: 'text/html',
            charset: undefined
        };

        request.selectors = µb.htmlFilteringEngine.retrieve(request);
        if ( request.selectors === undefined ) { return; }

        const headers = extras.responseHeaders;
        const contentType = headerValueFromName('content-type', headers);
        if ( contentType !== '' ) {
            request.mime = mimeFromContentType(contentType);
            if ( request.mime === undefined ) { return; }
            let charset = charsetFromContentType(contentType);
            if ( charset !== undefined ) {
                charset = µb.textEncode.normalizeCharset(charset);
                if ( charset === undefined ) { return; }
                request.charset = charset;
            }
        }
        // https://bugzilla.mozilla.org/show_bug.cgi?id=1426789
        if ( headerValueFromName('content-disposition', headers) ) { return; }

        const stream = request.stream =
            browser.webRequest.filterResponseData(extras.requestId);
        stream.ondata = onStreamData;
        stream.onstop = onStreamStop;
        stream.onerror = onStreamError;
        filterers.set(stream, request);

        return true;
    };
})();
|
|
|
|
/******************************************************************************/
|
|
|
|
// Collect the CSP directives applicable to a document and, if any, append
// them to `responseHeaders` (modified in place) as a
// `Content-Security-Policy` header.
//
//   fctxt           - filtering context of the document request; its `type`
//                     is temporarily changed, then restored
//   pageStore       - page store used to evaluate the built-in policies
//   responseHeaders - array of { name, value } response headers
//
// Returns true when a CSP header was added, undefined otherwise.
const injectCSP = function(fctxt, pageStore, responseHeaders) {
    const µb = µBlock;
    const loggerEnabled = µb.logger.enabled;
    const cspSubsets = [];
    const requestType = fctxt.type;

    // Start collecting policies >>>>>>>>

    // ======== built-in policies

    const builtinDirectives = [];

    if ( pageStore.filterScripting(fctxt, true) === 1 ) {
        builtinDirectives.push(µb.cspNoScripting);
        if ( loggerEnabled ) {
            fctxt.setRealm('network').setType('scripting').toLogger();
        }
    } else {
        // https://github.com/uBlockOrigin/uBlock-issues/issues/422
        //   We need to derive a special context for filtering
        //   `inline-script`, as the embedding document for this "resource"
        //   will always be the frame itself, not that of the parent of the
        //   frame.
        const fctxt2 = fctxt.duplicate();
        fctxt2.type = 'inline-script';
        fctxt2.setDocOriginFromURL(fctxt.url);
        const result = pageStore.filterRequest(fctxt2);
        if ( result === 1 ) {
            builtinDirectives.push(µb.cspNoInlineScript);
        }
        if ( result === 2 && loggerEnabled ) {
            fctxt2.setRealm('network').toLogger();
        }
    }

    // https://github.com/gorhill/uBlock/issues/1539
    // - Use a CSP to also forbid inline fonts if remote fonts are blocked.
    fctxt.type = 'inline-font';
    if ( pageStore.filterRequest(fctxt) === 1 ) {
        builtinDirectives.push(µb.cspNoInlineFont);
        if ( loggerEnabled ) {
            fctxt.setRealm('network').toLogger();
        }
    }

    if ( builtinDirectives.length !== 0 ) {
        cspSubsets[0] = builtinDirectives.join(', ');
    }

    // ======== filter-based policies

    // Static filtering.

    // Restore the original request type before consulting static filters.
    fctxt.type = requestType;
    const staticDirectives =
        µb.staticNetFilteringEngine.matchAndFetchModifiers(fctxt, 'csp');
    if ( staticDirectives !== undefined ) {
        for ( const directive of staticDirectives ) {
            if ( directive.result !== 1 ) { continue; }
            cspSubsets.push(directive.modifier.value);
        }
    }

    // URL filtering `allow` rules override static filtering.
    if (
        cspSubsets.length !== 0 &&
        µb.sessionURLFiltering.evaluateZ(
            fctxt.getTabHostname(),
            fctxt.url,
            'csp'
        ) === 2
    ) {
        if ( loggerEnabled ) {
            fctxt.setRealm('network')
                 .setType('csp')
                 .setFilter(µb.sessionURLFiltering.toLogData())
                 .toLogger();
        }
        return;
    }

    // Dynamic filtering `allow` rules override static filtering.
    if (
        cspSubsets.length !== 0 &&
        µb.userSettings.advancedUserEnabled &&
        µb.sessionFirewall.evaluateCellZY(
            fctxt.getTabHostname(),
            fctxt.getTabHostname(),
            '*'
        ) === 2
    ) {
        if ( loggerEnabled ) {
            fctxt.setRealm('network')
                 .setType('csp')
                 .setFilter(µb.sessionFirewall.toLogData())
                 .toLogger();
        }
        return;
    }

    // <<<<<<<< All policies have been collected

    // Static CSP policies will be applied.

    if ( loggerEnabled && staticDirectives !== undefined ) {
        fctxt.setRealm('network')
             .pushFilters(staticDirectives.map(a => a.logData()))
             .toLogger();
    }

    if ( cspSubsets.length === 0 ) { return; }

    µb.updateToolbarIcon(fctxt.tabId, 0x02);

    // Use comma to merge CSP directives.
    // Ref.: https://www.w3.org/TR/CSP2/#implementation-considerations
    //
    // https://github.com/gorhill/uMatrix/issues/967
    //   Inject a new CSP header rather than modify an existing one, except
    //   if the current environment does not support merging headers:
    //   Firefox 58/webext and less can't merge CSP headers, so we will merge
    //   them here.

    if ( cantMergeCSPHeaders ) {
        const i = headerIndexFromName(
            'content-security-policy',
            responseHeaders
        );
        if ( i !== -1 ) {
            // The existing policy goes first, and its header is removed
            // since it is re-emitted as part of the merged header below.
            cspSubsets.unshift(responseHeaders[i].value.trim());
            responseHeaders.splice(i, 1);
        }
    }

    responseHeaders.push({
        name: 'Content-Security-Policy',
        value: cspSubsets.join(', ')
    });

    return true;
};
|
|
|
|
/******************************************************************************/
|
|
|
|
// https://github.com/gorhill/uBlock/issues/1163
//   "Block elements by size".
// https://github.com/gorhill/uBlock/issues/1390#issuecomment-187310719
//   Do not foil when the media element is fetched from the browser
//   cache. This works only when the webext API supports the `fromCache`
//   property (Firefox).
//
// Returns { cancel: true } when the page store decides the media element
// is to be blocked, undefined otherwise.

const foilLargeMediaElement = function(details, fctxt, pageStore) {
    if ( details.fromCache === true ) { return; }

    // The size is looked up only when a non-zero size threshold is
    // configured; a response without `Content-Length` is then let through.
    let size = 0;
    if ( µBlock.userSettings.largeMediaSize !== 0 ) {
        const headers = details.responseHeaders;
        const i = headerIndexFromName('content-length', headers);
        if ( i === -1 ) { return; }
        // An unparsable value is treated as a size of zero.
        size = parseInt(headers[i].value, 10) || 0;
    }

    const result = pageStore.filterLargeMediaElement(fctxt, size);
    if ( result === 0 ) { return; }

    if ( µBlock.logger.enabled ) {
        fctxt.setRealm('network').toLogger();
    }

    return { cancel: true };
};
|
|
|
|
/******************************************************************************/
|
|
|
|
// Returns the index of the header named `headerName` in `headers` (an
// array of { name, value } objects), or -1 if there is no such header.
// Header names are compared case-insensitively. The array is scanned from
// the end, hence the last matching entry wins when a name occurs more than
// once.
//
// Caller must ensure headerName is normalized to lower case.

const headerIndexFromName = function(headerName, headers) {
    let i = headers.length;
    while ( i-- ) {
        if ( headers[i].name.toLowerCase() === headerName ) {
            return i;
        }
    }
    return -1;
};
|
|
|
|
// Returns the value of the header named `headerName` in `headers`, or the
// empty string if there is no such header. As with headerIndexFromName(),
// `headerName` must be lower case.
const headerValueFromName = function(headerName, headers) {
    const i = headerIndexFromName(headerName, headers);
    return i !== -1 ? headers[i].value : '';
};
|
|
|
|
/******************************************************************************/
|
|
|
|
// Keeps track of hostnames for which strict blocking is temporarily
// bypassed. Each bypassed hostname is mapped to the time (ms since epoch)
// at which its bypass expires.
const strictBlockBypasser = {
    hostnameToDeadlineMap: new Map(),
    cleanupTimer: undefined,

    // Discard all entries for which the deadline has passed.
    cleanup: function() {
        const now = Date.now();
        for ( const [ hostname, deadline ] of this.hostnameToDeadlineMap ) {
            if ( deadline <= now ) {
                this.hostnameToDeadlineMap.delete(hostname);
            }
        }
    },

    // Bypass strict blocking for `hostname` for the duration set by the
    // `strictBlockingBypassDuration` hidden setting (seconds). Anything
    // other than a non-empty string is ignored.
    bypass: function(hostname) {
        if ( typeof hostname !== 'string' || hostname === '' ) { return; }
        this.hostnameToDeadlineMap.set(
            hostname,
            Date.now() + µBlock.hiddenSettings.strictBlockingBypassDuration * 1000
        );
    },

    // Returns true if `hostname`, or any hostname obtained by successively
    // removing its leftmost label, is currently bypassed. A successful
    // lookup renews the deadline of the matching entry; an expired entry
    // found along the way is removed.
    isBypassed: function(hostname) {
        if ( this.hostnameToDeadlineMap.size === 0 ) { return false; }
        let bypassDuration =
            µBlock.hiddenSettings.strictBlockingBypassDuration * 1000;
        // Schedule a one-shot cleanup of expired entries, unless one is
        // already pending.
        if ( this.cleanupTimer === undefined ) {
            this.cleanupTimer = vAPI.setTimeout(
                ( ) => {
                    this.cleanupTimer = undefined;
                    this.cleanup();
                },
                bypassDuration + 10000
            );
        }
        for (;;) {
            const deadline = this.hostnameToDeadlineMap.get(hostname);
            if ( deadline !== undefined ) {
                if ( deadline > Date.now() ) {
                    this.hostnameToDeadlineMap.set(
                        hostname,
                        Date.now() + bypassDuration
                    );
                    return true;
                }
                this.hostnameToDeadlineMap.delete(hostname);
            }
            // Move on to the parent hostname, if any.
            const pos = hostname.indexOf('.');
            if ( pos === -1 ) { break; }
            hostname = hostname.slice(pos + 1);
        }
        return false;
    }
};
|
|
|
|
/******************************************************************************/
|
|
|
|
return {
|
|
start: (( ) => {
|
|
vAPI.net = new vAPI.Net();
|
|
vAPI.net.suspend();
|
|
|
|
return function() {
|
|
vAPI.net.setSuspendableListener(onBeforeRequest);
|
|
vAPI.net.addListener(
|
|
'onHeadersReceived',
|
|
onHeadersReceived,
|
|
{
|
|
types: [
|
|
'main_frame',
|
|
'sub_frame',
|
|
'image',
|
|
'media',
|
|
'xmlhttprequest',
|
|
],
|
|
urls: [ 'http://*/*', 'https://*/*' ],
|
|
},
|
|
[ 'blocking', 'responseHeaders' ]
|
|
);
|
|
if ( vAPI.net.validTypes.has('csp_report') ) {
|
|
vAPI.net.addListener(
|
|
'onBeforeRequest',
|
|
onBeforeMaybeSpuriousCSPReport,
|
|
{
|
|
types: [ 'csp_report' ],
|
|
urls: [ 'http://*/*', 'https://*/*' ]
|
|
},
|
|
[ 'blocking', 'requestBody' ]
|
|
);
|
|
}
|
|
vAPI.net.unsuspend(true);
|
|
};
|
|
})(),
|
|
|
|
strictBlockBypass: function(hostname) {
|
|
strictBlockBypasser.bypass(hostname);
|
|
}
|
|
};
|
|
|
|
/******************************************************************************/
|
|
|
|
})();
|
|
|
|
/******************************************************************************/
|