2014-06-24 00:42:43 +02:00
|
|
|
|
/*******************************************************************************
|
|
|
|
|
|
2016-06-27 03:15:18 +02:00
|
|
|
|
uBlock Origin - a browser extension to block requests.
|
2017-05-12 16:35:11 +02:00
|
|
|
|
Copyright (C) 2014-2017 Raymond Hill
|
2014-06-24 00:42:43 +02:00
|
|
|
|
|
|
|
|
|
This program is free software: you can redistribute it and/or modify
|
|
|
|
|
it under the terms of the GNU General Public License as published by
|
|
|
|
|
the Free Software Foundation, either version 3 of the License, or
|
|
|
|
|
(at your option) any later version.
|
|
|
|
|
|
|
|
|
|
This program is distributed in the hope that it will be useful,
|
|
|
|
|
but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
|
|
|
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
|
|
|
GNU General Public License for more details.
|
|
|
|
|
|
|
|
|
|
You should have received a copy of the GNU General Public License
|
|
|
|
|
along with this program. If not, see {http://www.gnu.org/licenses/}.
|
|
|
|
|
|
|
|
|
|
Home: https://github.com/gorhill/uBlock
|
|
|
|
|
*/
|
|
|
|
|
|
2015-12-29 17:34:41 +01:00
|
|
|
|
/* jshint bitwise: false */
|
|
|
|
|
/* global punycode */
|
2014-10-19 17:10:31 +02:00
|
|
|
|
|
2016-06-27 03:15:18 +02:00
|
|
|
|
'use strict';
|
|
|
|
|
|
2014-06-24 00:42:43 +02:00
|
|
|
|
/******************************************************************************/
|
|
|
|
|
|
2014-12-28 16:07:43 +01:00
|
|
|
|
µBlock.staticNetFilteringEngine = (function(){
|
2014-06-24 00:42:43 +02:00
|
|
|
|
|
|
|
|
|
/******************************************************************************/
|
|
|
|
|
|
2014-09-14 22:20:40 +02:00
|
|
|
|
var µb = µBlock;
|
|
|
|
|
|
2014-07-14 17:24:59 +02:00
|
|
|
|
// Layout of the category bits decoded by toLogDataInternal():
//
//   fedcba9876543210
//         |    | |||
//         |    | |||
//         |    | |||
//         |    | |||
//         |    | ||+---- bit    0: [BlockAction | AllowAction]
//         |    | |+----- bit    1: `important`
//         |    | +------ bit 2- 3: party [0 - 3]
//         |    +-------- bit 4- 8: type [0 - 31]
//         +------------- bit 9-15: unused

// Bit 0: action.
var BlockAction = 0 << 0;
var AllowAction = 1 << 0;

// Bit 1: `important` option.
var Important = 1 << 1;

// Bits 2-3: party.
var AnyParty = 0 << 2;
var FirstParty = 1 << 2;
var ThirdParty = 2 << 2;

// Bits 4-8: type; 0 means "no specific type".
var AnyType = 0 << 4;
|
2014-09-21 02:06:55 +02:00
|
|
|
|
// Maps a request type name to its value, already shifted into the type field
// (bits 4-8) of the category bits.
var typeNameToTypeValue = {
           'no_type':  0 << 4,
        'stylesheet':  1 << 4,
             'image':  2 << 4,
            'object':  3 << 4,
            'script':  4 << 4,
    'xmlhttprequest':  5 << 4,
         'sub_frame':  6 << 4,
              'font':  7 << 4,
             'media':  8 << 4,
         'websocket':  9 << 4,
             'other': 10 << 4,
             'popup': 11 << 4,  // start of behavioral filtering
          'popunder': 12 << 4,
        'main_frame': 13 << 4,  // start of 1st-party-only behavioral filtering
       'generichide': 14 << 4,
     'inline-script': 15 << 4,
              'data': 16 << 4   // special: a generic data holder
};
var otherTypeBitValue = typeNameToTypeValue.other;

// Reverse mapping: unshifted type value => name used when rendering a filter
// for log purposes (see toLogDataInternal). Note that the names for values 6
// and 13 ('subdocument', 'document') differ from the keys used in
// typeNameToTypeValue ('sub_frame', 'main_frame'). There is no entry for 0.
var typeValueToTypeName = {
     1: 'stylesheet',
     2: 'image',
     3: 'object',
     4: 'script',
     5: 'xmlhttprequest',
     6: 'subdocument',
     7: 'font',
     8: 'media',
     9: 'websocket',
    10: 'other',
    11: 'popup',
    12: 'popunder',
    13: 'document',
    14: 'generichide',
    15: 'inline-script',
    16: 'data'
};

// All network request types to bitmap
//   bring origin to 0 (from 4 -- see typeNameToTypeValue)
//   left-shift 1 by the above-calculated value
//   subtract 1 to set all type bits
// With 'other' being type 10, the result has its ten low bits set (0x3FF).
var allNetRequestTypesBitmap = (1 << (otherTypeBitValue >>> 4)) - 1;
|
2015-02-08 05:42:07 +01:00
|
|
|
|
|
2015-03-03 12:09:35 +01:00
|
|
|
|
// Pre-computed combinations of category bits. Since BlockAction, AnyType and
// AnyParty are all zero, the `Block*` values are 0 and the `Allow*` values
// equal AllowAction; the distinct names document intent at the point of use.
var BlockAnyTypeAnyParty = BlockAction | AnyType | AnyParty;
var BlockAnyType = BlockAction | AnyType;
var BlockAnyParty = BlockAction | AnyParty;

var AllowAnyTypeAnyParty = AllowAction | AnyType | AnyParty;
var AllowAnyType = AllowAction | AnyType;
var AllowAnyParty = AllowAction | AnyParty;

// Category bits for the two `generichide` variants: an exception (allow)
// filter, and a block filter carrying the `important` bit.
var genericHideException = AllowAction | AnyParty | typeNameToTypeValue.generichide,
    genericHideImportant = BlockAction | AnyParty | typeNameToTypeValue.generichide | Important;
|
|
|
|
|
|
2014-06-24 00:42:43 +02:00
|
|
|
|
// ABP filters: https://adblockplus.org/en/filters
|
|
|
|
|
// regex tester: http://regex101.com/
|
|
|
|
|
|
|
|
|
|
/******************************************************************************/
|
2014-09-21 20:03:41 +02:00
|
|
|
|
|
2015-02-05 00:06:31 +01:00
|
|
|
|
// See the following as short-lived registers, used during evaluation. They are
|
|
|
|
|
// valid until the next evaluation.
|
|
|
|
|
|
2017-05-12 16:35:11 +02:00
|
|
|
|
// Hostname registers shared by the filter classes in this file;
// requestHostnameRegister is what FilterPlainHostname.prototype.match() tests
// against. Both start out empty.
var pageHostnameRegister = '',
    requestHostnameRegister = '';
|
2015-03-30 23:42:12 +02:00
|
|
|
|
//var filterRegister = null;
|
|
|
|
|
//var categoryRegister = '';
|
2015-02-05 00:06:31 +01:00
|
|
|
|
|
|
|
|
|
/******************************************************************************/
|
|
|
|
|
|
2014-09-21 20:03:41 +02:00
|
|
|
|
// No-op placeholder: calling histogram() does nothing. A diagnostic
// implementation which would replace it is kept commented out right below.
var histogram = function() {};
|
2014-06-24 00:42:43 +02:00
|
|
|
|
/*
|
2014-09-21 20:03:41 +02:00
|
|
|
|
histogram = function(label, categories) {
|
2014-06-24 00:42:43 +02:00
|
|
|
|
var h = [],
|
|
|
|
|
categoryBucket;
|
|
|
|
|
for ( var k in categories ) {
|
2014-09-21 15:40:54 +02:00
|
|
|
|
// No need for hasOwnProperty() here: there is no prototype chain.
|
2014-06-24 00:42:43 +02:00
|
|
|
|
categoryBucket = categories[k];
|
|
|
|
|
for ( var kk in categoryBucket ) {
|
2014-09-21 15:40:54 +02:00
|
|
|
|
// No need for hasOwnProperty() here: there is no prototype chain.
|
2014-06-24 00:42:43 +02:00
|
|
|
|
filterBucket = categoryBucket[kk];
|
|
|
|
|
h.push({
|
2014-09-21 20:03:41 +02:00
|
|
|
|
k: k.charCodeAt(0).toString(2) + ' ' + kk,
|
2014-06-24 00:42:43 +02:00
|
|
|
|
n: filterBucket instanceof FilterBucket ? filterBucket.filters.length : 1
|
|
|
|
|
});
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
console.log('Histogram %s', label);
|
|
|
|
|
|
|
|
|
|
var total = h.length;
|
|
|
|
|
h.sort(function(a, b) { return b.n - a.n; });
|
|
|
|
|
|
|
|
|
|
// Find indices of entries of interest
|
|
|
|
|
var target = 2;
|
|
|
|
|
for ( var i = 0; i < total; i++ ) {
|
|
|
|
|
if ( h[i].n === target ) {
|
|
|
|
|
console.log('\tEntries with only %d filter(s) start at index %s (key = "%s")', target, i, h[i].k);
|
|
|
|
|
target -= 1;
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
h = h.slice(0, 50);
|
|
|
|
|
|
|
|
|
|
h.forEach(function(v) {
|
|
|
|
|
console.log('\tkey=%s count=%d', v.k, v.n);
|
|
|
|
|
});
|
|
|
|
|
console.log('\tTotal buckets count: %d', total);
|
|
|
|
|
};
|
|
|
|
|
*/
|
2014-09-08 23:46:58 +02:00
|
|
|
|
/******************************************************************************/
|
|
|
|
|
|
2015-06-09 23:01:31 +02:00
|
|
|
|
// Local helpers
|
|
|
|
|
|
2016-07-25 14:18:17 +02:00
|
|
|
|
// Be sure to not confuse 'example.com' with 'anotherexample.com'
|
2015-12-15 16:40:40 +01:00
|
|
|
|
// Returns true when `hostname` is `domain` itself or a subdomain of it.
//
// A plain suffix test is not enough ('anotherexample.com' ends with
// 'example.com'), hence when `hostname` is longer than `domain` the character
// immediately preceding the suffix must be a dot.
var isFirstParty = function(domain, hostname) {
    return hostname.endsWith(domain) &&
          (hostname.length === domain.length ||
           hostname.charCodeAt(hostname.length - domain.length - 1) === 0x2E /* '.' */);
};
|
|
|
|
|
|
2016-01-17 02:21:17 +01:00
|
|
|
|
// Validates the regular expression source `s` by compiling it.
//
// Returns the `source` of the resulting RegExp when `s` is valid. When `s` is
// not a valid regular expression, returns the empty string and stores the
// stringified exception in `normalizeRegexSource.message`. The message is not
// cleared on success, so it is only meaningful right after a call which
// returned ''.
var normalizeRegexSource = function(s) {
    try {
        var re = new RegExp(s);
        return re.source;
    } catch (ex) {
        normalizeRegexSource.message = ex.toString();
    }
    return '';
};
|
|
|
|
|
|
2017-05-12 16:35:11 +02:00
|
|
|
|
// Converts the pattern part `s` of a filter into regular expression source.
//
// Steps, in order:
//   1. escape regex metacharacters other than `*` and `^` (escape1);
//   2. turn the `^` separator placeholder into "any character which is not
//      one of %.0-9a-z_- , or the end of the string" (escape2);
//   3. drop a leading and/or trailing `*` -- there is no point (escape3);
//   4. turn each remaining `*` into a lazy run of non-space characters
//      (escape4).
//
// `anchor` is a bit field (a missing value behaves as 0):
//   0x4: prefix with `[0-9a-z.-]*?`; takes precedence over 0x2
//   0x2: anchor at the start with `^`
//   0x1: anchor at the end with `$`
//
// https://www.loggly.com/blog/five-invaluable-techniques-to-improve-regex-performance/
// https://developer.mozilla.org/en/docs/Web/JavaScript/Guide/Regular_Expressions
var rawToRegexStr = function(s, anchor) {
    var me = rawToRegexStr;
    var reStr = s.replace(me.escape1, '\\$&')
                 .replace(me.escape2, '(?:[^%.0-9a-z_-]|$)')
                 .replace(me.escape3, '')
                 .replace(me.escape4, '[^ ]*?');
    if ( anchor & 0x4 ) {
        reStr = '[0-9a-z.-]*?' + reStr;
    } else if ( anchor & 0x2 ) {
        reStr = '^' + reStr;
    }
    if ( anchor & 0x1 ) {
        reStr += '$';
    }
    return reStr;
};
rawToRegexStr.escape1 = /[.+?${}()|[\]\\]/g;
rawToRegexStr.escape2 = /\^/g;
rawToRegexStr.escape3 = /^\*|\*$/g;
rawToRegexStr.escape4 = /\*/g;
|
2015-03-02 16:41:51 +01:00
|
|
|
|
|
2017-05-12 16:35:11 +02:00
|
|
|
|
// If using native Map, we use numerical keys, otherwise for
|
|
|
|
|
// Object-based map we use string-based keys.
|
2017-05-19 14:45:19 +02:00
|
|
|
|
// Serializes the number `k` as a base-32 string. importInt() is the inverse.
var exportInt = function(k) {
    return k.toString(32);
};
|
2017-05-12 16:35:11 +02:00
|
|
|
|
|
2017-05-19 14:45:19 +02:00
|
|
|
|
// Parses the base-32 string `k` (as produced by exportInt()) into a number.
// As with any parseInt() call, the result is NaN when `k` does not start with
// a valid base-32 digit.
var importInt = function(k) {
    return parseInt(k, 32);
};
|
2017-05-12 16:35:11 +02:00
|
|
|
|
|
2017-05-19 14:45:19 +02:00
|
|
|
|
// Builds the log data for `filter`, as found under the category
// `categoryBits` and the token hash `tokenHash`.
//
// Returns undefined when `filter` is null. Otherwise returns the object
// produced by `filter.logData()`, amended as follows:
//   - `compiled` is prefixed with the base-32 category bits and token hash,
//     each followed by a '\v' separator;
//   - `raw` is prefixed with '@@' when the allow bit (bit 0) is set;
//   - `raw` is suffixed with '$' and the comma-separated list of options
//     derived from the category bits (`important`, party, type), followed by
//     whatever options the filter itself reported through `opts`.
var toLogDataInternal = function(categoryBits, tokenHash, filter) {
    if ( filter === null ) { return undefined; }
    var logData = filter.logData();
    logData.compiled = exportInt(categoryBits) + '\v' +
                       exportInt(tokenHash) + '\v' +
                       logData.compiled;
    if ( categoryBits & 0x001 ) {
        logData.raw = '@@' + logData.raw;
    }
    var opts = [];
    if ( categoryBits & 0x002 ) {
        opts.push('important');
    }
    // Bits 2-3 hold the party: third-party (0x008) is tested first.
    if ( categoryBits & 0x008 ) {
        opts.push('third-party');
    } else if ( categoryBits & 0x004 ) {
        opts.push('first-party');
    }
    // Bits 4-8 hold the type. Type 0 (none) and type 16 (`data`) are not
    // rendered as an option.
    var type = (categoryBits >>> 4) & 0x1F;
    if ( type !== 0 && type !== 16 /* data */ ) {
        opts.push(typeValueToTypeName[type]);
    }
    if ( logData.opts !== undefined ) {
        opts.push(logData.opts);
    }
    if ( opts.length !== 0 ) {
        logData.raw += '$' + opts.join(',');
    }
    return logData;
};
|
|
|
|
|
|
2016-08-23 16:33:28 +02:00
|
|
|
|
// First character of match must be within the hostname part of the url.
|
|
|
|
|
// Characters which can only appear after the hostname part of a URL.
var reURLPostHostnameAnchors = /[\/?#]/;

// Tells whether a match starting at index `matchStart` in `url` qualifies as
// hostname-anchored: the first character of the match must be within the
// hostname part of the URL.
//
// Returns false when `url` contains no '://'. Returns true when the match
// starts at or before the first character following '://'. Otherwise the
// match must start before any of `/`, `?`, `#`, and right after a dot.
var isHnAnchored = function(url, matchStart) {
    var hnStart = url.indexOf('://');
    if ( hnStart === -1 ) { return false; }
    hnStart += 3;
    if ( matchStart <= hnStart ) { return true; }
    if ( reURLPostHostnameAnchors.test(url.slice(hnStart, matchStart)) ) {
        return false;
    }
    // https://github.com/gorhill/uBlock/issues/1929
    // Match only hostname label boundaries.
    return url.charCodeAt(matchStart - 1) === 0x2E;
};
|
|
|
|
|
|
2017-05-12 16:35:11 +02:00
|
|
|
|
/*******************************************************************************
|
2015-08-22 18:15:16 +02:00
|
|
|
|
|
2017-05-12 16:35:11 +02:00
|
|
|
|
Each filter class will register itself in the map. A filter class
|
|
|
|
|
id MUST always stringify to ONE single character.
|
2015-08-22 18:15:16 +02:00
|
|
|
|
|
2017-05-12 16:35:11 +02:00
|
|
|
|
IMPORTANT: any change which modifies the mapping will have to be
|
|
|
|
|
reflected with µBlock.systemSettings.compiledMagic.
|
2017-01-06 18:39:37 +01:00
|
|
|
|
|
2017-05-12 16:35:11 +02:00
|
|
|
|
**/
|
2015-08-22 18:15:16 +02:00
|
|
|
|
|
2017-05-12 16:35:11 +02:00
|
|
|
|
// Registry of filter classes: numerical filter class id => constructor.
var filterClasses = new Map(),
    filterClassIdGenerator = 0;

// Registers the filter class `ctor`: assigns it the next sequential id, and
// stores the id in base 32 followed by a tab as `fidPrefix`, on both the
// constructor and its prototype.
//
// The `load()` methods of the filter classes skip the prefix with
// `s.slice(2)`, which is why an id must stringify to ONE single character
// (base 32 allows for up to 32 classes).
var registerFilterClass = function(ctor) {
    var fid = filterClassIdGenerator++;
    ctor.fidPrefix = ctor.prototype.fidPrefix = fid.toString(32) + '\t';
    filterClasses.set(fid, ctor);
    //console.log(ctor.name, fid);
};
|
|
|
|
|
|
2017-05-12 16:35:11 +02:00
|
|
|
|
/******************************************************************************/
|
2017-01-06 18:39:37 +01:00
|
|
|
|
|
2017-05-12 16:35:11 +02:00
|
|
|
|
// Filter which matches unconditionally. It holds no state, hence its
// compiled form is just the filter class id prefix.
var FilterTrue = function() {
};

// Always a match, whatever the arguments.
FilterTrue.prototype.match = function() {
    return true;
};

// Log details: rendered as the `*` filter, with `^` as regex equivalent.
FilterTrue.prototype.logData = function() {
    return {
        raw: '*',
        regex: '^',
        compiled: this.compile(),
    };
};

// Compiled form of this instance.
FilterTrue.prototype.compile = function() {
    return this.fidPrefix;
};

// Compiled form of this filter class; no details are needed.
FilterTrue.compile = function() {
    return FilterTrue.fidPrefix;
};

// Instantiates from compiled form; there is nothing to parse.
FilterTrue.load = function() {
    return new FilterTrue();
};

registerFilterClass(FilterTrue);
|
2014-06-24 00:42:43 +02:00
|
|
|
|
|
|
|
|
|
/******************************************************************************/
|
|
|
|
|
|
|
|
|
|
// Plain string filter, with no anchoring.
//   s: the string to find in the URL
//   tokenBeg: offset which is subtracted from the position passed to match()
//             in order to find where `s` must start -- presumably the
//             position of the filter's token within `s`.
var FilterPlain = function(s, tokenBeg) {
    this.s = s;
    this.tokenBeg = tokenBeg;
};

// Matches when `s` is found in `url` exactly at `tokenBeg - this.tokenBeg`.
FilterPlain.prototype.match = function(url, tokenBeg) {
    return url.startsWith(this.s, tokenBeg - this.tokenBeg);
};

FilterPlain.prototype.logData = function() {
    return {
        raw: this.s,
        regex: rawToRegexStr(this.s),
        compiled: this.compile()
    };
};

// Compiled form: fidPrefix + s + '\t' + tokenBeg.
FilterPlain.prototype.compile = function() {
    return this.fidPrefix + this.s + '\t' + this.tokenBeg;
};

// Same compiled form, built from `details.f` and `details.tokenBeg`.
FilterPlain.compile = function(details) {
    return FilterPlain.fidPrefix + details.f + '\t' + details.tokenBeg;
};

// Instantiates from compiled form. The first two characters are the filter
// class id prefix; the first tab found past them separates `s` from
// `tokenBeg`.
FilterPlain.load = function(s) {
    var pos = s.indexOf('\t', 2);
    return new FilterPlain(
        s.slice(2, pos),
        parseInt(s.slice(pos + 1), 10)
    );
};

registerFilterClass(FilterPlain);
|
2014-09-08 23:46:58 +02:00
|
|
|
|
|
2014-06-24 00:42:43 +02:00
|
|
|
|
/******************************************************************************/
|
|
|
|
|
|
|
|
|
|
// Plain string filter for which the string must start exactly at the
// position passed to match().
var FilterPlainPrefix0 = function(s) {
    this.s = s;
};

// Matches when `s` is found in `url` exactly at `tokenBeg`.
FilterPlainPrefix0.prototype.match = function(url, tokenBeg) {
    return url.startsWith(this.s, tokenBeg);
};

FilterPlainPrefix0.prototype.logData = function() {
    return {
        raw: this.s,
        regex: rawToRegexStr(this.s),
        compiled: this.compile()
    };
};

// Compiled form: fidPrefix + s.
FilterPlainPrefix0.prototype.compile = function() {
    return this.fidPrefix + this.s;
};

// Same compiled form, built from `details.f`.
FilterPlainPrefix0.compile = function(details) {
    return FilterPlainPrefix0.fidPrefix + details.f;
};

// Instantiates from compiled form: all that follows the two-character filter
// class id prefix is the string to match.
FilterPlainPrefix0.load = function(s) {
    return new FilterPlainPrefix0(s.slice(2));
};

registerFilterClass(FilterPlainPrefix0);
|
2014-09-08 23:46:58 +02:00
|
|
|
|
|
2014-06-24 00:42:43 +02:00
|
|
|
|
/******************************************************************************/
|
|
|
|
|
|
|
|
|
|
// Plain string filter for which the string must start one character before
// the position passed to match().
var FilterPlainPrefix1 = function(s) {
    this.s = s;
};

// Matches when `s` is found in `url` exactly at `tokenBeg - 1`.
FilterPlainPrefix1.prototype.match = function(url, tokenBeg) {
    return url.startsWith(this.s, tokenBeg - 1);
};

FilterPlainPrefix1.prototype.logData = function() {
    return {
        raw: this.s,
        regex: rawToRegexStr(this.s),
        compiled: this.compile()
    };
};

// Compiled form: fidPrefix + s.
FilterPlainPrefix1.prototype.compile = function() {
    return this.fidPrefix + this.s;
};

// Same compiled form, built from `details.f`.
FilterPlainPrefix1.compile = function(details) {
    return FilterPlainPrefix1.fidPrefix + details.f;
};

// Instantiates from compiled form: all that follows the two-character filter
// class id prefix is the string to match.
FilterPlainPrefix1.load = function(s) {
    return new FilterPlainPrefix1(s.slice(2));
};

registerFilterClass(FilterPlainPrefix1);
|
|
|
|
|
|
2014-08-28 15:59:05 +02:00
|
|
|
|
/******************************************************************************/
|
|
|
|
|
|
2017-05-12 16:35:11 +02:00
|
|
|
|
// Filter which matches a whole hostname (rendered as `||hostname^`).
var FilterPlainHostname = function(s) {
    this.s = s;
};

// Matches when the hostname found in `requestHostnameRegister` is `s` itself
// or a subdomain of it: the register must end with `s`, and the matched part
// must either be the whole hostname or be preceded by a dot. The arguments
// passed to match() are not used.
FilterPlainHostname.prototype.match = function() {
    var haystack = requestHostnameRegister, needle = this.s;
    if ( haystack.endsWith(needle) === false ) { return false; }
    var offset = haystack.length - needle.length;
    return offset === 0 || haystack.charCodeAt(offset - 1) === 0x2E /* '.' */;
};

FilterPlainHostname.prototype.logData = function() {
    return {
        raw: '||' + this.s + '^',
        regex: rawToRegexStr(this.s, 0x4),
        compiled: this.compile()
    };
};

// Compiled form: fidPrefix + s.
FilterPlainHostname.prototype.compile = function() {
    return this.fidPrefix + this.s;
};

// Same compiled form, built from `details.f`.
FilterPlainHostname.compile = function(details) {
    return FilterPlainHostname.fidPrefix + details.f;
};

// Instantiates from compiled form: all that follows the two-character filter
// class id prefix is the hostname.
FilterPlainHostname.load = function(s) {
    return new FilterPlainHostname(s.slice(2));
};

registerFilterClass(FilterPlainHostname);
|
|
|
|
|
|
2014-06-24 00:42:43 +02:00
|
|
|
|
/******************************************************************************/
|
|
|
|
|
|
|
|
|
|
// Plain string filter anchored at the start of the URL (rendered as `|s`).
var FilterPlainLeftAnchored = function(s) {
    this.s = s;
};

// Matches when `url` starts with `s`.
FilterPlainLeftAnchored.prototype.match = function(url) {
    return url.startsWith(this.s);
};

FilterPlainLeftAnchored.prototype.logData = function() {
    return {
        raw: '|' + this.s,
        regex: rawToRegexStr(this.s, 0x2),
        compiled: this.compile()
    };
};

// Compiled form: fidPrefix + s.
FilterPlainLeftAnchored.prototype.compile = function() {
    return this.fidPrefix + this.s;
};

// Same compiled form, built from `details.f`.
FilterPlainLeftAnchored.compile = function(details) {
    return FilterPlainLeftAnchored.fidPrefix + details.f;
};

// Instantiates from compiled form: all that follows the two-character filter
// class id prefix is the string to match.
FilterPlainLeftAnchored.load = function(s) {
    return new FilterPlainLeftAnchored(s.slice(2));
};

registerFilterClass(FilterPlainLeftAnchored);
|
|
|
|
|
|
2014-08-28 15:59:05 +02:00
|
|
|
|
/******************************************************************************/
|
|
|
|
|
|
2017-05-12 16:35:11 +02:00
|
|
|
|
// Plain string filter anchored at the end of the URL (rendered as `s|`).
var FilterPlainRightAnchored = function(s) {
    this.s = s;
};

// Matches when `url` ends with `s`.
FilterPlainRightAnchored.prototype.match = function(url) {
    return url.endsWith(this.s);
};

FilterPlainRightAnchored.prototype.logData = function() {
    return {
        raw: this.s + '|',
        regex: rawToRegexStr(this.s, 0x1),
        compiled: this.compile()
    };
};

// Compiled form: fidPrefix + s.
FilterPlainRightAnchored.prototype.compile = function() {
    return this.fidPrefix + this.s;
};

// Same compiled form, built from `details.f`.
FilterPlainRightAnchored.compile = function(details) {
    return FilterPlainRightAnchored.fidPrefix + details.f;
};

// Instantiates from compiled form: all that follows the two-character filter
// class id prefix is the string to match.
FilterPlainRightAnchored.load = function(s) {
    return new FilterPlainRightAnchored(s.slice(2));
};

registerFilterClass(FilterPlainRightAnchored);
|
|
|
|
|
|
2014-06-24 00:42:43 +02:00
|
|
|
|
/******************************************************************************/
|
|
|
|
|
|
2017-05-12 16:35:11 +02:00
|
|
|
|
// Plain string filter anchored to the hostname part of the URL (rendered as
// `||s`).
var FilterPlainHnAnchored = function(s) {
    this.s = s;
};

// Matches when `s` is found in `url` exactly at `tokenBeg`, and that
// position qualifies as hostname-anchored according to isHnAnchored().
FilterPlainHnAnchored.prototype.match = function(url, tokenBeg) {
    return url.startsWith(this.s, tokenBeg) &&
           isHnAnchored(url, tokenBeg);
};

FilterPlainHnAnchored.prototype.logData = function() {
    return {
        raw: '||' + this.s,
        regex: rawToRegexStr(this.s),
        compiled: this.compile()
    };
};

// Compiled form: fidPrefix + s.
FilterPlainHnAnchored.prototype.compile = function() {
    return this.fidPrefix + this.s;
};

// Same compiled form, built from `details.f`.
FilterPlainHnAnchored.compile = function(details) {
    return FilterPlainHnAnchored.fidPrefix + details.f;
};

// Instantiates from compiled form: all that follows the two-character filter
// class id prefix is the string to match.
FilterPlainHnAnchored.load = function(s) {
    return new FilterPlainHnAnchored(s.slice(2));
};

registerFilterClass(FilterPlainHnAnchored);
|
|
|
|
|
|
2014-08-28 15:59:05 +02:00
|
|
|
|
/******************************************************************************/
|
|
|
|
|
|
2017-05-12 16:35:11 +02:00
|
|
|
|
// Generic filter, i.e. a pattern which needs a regular expression (built by
// rawToRegexStr()) in order to be tested.
//   s: the raw pattern
//   anchor: bit field handed over to rawToRegexStr(); 0x2 is rendered as a
//           leading `|` and 0x1 as a trailing `|` in the log data.
var FilterGeneric = function(s, anchor) {
    this.s = s;
    this.anchor = anchor;
};

// The regular expression is created lazily, the first time it is needed.
FilterGeneric.prototype.re = null;

FilterGeneric.prototype.match = function(url) {
    if ( this.re === null ) {
        this.re = new RegExp(rawToRegexStr(this.s, this.anchor));
    }
    return this.re.test(url);
};

FilterGeneric.prototype.logData = function() {
    // Since the regex is created lazily, it may not exist yet if match() was
    // never called on this instance: create it rather than dereference null.
    if ( this.re === null ) {
        this.re = new RegExp(rawToRegexStr(this.s, this.anchor));
    }
    var out = {
        raw: this.s,
        regex: this.re.source,
        compiled: this.compile()
    };
    if ( this.anchor & 0x2 ) {
        out.raw = '|' + out.raw;
    }
    if ( this.anchor & 0x1 ) {
        out.raw += '|';
    }
    return out;
};

// Compiled form: fidPrefix + s + '\t' + anchor.
FilterGeneric.prototype.compile = function() {
    return this.fidPrefix + this.s + '\t' + this.anchor;
};

// Same compiled form, built from `details.f` and `details.anchor`.
FilterGeneric.compile = function(details) {
    return FilterGeneric.fidPrefix + details.f + '\t' + details.anchor;
};

// Instantiates from compiled form. The first two characters are the filter
// class id prefix; the first tab found past them separates `s` from `anchor`.
FilterGeneric.load = function(s) {
    var pos = s.indexOf('\t', 2);
    return new FilterGeneric(
        s.slice(2, pos),
        parseInt(s.slice(pos + 1), 10)
    );
};

registerFilterClass(FilterGeneric);
|
2014-06-24 00:42:43 +02:00
|
|
|
|
|
2017-05-12 16:35:11 +02:00
|
|
|
|
/******************************************************************************/
|
2014-09-19 16:59:44 +02:00
|
|
|
|
|
2017-05-12 16:35:11 +02:00
|
|
|
|
// Generic (regex-based) filter anchored to the hostname part of the URL
// (rendered as `||s`).
var FilterGenericHnAnchored = function(s) {
    this.s = s;
};

// The regular expression is created lazily, the first time it is needed.
FilterGenericHnAnchored.prototype.re = null;
// Anchor bits handed over to rawToRegexStr(): 0x4 = hostname-anchored.
FilterGenericHnAnchored.prototype.anchor = 0x4;

// Matches when the regex is found in `url`, and the position of the match
// qualifies as hostname-anchored according to isHnAnchored().
FilterGenericHnAnchored.prototype.match = function(url) {
    if ( this.re === null ) {
        this.re = new RegExp(rawToRegexStr(this.s, this.anchor));
    }
    var matchStart = url.search(this.re);
    return matchStart !== -1 && isHnAnchored(url, matchStart);
};

FilterGenericHnAnchored.prototype.logData = function() {
    // Since the regex is created lazily, it may not exist yet if match() was
    // never called on this instance: create it rather than dereference null.
    if ( this.re === null ) {
        this.re = new RegExp(rawToRegexStr(this.s, this.anchor));
    }
    var out = {
        raw: '||' + this.s,
        regex: this.re.source,
        compiled: this.compile()
    };
    return out;
};

// Compiled form: fidPrefix + s.
FilterGenericHnAnchored.prototype.compile = function() {
    return this.fidPrefix + this.s;
};

// Same compiled form, built from `details.f`.
FilterGenericHnAnchored.compile = function(details) {
    return FilterGenericHnAnchored.fidPrefix + details.f;
};

// Instantiates from compiled form: all that follows the two-character filter
// class id prefix is the raw pattern.
FilterGenericHnAnchored.load = function(s) {
    return new FilterGenericHnAnchored(s.slice(2));
};

registerFilterClass(FilterGenericHnAnchored);
|
2014-09-19 16:59:44 +02:00
|
|
|
|
|
|
|
|
|
/******************************************************************************/
|
|
|
|
|
|
2017-05-12 16:35:11 +02:00
|
|
|
|
// Generic (regex-based) filter anchored both to the hostname part of the URL
// and to the end of the URL (rendered as `||s|`). It specializes
// FilterGenericHnAnchored: matching is inherited, only the anchor bits and
// the rendering differ.
var FilterGenericHnAndRightAnchored = function(s) {
    FilterGenericHnAnchored.call(this, s);
};

FilterGenericHnAndRightAnchored.prototype = Object.create(FilterGenericHnAnchored.prototype, {
    constructor: {
        value: FilterGenericHnAndRightAnchored
    },
    // 0x4 (hostname-anchored) | 0x1 (right-anchored)
    anchor: {
        value: 0x5
    },
    // Same as the parent's log data, with the trailing anchor appended to
    // the raw filter.
    logData: {
        value: function() {
            var out = FilterGenericHnAnchored.prototype.logData.call(this);
            out.raw += '|';
            return out;
        }
    },
    // Compiled form: fidPrefix + s.
    compile: {
        value: function() {
            return this.fidPrefix + this.s;
        }
    },
});

// Same compiled form, built from `details.f`.
FilterGenericHnAndRightAnchored.compile = function(details) {
    return FilterGenericHnAndRightAnchored.fidPrefix + details.f;
};

// Instantiates from compiled form: all that follows the two-character filter
// class id prefix is the raw pattern.
FilterGenericHnAndRightAnchored.load = function(s) {
    return new FilterGenericHnAndRightAnchored(s.slice(2));
};

registerFilterClass(FilterGenericHnAndRightAnchored);
|
2015-04-27 21:09:19 +02:00
|
|
|
|
|
|
|
|
|
/******************************************************************************/
|
|
|
|
|
|
2017-05-12 16:35:11 +02:00
|
|
|
|
// Filter which is a literal regular expression (rendered as `/regex/`).
// The regex is created case-insensitive from the source `s`; only the RegExp
// instance is kept, hence its `source` property is the reference whenever
// the pattern is needed afterward.
var FilterRegex = function(s) {
    this.re = new RegExp(s, 'i');
};

FilterRegex.prototype.match = function(url) {
    return this.re.test(url);
};

FilterRegex.prototype.logData = function() {
    // The constructor does not keep the source string around (there is no
    // `this.s`): the pattern must be read from the regex itself, as
    // compile() does.
    var source = this.re.source;
    return {
        raw: '/' + source + '/',
        regex: source,
        compiled: this.compile()
    };
};

// Compiled form: fidPrefix + regex source.
FilterRegex.prototype.compile = function() {
    return this.fidPrefix + this.re.source;
};

// Same compiled form, built from `details.f`.
FilterRegex.compile = function(details) {
    return FilterRegex.fidPrefix + details.f;
};

// Instantiates from compiled form: all that follows the two-character filter
// class id prefix is the regex source.
FilterRegex.load = function(s) {
    return new FilterRegex(s.slice(2));
};

registerFilterClass(FilterRegex);
|
|
|
|
|
|
2014-09-08 23:46:58 +02:00
|
|
|
|
/******************************************************************************/
|
|
|
|
|
|
2017-05-12 16:35:11 +02:00
|
|
|
|
// Origin-based filtering.
//
// FilterOrigin is the common base: it pairs an origin test (`matchOrigin`)
// with a wrapped filter. `logData` and `compile` call `this.toDomainOpt()`,
// which this base does not define; the derived matchers supply it.

var FilterOrigin = function() {
};

// Default wrapped filter: matches everything and contributes nothing to the
// compiled or logged representation.
FilterOrigin.prototype.wrapped = {
    compile: function() {
        return '';
    },
    logData: function() {
        return { compiled: '' };
    },
    match: function() {
        return true;
    }
};

// The base accepts any origin.
FilterOrigin.prototype.matchOrigin = function() {
    return true;
};

// A hit requires both the origin test and the wrapped filter to succeed.
// The wrapped filter is not consulted when the origin test fails.
FilterOrigin.prototype.match = function(url, tokenBeg) {
    var originOk = this.matchOrigin();
    if ( !originOk ) {
        return originOk;
    }
    return this.wrapped.match(url, tokenBeg);
};

// Extends the wrapped filter's log data with this filter's compiled prefix
// and a `domain=` option, appended after any options already present.
FilterOrigin.prototype.logData = function() {
    var details = this.wrapped.logData();
    var domains = this.toDomainOpt();
    details.compiled = this.fidPrefix + domains + '\v' + details.compiled;
    details.opts = details.opts === undefined ?
        'domain=' + domains :
        details.opts + (',domain=' + domains);
    return details;
};

// Compiled layout: fidPrefix, domain option, '\v', wrapped compiled string.
FilterOrigin.prototype.compile = function() {
    var head = this.fidPrefix + this.toDomainOpt();
    return head + '\v' + this.wrapped.compile();
};
|
2014-06-24 00:42:43 +02:00
|
|
|
|
|
2017-05-12 16:35:11 +02:00
|
|
|
|
// *** start of specialized origin matchers
|
2015-03-02 16:41:51 +01:00
|
|
|
|
|
2017-05-12 16:35:11 +02:00
|
|
|
|
// Origin matcher for a single, non-negated hostname: the page hostname must
// be that hostname or one of its subdomains.
var FilterOriginHit = function(domainOpt) {
    FilterOrigin.call(this);
    this.hostname = domainOpt;
};

FilterOriginHit.prototype = Object.create(FilterOrigin.prototype, {
    constructor: {
        value: FilterOriginHit
    },
    // The domain option is the hostname itself.
    toDomainOpt: {
        value: function() {
            return this.hostname;
        }
    },
    matchOrigin: {
        value: function() {
            var wanted = this.hostname,
                pageHn = pageHostnameRegister;
            if ( !pageHn.endsWith(wanted) ) {
                return false;
            }
            // A suffix match only counts when it is the whole hostname or
            // starts right after a label separator.
            var boundary = pageHn.length - wanted.length;
            if ( boundary === 0 ) {
                return true;
            }
            return pageHn.charCodeAt(boundary - 1) === 0x2E /* '.' */;
        }
    }
});
|
2015-03-02 16:41:51 +01:00
|
|
|
|
|
2017-05-12 16:35:11 +02:00
|
|
|
|
//
|
2015-03-02 16:41:51 +01:00
|
|
|
|
|
2017-05-12 16:35:11 +02:00
|
|
|
|
// Origin matcher for a single negated hostname (`~hostname`): the page
// hostname must be neither that hostname nor one of its subdomains.
var FilterOriginMiss = function(domainOpt) {
    FilterOrigin.call(this);
    // Drop the leading '~'; toDomainOpt() puts it back.
    this.hostname = domainOpt.slice(1);
};

FilterOriginMiss.prototype = Object.create(FilterOrigin.prototype, {
    constructor: {
        value: FilterOriginMiss
    },
    toDomainOpt: {
        value: function() {
            return '~' + this.hostname;
        }
    },
    matchOrigin: {
        value: function() {
            var excluded = this.hostname,
                pageHn = pageHostnameRegister;
            if ( !pageHn.endsWith(excluded) ) {
                return true;
            }
            var boundary = pageHn.length - excluded.length;
            // Exact hostname: excluded.
            if ( boundary === 0 ) {
                return false;
            }
            // Suffix preceded by '.': a subdomain, also excluded.
            return pageHn.charCodeAt(boundary - 1) !== 0x2E /* '.' */;
        }
    }
});
|
2015-03-02 16:41:51 +01:00
|
|
|
|
|
2017-05-12 16:35:11 +02:00
|
|
|
|
//
|
|
|
|
|
|
|
|
|
|
// Origin matcher for several '|'-separated hostnames, none negated: the page
// hostname must be, or be a subdomain of, at least one of them.
var FilterOriginHitSet = function(domainOpt) {
    FilterOrigin.call(this);
    this.domainOpt = domainOpt;
};

FilterOriginHitSet.prototype = Object.create(FilterOrigin.prototype, {
    constructor: {
        value: FilterOriginHitSet
    },
    // Regular expression built on first use, see matchOrigin().
    oneOf: {
        value: null,
        writable: true
    },
    toDomainOpt: {
        value: function() {
            return this.domainOpt;
        }
    },
    matchOrigin: {
        value: function() {
            var re = this.oneOf;
            if ( re === null ) {
                // The '|' separators of the option double as the regex
                // alternation; only the dots need escaping.
                var alternatives = this.domainOpt.replace(/\./g, '\\.');
                re = this.oneOf = new RegExp('(?:^|\\.)(?:' + alternatives + ')$');
            }
            return re.test(pageHostnameRegister);
        }
    }
});
|
|
|
|
|
|
|
|
|
|
//
|
2015-03-02 16:41:51 +01:00
|
|
|
|
|
2017-05-12 16:35:11 +02:00
|
|
|
|
// Origin matcher for several '|'-separated hostnames, all negated: the page
// hostname must not be, nor be a subdomain of, any of them.
var FilterOriginMissSet = function(domainOpt) {
    FilterOrigin.call(this);
    this.domainOpt = domainOpt;
};

FilterOriginMissSet.prototype = Object.create(FilterOrigin.prototype, {
    constructor: {
        value: FilterOriginMissSet
    },
    // Regular expression built on first use, see matchOrigin().
    noneOf: {
        value: null,
        writable: true
    },
    toDomainOpt: {
        value: function() {
            return this.domainOpt;
        }
    },
    matchOrigin: {
        value: function() {
            var re = this.noneOf;
            if ( re === null ) {
                // Strip the negation markers, then escape the dots; the '|'
                // separators serve as the regex alternation.
                var alternatives = this.domainOpt
                    .replace(/~/g, '')
                    .replace(/\./g, '\\.');
                re = this.noneOf = new RegExp('(?:^|\\.)(?:' + alternatives + ')$');
            }
            return !re.test(pageHostnameRegister);
        }
    }
});
|
|
|
|
|
|
|
|
|
|
//
|
|
|
|
|
|
|
|
|
|
// Origin matcher for several '|'-separated hostnames where some are negated
// and some are not: the page hostname must match the non-negated set and
// must not match the negated set.
var FilterOriginMixedSet = function(domainOpt) {
    FilterOrigin.call(this);
    this.domainOpt = domainOpt;
};

FilterOriginMixedSet.prototype = Object.create(FilterOrigin.prototype, {
    constructor: {
        value: FilterOriginMixedSet
    },
    // Both regular expressions are built together by init() on first use.
    oneOf: {
        value: null,
        writable: true
    },
    noneOf: {
        value: null,
        writable: true
    },
    init: {
        value: function() {
            var entries = this.domainOpt.split('|'),
                wanted = [],
                excluded = [];
            // Walk from last to first so the alternatives are emitted in the
            // same (reversed) order as before.
            for ( var idx = entries.length - 1; idx >= 0; idx-- ) {
                var entry = entries[idx];
                if ( entry.charCodeAt(0) === 0x7E /* '~' */ ) {
                    excluded.push(entry.slice(1).replace(/\./g, '\\.'));
                } else {
                    wanted.push(entry.replace(/\./g, '\\.'));
                }
            }
            this.oneOf = new RegExp('(?:^|\\.)(?:' + wanted.join('|') + ')$');
            this.noneOf = new RegExp('(?:^|\\.)(?:' + excluded.join('|') + ')$');
        }
    },
    toDomainOpt: {
        value: function() {
            return this.domainOpt;
        }
    },
    matchOrigin: {
        value: function() {
            if ( this.oneOf === null ) {
                this.init();
            }
            var pageHn = pageHostnameRegister;
            if ( !this.oneOf.test(pageHn) ) {
                return false;
            }
            return !this.noneOf.test(pageHn);
        }
    }
});
|
|
|
|
|
|
|
|
|
|
// *** end of specialized origin matchers
|
|
|
|
|
|
|
|
|
|
// The optimal test function is picked according to the content of the
|
|
|
|
|
// `domain=` filter option.
|
|
|
|
|
// Re-factored in light of:
|
|
|
|
|
// - https://gorhill.github.io/obj-vs-set-vs-map/set-vs-regexp.html
|
|
|
|
|
// The re-factoring made it possible to reuse instances of a matcher. As of
|
|
|
|
|
// writing, I observed that just with EasyList, there were ~1,200 reused
|
|
|
|
|
// instances out of ~2,800.
|
2015-03-02 22:22:23 +01:00
|
|
|
|
|
2017-05-12 16:35:11 +02:00
|
|
|
|
/**
 * Picks the origin matcher suited to the shape of a `domain=` option value.
 *
 * @param {string} domainOpt - One hostname, or several separated by '|';
 *     a leading '~' on a hostname negates it.
 * @returns {FilterOrigin} A new instance of the selected matcher class.
 */
FilterOrigin.matcherFactory = function(domainOpt) {
    var Matcher;
    if ( domainOpt.indexOf('|') === -1 ) {
        // One hostname: negated or not.
        Matcher = domainOpt.charCodeAt(0) === 0x7E /* '~' */ ?
            FilterOriginMiss :
            FilterOriginHit;
    } else if ( domainOpt.indexOf('~') === -1 ) {
        // Many hostnames, none negated: must be in the set.
        Matcher = FilterOriginHitSet;
    } else if ( FilterOrigin.reAllNegated.test(domainOpt) ) {
        // Many hostnames, all negated: must not be in the set.
        Matcher = FilterOriginMissSet;
    } else {
        // Must be in one set, but not in the other.
        Matcher = FilterOriginMixedSet;
    }
    return new Matcher(domainOpt);
};

// Matches a '|'-separated list of two or more entries in which every entry
// starts with '~'.
FilterOrigin.reAllNegated = /^~(?:[^|~]+\|~)+[^|~]+$/;
|
|
|
|
|
|
|
|
|
|
/**
 * Static compile step: `fidPrefix` followed by the domain option. Unlike
 * the instance `compile`, nothing is appended for a wrapped filter here.
 *
 * @param {Object} details - Parsed filter; only `details.domainOpt` is read.
 * @returns {string}
 */
FilterOrigin.compile = function(details) {
    var prefix = FilterOrigin.fidPrefix;
    return prefix + details.domainOpt;
};

/**
 * Rebuilds an origin filter from its compiled string. The text between
 * index 2 and the first '\v' is the domain option; the rest is the compiled
 * wrapped filter.
 *
 * @param {string} s - Compiled string.
 * @returns {FilterOrigin} Matcher with its `wrapped` filter attached.
 */
FilterOrigin.load = function(s) {
    var sep = s.indexOf('\v', 2);
    var matcher = FilterOrigin.matcherFactory(s.slice(2, sep));
    matcher.wrapped = filterFromCompiledData(s.slice(sep + 1));
    return matcher;
};

registerFilterClass(FilterOrigin);
|
2015-03-02 22:22:23 +01:00
|
|
|
|
|
2017-05-12 16:35:11 +02:00
|
|
|
|
/******************************************************************************/
|
2015-01-23 17:32:49 +01:00
|
|
|
|
|
2017-05-12 16:35:11 +02:00
|
|
|
|
/**
 * Attaches a typed piece of data (`dataType` / `dataStr`) to a wrapped
 * filter. Matching is delegated entirely to the wrapped filter.
 *
 * @constructor
 * @param {string} dataType
 * @param {string} dataStr
 */
var FilterDataHolder = function(dataType, dataStr) {
    this.dataType = dataType;
    this.dataStr = dataStr;
    // Assigned after construction, see FilterDataHolder.load().
    this.wrapped = undefined;
};

FilterDataHolder.prototype.match = function(url, tokenBeg) {
    var inner = this.wrapped;
    return inner.match(url, tokenBeg);
};

// Extends the wrapped filter's log data: the compiled string gets this
// holder's prefix, and the data option is placed before any options already
// present.
FilterDataHolder.prototype.logData = function() {
    var details = this.wrapped.logData();
    details.compiled =
        this.fidPrefix + this.dataType + '\t' + this.dataStr + '\v' + details.compiled;
    var option = this.dataType;
    if ( this.dataStr !== '' ) {
        option += '=' + this.dataStr;
    }
    details.opts = details.opts === undefined ?
        option :
        option + ',' + details.opts;
    return details;
};

// Compiled layout: fidPrefix, dataType, '\t', dataStr, '\v', wrapped filter.
FilterDataHolder.prototype.compile = function() {
    var head = this.fidPrefix + this.dataType + '\t' + this.dataStr;
    return head + '\v' + this.wrapped.compile();
};

/**
 * Static compile step; nothing is appended for a wrapped filter here.
 *
 * @param {Object} details - Parsed filter; `dataType` and `dataStr` are read.
 * @returns {string}
 */
FilterDataHolder.compile = function(details) {
    var prefix = FilterDataHolder.fidPrefix;
    return prefix + details.dataType + '\t' + details.dataStr;
};

/**
 * @param {string} s - Compiled string in the layout written by `compile`.
 * @returns {FilterDataHolder} Holder with its `wrapped` filter attached.
 */
FilterDataHolder.load = function(s) {
    var tab = s.indexOf('\t', 2);
    var sep = s.indexOf('\v', tab);
    var holder = new FilterDataHolder(s.slice(2, tab), s.slice(tab + 1, sep));
    holder.wrapped = filterFromCompiledData(s.slice(sep + 1));
    return holder;
};

registerFilterClass(FilterDataHolder);
|
2015-01-23 17:32:49 +01:00
|
|
|
|
|
2017-05-12 16:35:11 +02:00
|
|
|
|
// Helper class for storing instances of FilterDataHolder: it keeps the
// category bits and token hash alongside the filter, plus a `next` slot.

var FilterDataHolderEntry = function(categoryBits, tokenHash, fdata) {
    this.categoryBits = categoryBits;
    this.tokenHash = tokenHash;
    // `fdata` is a compiled filter string, instantiated right away.
    this.filter = filterFromCompiledData(fdata);
    this.next = undefined;
};

FilterDataHolderEntry.prototype.logData = function() {
    var bits = this.categoryBits,
        hash = this.tokenHash;
    return toLogDataInternal(bits, hash, this.filter);
};

// Serialized layout: categoryBits, '\t', tokenHash, '\t', compiled filter.
FilterDataHolderEntry.prototype.compile = function() {
    var bits = exportInt(this.categoryBits);
    var hash = exportInt(this.tokenHash);
    return bits + '\t' + hash + '\t' + this.filter.compile();
};

// Inverse of compile(). The whole string is passed to importInt for the
// first field, as before.
FilterDataHolderEntry.load = function(s) {
    var firstTab = s.indexOf('\t');
    var secondTab = s.indexOf('\t', firstTab + 1);
    var categoryBits = importInt(s);
    var tokenHash = importInt(s.slice(firstTab + 1, secondTab));
    return new FilterDataHolderEntry(
        categoryBits,
        tokenHash,
        s.slice(secondTab + 1)
    );
};
|
|
|
|
|
|
2014-09-08 23:46:58 +02:00
|
|
|
|
/******************************************************************************/
|
|
|
|
|
|
2015-02-05 00:06:31 +01:00
|
|
|
|
// Dictionary of hostnames.
//
// A single filter instance standing for a whole set of hostnames. A request
// matches when its hostname, or any parent domain of it, is in the set.

var FilterHostnameDict = function() {
    this.h = ''; // short-lived register: hostname found by the last match()
    this.dict = new Set();
};

// Number of hostnames held.
Object.defineProperty(FilterHostnameDict.prototype, 'size', {
    get: function() {
        return this.dict.size;
    }
});

// Returns true if `hn` was added, false if it was already present.
FilterHostnameDict.prototype.add = function(hn) {
    var known = this.dict;
    if ( known.has(hn) ) {
        return false;
    }
    known.add(hn);
    return true;
};

// Returns whether `hn` was present.
FilterHostnameDict.prototype.remove = function(hn) {
    return this.dict.delete(hn);
};

// Looks up the request hostname, then each of its parent domains in turn.
// Returns `this` on a hit (with the hit stored in `this.h`), false otherwise.
FilterHostnameDict.prototype.match = function() {
    // TODO: mind IP addresses
    var candidate = requestHostnameRegister;
    for (;;) {
        if ( this.dict.has(candidate) ) {
            this.h = candidate;
            return this;
        }
        var dot = candidate.indexOf('.');
        if ( dot === -1 ) {
            this.h = '';
            return false;
        }
        // Drop the leftmost label and retry.
        candidate = candidate.slice(dot + 1);
    }
};

// Describes the hostname currently held in `this.h`.
FilterHostnameDict.prototype.logData = function() {
    var hn = this.h;
    return {
        raw: '||' + hn + '^',
        regex: rawToRegexStr(hn) + '(?:[^%.0-9a-z_-]|$)',
        compiled: hn
    };
};

// Compiled layout: fidPrefix followed by the hostnames as a JSON array.
FilterHostnameDict.prototype.compile = function() {
    var hostnames = µb.setToArray(this.dict);
    return this.fidPrefix + JSON.stringify(hostnames);
};

FilterHostnameDict.load = function(s) {
    var instance = new FilterHostnameDict();
    var hostnames = JSON.parse(s.slice(2));
    instance.dict = µb.setFromArray(hostnames);
    return instance;
};

registerFilterClass(FilterHostnameDict);
|
|
|
|
|
|
2015-02-05 00:06:31 +01:00
|
|
|
|
/******************************************************************************/
|
|
|
|
|
|
2014-09-22 02:26:16 +02:00
|
|
|
|
// Some buckets can grow quite large, and finding a hit in these buckets
|
|
|
|
|
// may end up being expensive. After considering various solutions, the one
|
2014-10-17 21:44:19 +02:00
|
|
|
|
// retained is to promote hit filters to a smaller index, so that next time
|
2014-09-22 02:26:16 +02:00
|
|
|
|
// they can be looked-up faster.
|
2014-09-19 16:59:44 +02:00
|
|
|
|
|
2014-09-21 20:03:41 +02:00
|
|
|
|
// key= 10000 ad count=660
|
|
|
|
|
// key= 10000 ads count=433
|
|
|
|
|
// key= 10001 google count=277
|
|
|
|
|
// key=1000000 2mdn count=267
|
|
|
|
|
// key= 10000 social count=240
|
|
|
|
|
// key= 10001 pagead2 count=166
|
|
|
|
|
// key= 10000 twitter count=122
|
|
|
|
|
// key= 10000 doubleclick count=118
|
|
|
|
|
// key= 10000 facebook count=114
|
|
|
|
|
// key= 10000 share count=113
|
|
|
|
|
// key= 10000 google count=106
|
|
|
|
|
// key= 10001 code count=103
|
|
|
|
|
// key= 11000 doubleclick count=100
|
|
|
|
|
// key=1010001 g count=100
|
|
|
|
|
// key= 10001 js count= 89
|
|
|
|
|
// key= 10000 adv count= 88
|
|
|
|
|
// key= 10000 youtube count= 61
|
|
|
|
|
// key= 10000 plugins count= 60
|
|
|
|
|
// key= 10001 partner count= 59
|
|
|
|
|
// key= 10000 ico count= 57
|
|
|
|
|
// key= 110001 ssl count= 57
|
|
|
|
|
// key= 10000 banner count= 53
|
|
|
|
|
// key= 10000 footer count= 51
|
|
|
|
|
// key= 10000 rss count= 51
|
2014-09-19 16:59:44 +02:00
|
|
|
|
|
2014-09-22 02:26:16 +02:00
|
|
|
|
/******************************************************************************/
|
|
|
|
|
|
2014-09-08 23:46:58 +02:00
|
|
|
|
/**
 * Ordered collection of filters which are tried one after the other.
 *
 * @constructor
 * @param {Object} [a] - First filter to store.
 * @param {Object} [b] - Second filter to store; ignored when `a` is
 *     undefined.
 */
var FilterBucket = function(a, b) {
    this.promoted = 0;   // number of promotions performed so far
    this.vip = 16;       // hits at an index below this are never promoted
    this.f = null;       // short-lived register: filter found by match()
    this.filters = [];
    if ( a === undefined ) {
        return;
    }
    this.filters[0] = a;
    if ( b !== undefined ) {
        this.filters[1] = b;
    }
};

FilterBucket.prototype.add = function(a) {
    this.filters.push(a);
};

// Removes every filter whose compiled form equals `fdata`.
FilterBucket.prototype.remove = function(fdata) {
    var list = this.filters;
    // Backward walk, so that splicing does not disturb pending indices.
    for ( var idx = list.length - 1; idx >= 0; idx-- ) {
        if ( list[idx].compile() === fdata ) {
            list.splice(idx, 1);
        }
    }
};

// Promote hit filters so they can be found faster next time: the filter at
// index `i` is swapped with one located in a lower region of the array.
FilterBucket.prototype.promote = function(i) {
    var list = this.filters;
    var limit = list.length >>> 1;
    // Halve the target region until it lies at or below `i`, or until it
    // drops under the VIP threshold.
    while ( i < limit ) {
        limit >>>= 1;
        if ( limit < this.vip ) {
            break;
        }
    }
    if ( i <= limit ) { return; }
    // Rotate through the slots of the target region.
    var slot = this.promoted % limit;
    //console.debug('FilterBucket.promote(): promoted %d to %d', i, slot);
    var hit = list[i];
    list[i] = list[slot];
    list[slot] = hit;
    this.promoted += 1;
};

// Returns true on the first filter which matches; that filter is kept in
// `this.f`, and promoted when found at or beyond the VIP threshold.
FilterBucket.prototype.match = function(url, tokenBeg) {
    var list = this.filters;
    for ( var idx = 0, count = list.length; idx < count; idx++ ) {
        var candidate = list[idx];
        if ( !candidate.match(url, tokenBeg) ) {
            continue;
        }
        this.f = candidate;
        if ( idx >= this.vip ) {
            this.promote(idx);
        }
        return true;
    }
    return false;
};

// Log data comes from the filter found by the last successful match().
FilterBucket.prototype.logData = function() {
    var hit = this.f;
    return hit.logData();
};

// Compiled layout: fidPrefix followed by a JSON array of the compiled form
// of each filter, in their current order.
FilterBucket.prototype.compile = function() {
    var list = this.filters,
        parts = [];
    for ( var idx = 0, count = list.length; idx < count; idx++ ) {
        parts.push(list[idx].compile());
    }
    return this.fidPrefix + JSON.stringify(parts);
};

FilterBucket.load = function(s) {
    var bucket = new FilterBucket();
    var parts = JSON.parse(s.slice(2));
    for ( var idx = 0, count = parts.length; idx < count; idx++ ) {
        bucket.filters[idx] = filterFromCompiledData(parts[idx]);
    }
    return bucket;
};

registerFilterClass(FilterBucket);
|
|
|
|
|
|
|
|
|
|
/******************************************************************************/
|
|
|
|
|
/******************************************************************************/
|
|
|
|
|
|
|
|
|
|
/**
 * Instantiates a filter from its compiled string. The class id is parsed,
 * base 36, from the start of the string and looked up in `filterClasses`;
 * the class's `load` then receives the whole string.
 *
 * The most recently loaded string/instance pair is remembered, so that
 * loading the same compiled string twice in a row yields the same instance.
 *
 * @param {string} compiled
 * @returns {Object} The filter instance.
 */
var filterFromCompiledData = function(compiled) {
    if ( compiled !== lastLoadedFilterString ) {
        var classId = parseInt(compiled, 36);
        var instance = filterClasses.get(classId).load(compiled);
        //filterClassHistogram.set(fid, (filterClassHistogram.get(fid) || 0) + 1);
        // Updated only once load() has returned: load() may itself call
        // back into this function for a wrapped filter.
        lastLoadedFilterString = compiled;
        lastLoadedFilter = instance;
    }
    return lastLoadedFilter;
};

// One-entry cache used by filterFromCompiledData().
var lastLoadedFilterString,
    lastLoadedFilter;
|
|
|
|
|
//var filterClassHistogram = new Map();
|
|
|
|
|
|
2014-09-08 23:46:58 +02:00
|
|
|
|
/******************************************************************************/
|
2014-06-24 00:42:43 +02:00
|
|
|
|
/******************************************************************************/
|
|
|
|
|
|
|
|
|
|
/**
 * Parser state for a single static network filter. The constructor sets up
 * what stays constant across filters (platform capability flag, regular
 * expressions, the hash of the '*' token), then calls reset() to initialize
 * the per-filter fields.
 *
 * @constructor
 */
var FilterParser = function() {
    this.cantWebsocket = vAPI.cantWebsocket;

    // Characters which cause a `domain=` option value to be rejected.
    this.reBadDomainOptChars = /[*+?^${}()[\]\\]/;

    // Hostname-shaped patterns.
    this.reHostnameRule1 = /^[0-9a-z][0-9a-z.-]*[0-9a-z]$/i;
    this.reHostnameRule2 = /^\**[0-9a-z][0-9a-z.-]*[0-9a-z]\^?$/i;
    this.reCleanupHostnameRule2 = /^\**|\^$/g;

    // Pattern classification helpers.
    this.reHasWildcard = /[\^\*]/;
    this.reCanTrimCarets1 = /^[^*]*$/;
    this.reCanTrimCarets2 = /^\^?[^^]+[^^][^^]+\^?$/;
    this.reHasUppercase = /[A-Z]/;
    this.reIsolateHostname = /^(\*?\.)?([^\x00-\x24\x26-\x2C\x2F\x3A-\x5E\x60\x7B-\x7F]+)(.*)/;
    this.reHasUnicode = /[^\x00-\x7F]/;
    this.reWebsocketAny = /^ws[s*]?(?::\/?\/?)?\*?$/;

    // Detects a `report-to` / `report-uri` directive at the start of the
    // tested string or right after a ';'.
    this.reBadCSP = /(?:^|;)\s*report-(?:to|uri)\b/;

    this.domainOpt = '';
    // Must be set before reset(), which copies it into `tokenHash`.
    this.noTokenHash = µb.urlTokenizer.tokenHashFromString('*');
    this.reset();
};
|
|
|
|
|
|
|
|
|
|
/******************************************************************************/
|
|
|
|
|
|
2016-11-06 16:49:02 +01:00
|
|
|
|
// Maps the type names accepted as filter options to the internal type names
// handed to bitFromType(). Several option names share one internal type.
//
// https://github.com/gorhill/uBlock/issues/1493
//   Transpose `ping` into `other` for now.

FilterParser.prototype.toNormalizedType = {
    'beacon': 'other',
    'data': 'data',
    'document': 'main_frame',
    'elemhide': 'generichide',
    'font': 'font',
    'generichide': 'generichide',
    'image': 'image',
    'inline-script': 'inline-script',
    'media': 'media',
    'object': 'object',
    'other': 'other',
    'object-subrequest': 'object',
    'ping': 'other',
    'popunder': 'popunder',
    'popup': 'popup',
    'script': 'script',
    'stylesheet': 'stylesheet',
    'subdocument': 'sub_frame',
    'xmlhttprequest': 'xmlhttprequest',
    'websocket': 'websocket'
};
|
|
|
|
|
|
|
|
|
|
/******************************************************************************/
|
|
|
|
|
|
|
|
|
|
/**
 * Restores every per-filter field to its initial value so that the parser
 * can be reused for another filter.
 *
 * @returns {FilterParser} `this`, to allow chaining.
 */
FilterParser.prototype.reset = function() {
    // Action and anchoring.
    this.action = BlockAction;
    this.anchor = 0;
    this.badFilter = false;

    // Data attached through options such as `csp=`.
    this.dataType = undefined;
    this.dataStr = undefined;

    this.elemHiding = false;
    this.f = '';

    // Party flags, and the party value derived from them.
    this.firstParty = false;
    this.thirdParty = false;
    this.party = AnyParty;

    // Options, as received and as parsed.
    this.fopts = '';
    this.hostnamePure = false;
    this.domainOpt = '';
    this.isRegex = false;
    this.raw = '';
    this.redirect = false;

    // Token: '*' stands for "no token".
    this.token = '*';
    this.tokenHash = this.noTokenHash;
    this.tokenBeg = 0;

    // Type bits, importance, validity.
    this.types = 0;
    this.important = 0;
    this.unsupported = false;

    return this;
};
|
|
|
|
|
|
|
|
|
|
/******************************************************************************/
|
|
|
|
|
|
2016-08-31 01:57:25 +02:00
|
|
|
|
/**
 * Converts an internal type name into a single-bit mask: the value found in
 * `typeNameToTypeValue` is shifted right by 4, and the result minus one is
 * used as the bit position.
 *
 * @param {string} type - Internal type name, a key of `typeNameToTypeValue`.
 * @returns {number} Mask with exactly one bit set.
 */
FilterParser.prototype.bitFromType = function(type) {
    var typeValue = typeNameToTypeValue[type];
    var bitIndex = (typeValue >>> 4) - 1;
    return 1 << bitIndex;
};
|
|
|
|
|
|
|
|
|
|
/******************************************************************************/
|
|
|
|
|
|
2015-04-07 03:26:05 +02:00
|
|
|
|
// https://github.com/chrisaljoudi/uBlock/issues/589
// Be ready to handle multiple negated types

/**
 * Applies one type option to the `types` bit field.
 *
 * @param {string} raw - Option name, a key of `toNormalizedType`.
 * @param {boolean} not - Whether the option was negated with '~'.
 */
FilterParser.prototype.parseTypeOption = function(raw, not) {
    var bit = this.bitFromType(this.toNormalizedType[raw]);

    if ( not ) {
        // Non-discrete network types can't be negated.
        if ( (bit & allNetRequestTypesBitmap) === 0 ) {
            return;
        }
        // First negated type seen: start from "all network request types",
        // then carve out the negated one. Later negations just carve more.
        if ( (this.types & allNetRequestTypesBitmap) === 0 ) {
            this.types |= allNetRequestTypesBitmap;
        }
        this.types &= ~bit;
        return;
    }

    this.types |= bit;
};
|
|
|
|
|
|
|
|
|
|
/******************************************************************************/
|
|
|
|
|
|
2017-01-09 15:53:57 +01:00
|
|
|
|
/**
 * Records a `first-party` / `third-party` option. Once both parties have
 * been requested, the filter applies to any party.
 *
 * @param {boolean} firstParty - true for `first-party`, false for
 *     `third-party`.
 * @param {boolean} not - Whether the option was negated with '~'.
 */
FilterParser.prototype.parsePartyOption = function(firstParty, not) {
    // `~third-party` means first-party, and `~first-party` third-party.
    var wantsFirstParty = firstParty ? !not : not;
    if ( wantsFirstParty ) {
        this.firstParty = true;
        this.party = this.thirdParty ? AnyParty : FirstParty;
        return;
    }
    this.thirdParty = true;
    this.party = this.firstParty ? AnyParty : ThirdParty;
};
|
|
|
|
|
|
|
|
|
|
/******************************************************************************/
|
|
|
|
|
|
2017-01-09 15:53:57 +01:00
|
|
|
|
/**
 * Normalizes the value of a `domain=` option: hostnames with non-ASCII
 * characters are converted with punycode, and a value containing any
 * character from `reBadDomainOptChars` is rejected.
 *
 * @param {string} s - '|'-separated list of hostnames.
 * @returns {string} The normalized value, or '' when it is rejected.
 */
FilterParser.prototype.parseDomainOption = function(s) {
    var reUnicode = this.reHasUnicode;
    if ( reUnicode.test(s) ) {
        var parts = s.split('|');
        // Only the entries which need it are converted.
        for ( var idx = parts.length - 1; idx >= 0; idx-- ) {
            if ( reUnicode.test(parts[idx]) ) {
                parts[idx] = punycode.toASCII(parts[idx]);
            }
        }
        s = parts.join('|');
    }
    return this.reBadDomainOptChars.test(s) ? '' : s;
};
|
|
|
|
|
|
|
|
|
|
/******************************************************************************/
|
|
|
|
|
|
2015-01-23 17:32:49 +01:00
|
|
|
|
/**
 * Parses the comma-separated option list of a filter (the part after '$')
 * and records the outcome on the parser. Parsing stops at the first option
 * which makes the filter unusable; `this.unsupported` is then set to true.
 *
 * @param {string} s - Raw option list, e.g. `third-party,domain=a.com`.
 */
FilterParser.prototype.parseOptions = function(s) {
    this.fopts = s;
    var opts = s.split(',');
    var opt, not, cspValue;
    for ( var i = 0; i < opts.length; i++ ) {
        opt = opts[i];
        not = opt.startsWith('~');
        if ( not ) {
            opt = opt.slice(1);
        }
        if ( opt === 'third-party' ) {
            this.parsePartyOption(false, not);
            continue;
        }
        // https://issues.adblockplus.org/ticket/616
        // `generichide` concept already supported, just a matter of
        // adding support for the new keyword.
        if ( opt === 'elemhide' || opt === 'generichide' ) {
            if ( not === false ) {
                this.parseTypeOption('generichide', false);
                continue;
            }
            this.unsupported = true;
            break;
        }
        // `document` is accepted for block filters only.
        if ( opt === 'document' ) {
            if ( this.action === BlockAction ) {
                this.parseTypeOption('document', not);
                continue;
            }
            this.unsupported = true;
            break;
        }
        if ( this.toNormalizedType.hasOwnProperty(opt) ) {
            this.parseTypeOption(opt, not);
            // Due to ABP categorizing `websocket` requests as `other`, we need
            // to add `websocket` for when `other` is used.
            if ( opt === 'other' ) {
                this.parseTypeOption('websocket', not);
            }
            continue;
        }
        // https://github.com/gorhill/uBlock/issues/2294
        // Detect and discard filter if domain option contains nonsensical
        // characters.
        if ( opt.startsWith('domain=') ) {
            this.domainOpt = this.parseDomainOption(opt.slice(7));
            if ( this.domainOpt === '' ) {
                this.unsupported = true;
                break;
            }
            continue;
        }
        if ( opt === 'important' ) {
            this.important = Important;
            continue;
        }
        if ( opt === 'first-party' ) {
            this.parsePartyOption(true, not);
            continue;
        }
        // `redirect=` is accepted for block filters only.
        if ( opt.startsWith('redirect=') ) {
            if ( this.action === BlockAction ) {
                this.redirect = true;
                continue;
            }
            this.unsupported = true;
            break;
        }
        if ( opt.startsWith('csp=') ) {
            // The reporting-directive check must see the policy itself, not
            // the whole option: with the `csp=` prefix still attached, the
            // start-of-string alternative of `reBadCSP` can never match, and
            // a policy whose first directive is `report-uri`/`report-to`
            // would go undetected.
            cspValue = opt.slice(4);
            if ( cspValue.length !== 0 && this.reBadCSP.test(cspValue) === false ) {
                this.parseTypeOption('data', not);
                this.dataType = 'csp';
                this.dataStr = cspValue.trim();
            }
            continue;
        }
        // A bare `csp` is meaningful for exception filters only.
        if ( opt === 'csp' && this.action === AllowAction ) {
            this.parseTypeOption('data', not);
            this.dataType = 'csp';
            this.dataStr = '';
            continue;
        }
        // Used by Adguard, purpose is unclear -- just ignore for now.
        if ( opt === 'empty' ) {
            continue;
        }
        // https://github.com/uBlockOrigin/uAssets/issues/192
        if ( opt === 'badfilter' ) {
            this.badFilter = true;
            continue;
        }
        // Unrecognized filter option: ignore whole filter.
        this.unsupported = true;
        break;
    }
};
|
|
|
|
|
|
|
|
|
|
/******************************************************************************/
|
|
|
|
|
|
2017-05-12 16:35:11 +02:00
|
|
|
|
// https://github.com/gorhill/uBlock/issues/1943#issuecomment-243188946
|
|
|
|
|
// Convert websocket-related filter where possible to a format which
|
|
|
|
|
// can be handled using CSP injection.
|
|
|
|
|
|
|
|
|
|
FilterParser.prototype.translate = function() {
    // Rewrite, in place, a handful of broad filters into catch-all `csp`
    // data filters. When a case applies, the parser ends up with:
    //   f = '*', types = the `data` type bit, dataType = 'csp',
    //   dataStr = the CSP directive(s) to inject.
    // When no case applies the parser is left untouched. Returns nothing.
    var dataTypeBit = this.bitFromType('data'),
        policy, otherScheme, scriptSrc, frameSrc;

    if ( this.cantWebsocket && this.reWebsocketAny.test(this.f) ) {
        policy = 'connect-src https: http:';
        // https://bugs.chromium.org/p/chromium/issues/detail?id=669086
        // TODO: remove when most users are beyond Chromium v56
        if ( vAPI.chromiumVersion < 57 ) {
            policy += '; frame-src *';
        }
    } else {
        // Broad |data:- and |blob:-based filters: the generated policy
        // lists every source except the scheme targeted by the filter,
        // hence a `data:` filter still lists `blob:` and vice versa.
        if ( this.f === 'data:' ) {
            otherScheme = 'blob:';
        } else if ( this.f === 'blob:' ) {
            otherScheme = 'data:';
        } else {
            return;
        }
        scriptSrc = "script-src 'self' * " + otherScheme +
                    " 'unsafe-inline' 'unsafe-eval'";
        frameSrc = "frame-src 'self' * " + otherScheme;
        switch ( this.types ) {
        case 0:
            policy = "default-src 'self' * " + otherScheme +
                     " 'unsafe-inline' 'unsafe-eval'";
            break;
        case this.bitFromType('script'):
            policy = scriptSrc;
            break;
        case this.bitFromType('sub_frame'):
            policy = frameSrc;
            break;
        case this.bitFromType('script') | this.bitFromType('sub_frame'):
            policy = frameSrc + '; ' + scriptSrc + ';';
            break;
        default:
            // Any other combination of types is not translated.
            return;
        }
    }

    this.f = '*';
    this.types = dataTypeBit;
    this.dataType = 'csp';
    this.dataStr = policy;
};
|
|
|
|
|
|
|
|
|
|
/*******************************************************************************
|
|
|
|
|
|
|
|
|
|
anchor: bit vector
|
|
|
|
|
0000 (0x0): no anchoring
|
|
|
|
|
0001 (0x1): anchored to the end of the URL.
|
|
|
|
|
0010 (0x2): anchored to the start of the URL.
|
|
|
|
|
0011 (0x3): anchored to the start and end of the URL.
|
|
|
|
|
0100 (0x4): anchored to the hostname of the URL.
|
|
|
|
|
0101 (0x5): anchored to the hostname and end of the URL.
|
|
|
|
|
|
|
|
|
|
**/
|
|
|
|
|
|
2015-02-27 00:08:42 +01:00
|
|
|
|
FilterParser.prototype.parse = function(raw) {
    // Parse one raw static network filter into this parser instance.
    // The parser is reset first, so results of a previous call are lost.
    // Always returns `this`; callers are expected to inspect the flags
    // (`elemHiding`, `unsupported`, `hostnamePure`, `isRegex`, ...) and
    // `f`, the normalized pattern.

    // important!
    this.reset();

    var s = this.raw = raw;

    // plain hostname? (from HOSTS file)
    if ( this.reHostnameRule1.test(s) ) {
        this.f = s;
        this.hostnamePure = true;
        this.anchor |= 0x4;
        return this;
    }

    // element hiding filter?
    var pos = s.indexOf('#');
    if ( pos !== -1 ) {
        var c = s.charAt(pos + 1);
        if ( c === '#' || c === '@' ) {
            console.error('static-net-filtering.js > unexpected cosmetic filters');
            this.elemHiding = true;
            return this;
        }
    }

    // block or allow filter?
    // Important: this must be executed before parsing options
    if ( s.startsWith('@@') ) {
        this.action = AllowAction;
        s = s.slice(2);
    }

    // options
    // https://github.com/gorhill/uBlock/issues/842
    // - ensure we are not dealing with a regex-based filter.
    // - lookup the last occurrence of `$`.
    if ( s.startsWith('/') === false || s.endsWith('/') === false ) {
        pos = s.lastIndexOf('$');
        if ( pos !== -1 ) {
            // https://github.com/gorhill/uBlock/issues/952
            // Discard Adguard-specific `$$` filters.
            if ( s.indexOf('$$') !== -1 ) {
                this.unsupported = true;
                return this;
            }
            this.parseOptions(s.slice(pos + 1));
            s = s.slice(0, pos);
        }
    }

    // regex?
    if ( s.startsWith('/') && s.endsWith('/') && s.length > 2 ) {
        this.isRegex = true;
        this.f = s.slice(1, -1);
        // https://github.com/gorhill/uBlock/issues/1246
        // If the filter is valid, use the corrected version of the source
        // string -- this ensure reverse-lookup will work fine.
        this.f = normalizeRegexSource(this.f);
        if ( this.f === '' ) {
            console.error(
                "uBlock Origin> discarding bad regular expression-based network filter '%s': '%s'",
                raw,
                normalizeRegexSource.message
            );
            this.unsupported = true;
        }
        return this;
    }

    // hostname-anchored
    if ( s.startsWith('||') ) {
        this.anchor |= 0x4;
        s = s.slice(2);

        // convert hostname to punycode if needed
        // https://github.com/gorhill/uBlock/issues/2599
        if ( this.reHasUnicode.test(s) ) {
            var matches = this.reIsolateHostname.exec(s);
            if ( matches ) {
                s = (matches[1] !== undefined ? matches[1] : '') +
                    punycode.toASCII(matches[2]) +
                    matches[3];
            }
        }

        // https://github.com/chrisaljoudi/uBlock/issues/1096
        if ( s.startsWith('^') ) {
            this.unsupported = true;
            return this;
        }

        // plain hostname? (from ABP filter list)
        // https://github.com/gorhill/uBlock/issues/1757
        // A filter can't be a pure-hostname one if there is a domain or csp
        // option present.
        if ( this.reHostnameRule2.test(s) ) {
            this.f = s.replace(this.reCleanupHostnameRule2, '');
            this.hostnamePure = true;
            return this;
        }
    }
    // left-anchored
    else if ( s.startsWith('|') ) {
        this.anchor |= 0x2;
        s = s.slice(1);
    }

    // right-anchored
    if ( s.endsWith('|') ) {
        this.anchor |= 0x1;
        s = s.slice(0, -1);
    }

    // normalize placeholders
    if ( this.reHasWildcard.test(s) ) {
        // remove pointless leading *
        // https://github.com/gorhill/uBlock/issues/1669#issuecomment-224822448
        // Keep the leading asterisk if we are dealing with a hostname-anchored
        // filter, this will ensure the generic filter implementation is
        // used. Hence the leading asterisk is stripped only when the
        // hostname-anchor bit (0x4) is NOT set.
        if ( s.startsWith('*') && (this.anchor & 0x4) === 0 ) {
            s = s.replace(/^\*+([^%0-9a-z])/, '$1');
        }
        // remove pointless trailing *
        if ( s.endsWith('*') ) {
            s = s.replace(/([^%0-9a-z])\*+$/, '$1');
        }
    }

    // nothing left?
    if ( s === '' ) {
        s = '*';
    }

    // https://github.com/gorhill/uBlock/issues/1047
    // Hostname-anchored makes no sense if matching all requests.
    if ( s === '*' ) {
        this.anchor = 0;
    }

    // This might look weird but we gain memory footprint by not going through
    // toLowerCase(), at least on Chromium. Because copy-on-write?
    this.f = this.reHasUppercase.test(s) ? s.toLowerCase() : s;

    // Convenience:
    //   Convert special broad filters for non-webRequest aware types into
    //   `csp` filters wherever possible.
    // Only left-anchored filters with no party option are candidates.
    if ( (this.anchor & 0x2) !== 0 && this.party === 0 ) {
        this.translate();
    }

    return this;
};
|
|
|
|
|
|
|
|
|
|
/******************************************************************************/
|
|
|
|
|
|
2015-03-02 16:41:51 +01:00
|
|
|
|
// Given a string, find a good token. Tokens which are too generic, i.e. very
|
|
|
|
|
// common with a high probability of ending up as a miss, are not
|
|
|
|
|
// good. Avoid if possible. This has a *significant* positive impact on
|
|
|
|
|
// performance.
|
|
|
|
|
// These "bad tokens" are collated manually.
|
|
|
|
|
|
2015-12-04 03:24:37 +01:00
|
|
|
|
// Hostname-anchored with no wildcard always have a token index of 0.
|
2017-05-12 16:35:11 +02:00
|
|
|
|
// Matches the run of lowercase alphanumerics at the very start of a string.
var reHostnameToken = /^[0-9a-z]+/;

// Matches candidate tokens: runs of two or more `%`, digits or lowercase
// letters. Global flag: users must reset `lastIndex` before scanning a new
// string.
var reGoodToken = /[%0-9a-z]{2,}/g;

// Tokens deemed too generic to be useful, used only as a last resort.
var badTokens = new Set([
    'com',
    'http',
    'https',
    'icon',
    'images',
    'img',
    'js',
    'net',
    'news',
    'www'
]);
|
2015-03-02 16:41:51 +01:00
|
|
|
|
|
|
|
|
|
var findFirstGoodToken = function(s) {
    // Scan `s` for the first token which is neither adjacent to a wildcard
    // nor listed in `badTokens`. Returns the `RegExp.exec` match array
    // (token at [0], position in `.index`). If only bad tokens qualify, the
    // first of them is returned; if nothing qualifies, returns null.
    var fallback = null,
        match, start;
    // `reGoodToken` is global, hence stateful: always restart from 0.
    reGoodToken.lastIndex = 0;
    for (;;) {
        match = reGoodToken.exec(s);
        if ( match === null ) { break; }
        start = match.index;
        // https://github.com/gorhill/uBlock/issues/997
        // Ignore token if preceded by wildcard.
        if ( start !== 0 && s.charCodeAt(start - 1) === 0x2A /* '*' */ ) {
            continue;
        }
        // Ignore token if followed by wildcard.
        if ( s.charCodeAt(reGoodToken.lastIndex) === 0x2A /* '*' */ ) {
            continue;
        }
        if ( badTokens.has(match[0]) === false ) {
            return match;
        }
        // Remember only the first bad token, as a last resort.
        if ( fallback === null ) {
            fallback = match;
        }
    }
    return fallback;
};
|
|
|
|
|
|
|
|
|
|
var findHostnameToken = function(s) {
    // Returns the `RegExp.exec` match for the leading alphanumeric run of
    // `s` (its `.index` is thus always 0), or null if `s` does not start
    // with such a character.
    return reHostnameToken.exec(s);
};
|
|
|
|
|
|
2015-03-02 22:22:23 +01:00
|
|
|
|
/******************************************************************************/
|
|
|
|
|
|
2015-01-23 17:32:49 +01:00
|
|
|
|
FilterParser.prototype.makeToken = function() {
    // Pick the token for the current pattern `this.f` and store it in
    // `token`, `tokenHash` and `tokenBeg`. These fields are left untouched
    // when the filter is a regex, matches everything, or no token is found.

    // https://github.com/chrisaljoudi/uBlock/issues/1038
    // Single asterisk will match any URL.
    if ( this.isRegex || this.f === '*' ) {
        return;
    }

    // A hostname-anchored pattern without wildcard takes its token from
    // the very start of the pattern.
    var useHostnameToken = (this.anchor & 0x4) !== 0 &&
                           this.f.indexOf('*') === -1;
    var matches = useHostnameToken ?
        findHostnameToken(this.f) :
        findFirstGoodToken(this.f);
    if ( matches === null ) {
        return;
    }

    this.token = matches[0];
    this.tokenHash = µb.urlTokenizer.tokenHashFromString(this.token);
    this.tokenBeg = matches.index;
};
|
|
|
|
|
|
|
|
|
|
/******************************************************************************/
|
|
|
|
|
/******************************************************************************/
|
|
|
|
|
|
|
|
|
|
var FilterContainer = function() {
    // Container for compiled static network filters.
    // A pattern containing `^` or `*` is deemed generic.
    this.reIsGeneric = /[\^\*]/;
    this.filterParser = new FilterParser();
    this.urlTokenizer = µb.urlTokenizer;
    // Token hashes of the two special tokens: `*` and `.`. The `.` hash is
    // also kept in exported form since it is written into every compiled
    // hostname-only filter.
    this.noTokenHash = this.urlTokenizer.tokenHashFromString('*');
    this.dotTokenHash = this.urlTokenizer.tokenHashFromString('.');
    this.exportedDotTokenHash = exportInt(this.dotTokenHash);
    this.reset();
};
|
|
|
|
|
|
|
|
|
|
/******************************************************************************/
|
|
|
|
|
|
|
|
|
|
// Reset all, thus reducing to a minimum memory footprint of the context.
|
|
|
|
|
|
|
|
|
|
FilterContainer.prototype.reset = function() {
    // Bring the container back to its empty, unfrozen state.

    // Status and statistics
    this.frozen = false;
    this.processedFilterCount = 0;
    this.acceptedCount = 0;
    this.rejectedCount = 0;
    this.allowFilterCount = 0;
    this.blockFilterCount = 0;
    this.discardedCount = 0;

    // Fresh, empty collections
    this.badFilters = new Set();
    this.duplicateBuster = new Set();
    this.categories = new Map();
    this.dataFilters = new Map();

    this.filterParser.reset();

    // Reuse filter instances whenever possible at load time.
    this.fclassLast = null;
    this.fdataLast = null;
    this.filterLast = null;

    // Runtime registers
    this.cbRegister = undefined;
    this.thRegister = undefined;
    this.fRegister = null;
};
|
2014-06-24 00:42:43 +02:00
|
|
|
|
|
2014-07-20 21:00:26 +02:00
|
|
|
|
/******************************************************************************/
|
2014-06-24 00:42:43 +02:00
|
|
|
|
|
2014-07-20 21:00:26 +02:00
|
|
|
|
FilterContainer.prototype.freeze = function() {
    // Called once all filters have been loaded: drop the filters flagged
    // as bad, release the load-time helpers, and mark the container as
    // frozen.
    histogram('allFilters', this.categories);
    this.removeBadFilters();
    // Load-time only data: no longer needed from this point on.
    this.duplicateBuster = new Set();
    this.filterParser.reset();
    this.fclassLast = null;
    this.fdataLast = null;
    this.filterLast = null;
    this.frozen = true;
};
|
|
|
|
|
|
|
|
|
|
/******************************************************************************/
|
|
|
|
|
|
2014-09-08 23:46:58 +02:00
|
|
|
|
FilterContainer.prototype.toSelfie = function() {
    // Serialize the container into a plain object ("selfie"):
    // - the counters are copied as is;
    // - `categories` becomes one newline-separated string made of
    //   `k1\t<category bits>` lines, each followed by, for every filter in
    //   that category, a `k2\t<token hash>` line then the compiled filter;
    // - `dataFilters` becomes a flat array of compiled entries, bucket by
    //   bucket, each bucket's chain in head-to-tail order.

    // One category: token hash => filter.
    var categoryToSelfie = function(category) {
        var lines = [];
        category.forEach(function(filter, tokenHash) {
            lines.push('k2\t' + exportInt(tokenHash)); // token hash
            lines.push(filter.compile());
        });
        return lines.join('\n');
    };

    // All categories: category bits => category.
    var categoriesToSelfie = function(categories) {
        var lines = [];
        categories.forEach(function(category, categoryBits) {
            lines.push('k1\t' + exportInt(categoryBits)); // category bits
            lines.push(categoryToSelfie(category));
        });
        return lines.join('\n');
    };

    // Each bucket is a singly-linked chain of entries, linked through
    // `next`, the last entry having `next === undefined`.
    var dataFiltersToSelfie = function(dataFilters) {
        var compiled = [];
        dataFilters.forEach(function(entry) {
            do {
                compiled.push(entry.compile());
                entry = entry.next;
            } while ( entry !== undefined );
        });
        return compiled;
    };

    return {
        processedFilterCount: this.processedFilterCount,
        acceptedCount: this.acceptedCount,
        rejectedCount: this.rejectedCount,
        allowFilterCount: this.allowFilterCount,
        blockFilterCount: this.blockFilterCount,
        discardedCount: this.discardedCount,
        categories: categoriesToSelfie(this.categories),
        dataFilters: dataFiltersToSelfie(this.dataFilters)
    };
};
|
|
|
|
|
|
|
|
|
|
/******************************************************************************/
|
|
|
|
|
|
|
|
|
|
FilterContainer.prototype.fromSelfie = function(selfie) {
    // Restore the container from an object created by `toSelfie()`.
    // Entries are added to the existing `categories` and `dataFilters`
    // maps: nothing is cleared here.
    this.frozen = true;
    this.processedFilterCount = selfie.processedFilterCount;
    this.acceptedCount = selfie.acceptedCount;
    this.rejectedCount = selfie.rejectedCount;
    this.allowFilterCount = selfie.allowFilterCount;
    this.blockFilterCount = selfie.blockFilterCount;
    this.discardedCount = selfie.discardedCount;

    // `selfie.categories` is a sequence of lines:
    //   `k1\t...` opens a new category,
    //   `k2\t...` sets the token hash for the filter which follows,
    //   anything else is a compiled filter.
    var categories = this.categories,
        lineIter = new µb.LineIterator(selfie.categories),
        category, tokenHash, line;
    while ( lineIter.eot() === false ) {
        line = lineIter.next();
        if ( line.startsWith('k1\t') ) { // category bits
            category = new Map();
            categories.set(importInt(line.slice(3)), category);
            continue;
        }
        if ( line.startsWith('k2\t') ) { // token hash
            tokenHash = importInt(line.slice(3));
            continue;
        }
        category.set(tokenHash, filterFromCompiledData(line));
    }

    // Entries are loaded last to first, each one being put in front of
    // its bucket: the chains thus end up in the order in which they
    // appear in `selfie.dataFilters`.
    var i = selfie.dataFilters.length,
        entry, head;
    while ( i-- ) {
        entry = FilterDataHolderEntry.load(selfie.dataFilters[i]);
        head = this.dataFilters.get(entry.tokenHash);
        if ( head !== undefined ) {
            entry.next = head;
        }
        this.dataFilters.set(entry.tokenHash, entry);
    }
};
|
|
|
|
|
|
|
|
|
|
/******************************************************************************/
|
|
|
|
|
|
2015-02-24 00:31:29 +01:00
|
|
|
|
FilterContainer.prototype.compile = function(raw, out) {
    // Compile one raw filter line and push the result into `out`.
    // Returns false when the line is empty, is a cosmetic filter, or is
    // not supported (the latter is reported to the logger); returns true
    // once the filter has been handed over for output.
    //
    // The compiled filter data is made of up to three units separated by
    // `\v`, in this order: data holder (if the filter carries data),
    // origin (if there is a `domain=` option), then the unit for the
    // pattern itself.

    // ORDER OF TESTS IS IMPORTANT!

    // Ignore empty lines
    var s = raw.trim();
    if ( s.length === 0 ) {
        return false;
    }

    var parsed = this.filterParser.parse(s);

    // Ignore element-hiding filters
    if ( parsed.elemHiding ) {
        return false;
    }

    // Ignore filters with unsupported options
    if ( parsed.unsupported ) {
        µb.logger.writeOne('', 'error', 'Network filtering – invalid filter: ' + raw);
        return false;
    }

    // Pure hostnames, use more efficient dictionary lookup
    // https://github.com/chrisaljoudi/uBlock/issues/665
    // Create a dict keyed on request type etc.
    if (
        parsed.hostnamePure &&
        parsed.domainOpt === '' &&
        parsed.dataType === undefined &&
        this.compileHostnameOnlyFilter(parsed, out)
    ) {
        return true;
    }

    parsed.makeToken();

    var fdata = '';
    if ( parsed.dataType !== undefined ) {
        fdata += FilterDataHolder.compile(parsed);
    }
    if ( parsed.domainOpt !== '' ) {
        if ( fdata !== '' ) { fdata += '\v'; }
        fdata += FilterOrigin.compile(parsed);
    }
    if ( fdata !== '' ) { fdata += '\v'; }

    // Select the unit for the pattern: first match wins.
    var anchor = parsed.anchor;
    if ( parsed.isRegex ) {
        fdata += FilterRegex.compile(parsed);
    } else if ( parsed.hostnamePure ) {
        fdata += FilterPlainHostname.compile(parsed);
    } else if ( parsed.f === '*' ) {
        fdata += FilterTrue.compile();
    } else if ( anchor === 0x5 ) {
        // https://github.com/gorhill/uBlock/issues/1669
        fdata += FilterGenericHnAndRightAnchored.compile(parsed);
    } else if (
        this.reIsGeneric.test(parsed.f) ||
        parsed.tokenHash === parsed.noTokenHash
    ) {
        // Pattern with `^`/`*`, or for which no token was found.
        fdata += anchor === 0x4 ?
            FilterGenericHnAnchored.compile(parsed) :
            FilterGeneric.compile(parsed);
    } else if ( anchor === 0x4 ) {
        fdata += FilterPlainHnAnchored.compile(parsed);
    } else if ( anchor === 0x2 ) {
        fdata += FilterPlainLeftAnchored.compile(parsed);
    } else if ( anchor === 0x1 ) {
        fdata += FilterPlainRightAnchored.compile(parsed);
    } else if ( parsed.tokenBeg === 0 ) {
        fdata += FilterPlainPrefix0.compile(parsed);
    } else if ( parsed.tokenBeg === 1 ) {
        fdata += FilterPlainPrefix1.compile(parsed);
    } else {
        fdata += FilterPlain.compile(parsed);
    }

    this.compileToAtomicFilter(fdata, parsed, out);

    return true;
};
|
|
|
|
|
|
|
|
|
|
/******************************************************************************/
|
|
|
|
|
|
2015-02-05 00:06:31 +01:00
|
|
|
|
// Using fast/compact dictionary when filter is a (or portion of) pure hostname.
|
|
|
|
|
|
2015-02-24 00:31:29 +01:00
|
|
|
|
FilterContainer.prototype.compileHostnameOnlyFilter = function(parsed, out) {
    // Output a pure-hostname filter. Each record is pushed as
    // (route, `<category bits>\v<dot token hash>\v<hostname>`), the route
    // being 1 for a `badfilter` filter, 0 otherwise. Always returns true.
    //
    // https://github.com/gorhill/uBlock/issues/1757
    // Filters with a `domain=` option no longer reach this method, hence
    // there is no need to test for them here.
    var route = parsed.badFilter ? 0x01 : 0x00,
        categoryBits = parsed.action | parsed.important | parsed.party,
        tail = '\v' + this.exportedDotTokenHash + '\v' + parsed.f,
        type = parsed.types,
        bitOffset = 1;

    // No explicit type: a single record, with no type in the category bits.
    if ( type === 0 ) {
        out.push(route, exportInt(categoryBits) + tail);
        return true;
    }

    // One record per type bit set; the 1-based position of the bit is
    // stored in the category bits, shifted left by 4.
    while ( type !== 0 ) {
        if ( type & 1 ) {
            out.push(route, exportInt(categoryBits | (bitOffset << 4)) + tail);
        }
        bitOffset += 1;
        type >>>= 1;
    }
    return true;
};
|
|
|
|
|
|
|
|
|
|
/******************************************************************************/
|
|
|
|
|
|
2017-05-12 16:35:11 +02:00
|
|
|
|
FilterContainer.prototype.compileToAtomicFilter = function(fdata, parsed, out) {
    // Output a compiled filter. Each record is pushed as
    // (route, `<category bits>\v<token hash>\v<fdata>`), the route being 1
    // for a `badfilter` filter, 0 otherwise. A filter with explicit types
    // yields one record per type, and may additionally yield redirect
    // rules. Returns nothing.
    var route = parsed.badFilter ? 0x01 : 0x00,
        categoryBits = parsed.action | parsed.important | parsed.party,
        tail = '\v' + exportInt(parsed.tokenHash) + '\v' + fdata,
        type = parsed.types,
        bitOffset = 1;

    // No explicit type: a single record, with no type in the category bits.
    if ( type === 0 ) {
        out.push(route, exportInt(categoryBits) + tail);
        return;
    }

    // One record per type bit set; the 1-based position of the bit is
    // stored in the category bits, shifted left by 4.
    while ( type !== 0 ) {
        if ( type & 1 ) {
            out.push(route, exportInt(categoryBits | (bitOffset << 4)) + tail);
        }
        bitOffset += 1;
        type >>>= 1;
    }

    // Only static filter with an explicit type can be redirected. If we reach
    // this point, it's because there is one or more explicit type.
    if ( !parsed.redirect ) {
        return;
    }

    // No redirect rule is created for a `badfilter` filter.
    if ( parsed.badFilter ) {
        return;
    }

    var redirects = µb.redirectEngine.compileRuleFromStaticFilter(parsed.raw);
    if ( Array.isArray(redirects) === false ) {
        return;
    }
    // Redirect rules are output last to first, with empty category bits
    // and token hash fields, and flagged with a leading `=>\t`.
    var i = redirects.length;
    while ( i-- ) {
        out.push(0, '\v\v=>\t' + redirects[i]);
    }
};
|
|
|
|
|
|
|
|
|
|
/******************************************************************************/
|
|
|
|
|
|
2016-08-13 22:42:58 +02:00
|
|
|
|
// Load compiled filters, one per line, from `lineIter` into this container.
//
// The first character of each line encodes flag bits relative to 'a':
//   bit 2 set: stop reading and return immediately;
//   bit 1 set: the rest of the line is URI-encoded and is decoded first;
//   bit 0 set: the line is recorded in `badFilters` rather than loaded.
// The rest of the line holds '\v'-separated fields: category bits, token
// hash, then the compiled filter data.
//
// lineIter: iterator exposing eot(), charCodeAt() and next()
FilterContainer.prototype.fromCompiledContent = function(lineIter) {
    var fields = new µb.FieldIterator('\v'),
        dataHolderFid = FilterDataHolder.fidPrefix,
        bucketFid = FilterBucket.fidPrefix,
        baseCharCode = 'a'.charCodeAt(0),
        flags, compiled, catBits, thash, fdata,
        tokenMap, existing, chainHead, dataEntry, filter;

    while ( lineIter.eot() === false ) {
        flags = lineIter.charCodeAt(0) - baseCharCode;
        if ( (flags & 0x04) !== 0 ) { return; }

        compiled = lineIter.next(1);
        if ( (flags & 0x02) !== 0 ) {
            compiled = decodeURIComponent(compiled);
        }
        if ( (flags & 0x01) !== 0 ) {
            this.badFilters.add(compiled);
            continue;
        }

        catBits = importInt(fields.first(compiled));
        thash = importInt(fields.next());
        fdata = fields.remainder();

        // Redirect rules are not stored here: they are handed over to the
        // redirect engine and are not counted as accepted filters.
        if ( fdata.startsWith('=>\t') ) {
            µb.redirectEngine.fromCompiledRule(fdata.slice(3));
            continue;
        }

        // Everything from here on is a plain static filter.
        this.acceptedCount += 1;

        // Data-holding filters live in their own map, as a linked list per
        // token hash, because ALL of their hits must be reported at match
        // time (unlike other filters).
        if ( fdata.startsWith(dataHolderFid) ) {
            if ( this.duplicateBuster.has(compiled) ) {
                this.discardedCount += 1;
                continue;
            }
            this.duplicateBuster.add(compiled);
            dataEntry = new FilterDataHolderEntry(catBits, thash, fdata);
            chainHead = this.dataFilters.get(thash);
            if ( chainHead !== undefined ) {
                dataEntry.next = chainHead;
            }
            this.dataFilters.set(thash, dataEntry);
            continue;
        }

        // Find, or lazily create, the token map for this category.
        tokenMap = this.categories.get(catBits);
        if ( tokenMap === undefined ) {
            tokenMap = new Map();
            this.categories.set(catBits, tokenMap);
        }
        existing = tokenMap.get(thash);

        // Filters under the "dot" token hash are all collected into a single
        // hostname dictionary, which reports duplicates itself.
        if ( thash === this.dotTokenHash ) {
            if ( existing === undefined ) {
                existing = new FilterHostnameDict();
                tokenMap.set(this.dotTokenHash, existing);
            }
            if ( existing.add(fdata) === false ) {
                this.discardedCount += 1;
            }
            continue;
        }

        if ( this.duplicateBuster.has(compiled) ) {
            this.discardedCount += 1;
            continue;
        }
        this.duplicateBuster.add(compiled);

        //this.tokenHistogram.set(tokenHash, (this.tokenHistogram.get(tokenHash) || 0) + 1);

        // A slot holds a lone filter until a second filter hashes to the
        // same token, at which point it is promoted to a FilterBucket.
        filter = filterFromCompiledData(fdata);
        if ( existing === undefined ) {
            tokenMap.set(thash, filter);
        } else if ( existing.fidPrefix === bucketFid ) {
            existing.add(filter);
        } else {
            tokenMap.set(thash, new FilterBucket(existing, filter));
        }
    }
};
|
|
|
|
|
|
2017-05-12 16:35:11 +02:00
|
|
|
|
//FilterContainer.prototype.tokenHistogram = new Map();
|
|
|
|
|
|
2014-06-24 00:42:43 +02:00
|
|
|
|
/******************************************************************************/
|
|
|
|
|
|
2017-03-11 19:55:47 +01:00
|
|
|
|
// Remove from `categories` every filter whose compiled form was recorded in
// `badFilters`. Each recorded line holds '\v'-separated fields: category
// bits, token hash, then the compiled filter data used to identify the
// filter to remove.
FilterContainer.prototype.removeBadFilters = function() {
    var badLines = µb.setToArray(this.badFilters),
        fields = new µb.FieldIterator('\v'),
        catBits, thash, fdata, tokenMap, slot;

    // Walk the recorded lines from last to first.
    for ( var idx = badLines.length - 1; idx >= 0; idx-- ) {
        catBits = importInt(fields.first(badLines[idx]));
        tokenMap = this.categories.get(catBits);
        if ( tokenMap === undefined ) { continue; }

        thash = importInt(fields.next());
        slot = tokenMap.get(thash);
        if ( slot === undefined ) { continue; }

        fdata = fields.remainder();

        if ( slot instanceof FilterBucket ) {
            // A bucket left with exactly one filter is replaced by that
            // filter.
            slot.remove(fdata);
            if ( slot.filters.length === 1 ) {
                tokenMap.set(thash, slot.filters[0]);
            }
        } else if ( slot instanceof FilterHostnameDict ) {
            // An emptied dictionary is dropped, and so is its category if
            // nothing else remains in it.
            slot.remove(fdata);
            if ( slot.size === 0 ) {
                tokenMap.delete(thash);
                if ( tokenMap.size === 0 ) {
                    this.categories.delete(catBits);
                }
            }
        } else if ( slot.compile() === fdata ) {
            // Lone filter: removed only if it compiles to the same data.
            tokenMap.delete(thash);
            if ( tokenMap.size === 0 ) {
                this.categories.delete(catBits);
            }
        }
    }
};
|
|
|
|
|
|
|
|
|
|
/******************************************************************************/
|
|
|
|
|
|
2017-05-12 16:35:11 +02:00
|
|
|
|
// Collect the data strings of ALL data-holding filters matching a URL.
//
// dataType:   not used by this implementation.
// requestURL: URL to test.
// out:        array; receives the data string of every matching filter
//             which is still in force once overrides have been resolved
//             (`important` filters first, then ordinary ones).
// outlog:     optional array; when provided, receives one log entry per
//             filter kept (result = 1) and per exception filter (result = 2).
//
// Category bit 0 marks an exception (allow) filter, bit 1 marks an
// `important` filter. Filters are keyed by their data string, hence at most
// one filter per distinct data string is reported in each group.
FilterContainer.prototype.matchAndFetchData = function(dataType, requestURL, out, outlog) {
    // `dataFilters` is a Map: its entry count is `size`. Testing `length`
    // (always undefined on a Map) meant this fast path was never taken.
    if ( this.dataFilters.size === 0 ) { return; }

    var url = this.urlTokenizer.setURL(requestURL);

    requestHostnameRegister = µb.URI.hostnameFromURI(url);

    // We need to visit ALL the matching filters.
    var toAddImportant = new Map(),
        toAdd = new Map(),
        toRemove = new Map();

    // File a matching entry under the group selected by its category bits.
    var classify = function(entry) {
        var dataStr = entry.filter.dataStr;
        if ( entry.categoryBits & 0x001 ) {
            toRemove.set(dataStr, entry);
        } else if ( entry.categoryBits & 0x002 ) {
            toAddImportant.set(dataStr, entry);
        } else {
            toAdd.set(dataStr, entry);
        }
    };

    var entry,
        tokenHashes = this.urlTokenizer.getTokens(),
        tokenHash, tokenOffset,
        i = 0;

    // Tokenized filters: the token buffer holds (hash, offset) pairs and is
    // terminated by a zero hash. At most 32 slots are scanned.
    while ( i < 32 ) {
        tokenHash = tokenHashes[i++];
        if ( tokenHash === 0 ) { break; }
        tokenOffset = tokenHashes[i++];
        entry = this.dataFilters.get(tokenHash);
        while ( entry !== undefined ) {
            if ( entry.filter.match(url, tokenOffset) === true ) {
                classify(entry);
            }
            entry = entry.next;
        }
    }

    // Untokenizable filters.
    entry = this.dataFilters.get(this.noTokenHash);
    while ( entry !== undefined ) {
        if ( entry.filter.match(url) === true ) {
            classify(entry);
        }
        entry = entry.next;
    }

    if ( toAddImportant.size === 0 && toAdd.size === 0 ) { return; }

    // Remove entries overridden by other filters.
    var iter, step, key;

    // An `important` filter wins over both the ordinary filter and the
    // exception filter holding the same data string.
    iter = toAddImportant.entries();
    for (;;) {
        step = iter.next();
        if ( step.done === true ) { break; }
        key = step.value[0];
        toAdd.delete(key);
        toRemove.delete(key);
    }

    // An exception filter cancels the ordinary filter with the same data
    // string; an exception with an empty data string cancels them all.
    iter = toRemove.entries();
    for (;;) {
        step = iter.next();
        if ( step.done === true ) { break; }
        key = step.value[0];
        if ( key === '' ) {
            toAdd.clear();
            break;
        }
        toAdd.delete(key);
    }

    // Emit one group: optionally push each data string to `out`, and log
    // each entry with the given result code when `outlog` was provided.
    var report = function(group, result, pushData) {
        var groupIter = group.entries(),
            item, logData;
        for (;;) {
            item = groupIter.next();
            if ( item.done === true ) { break; }
            if ( pushData ) {
                out.push(item.value[0]);
            }
            if ( outlog === undefined ) { continue; }
            logData = item.value[1].logData();
            logData.source = 'static';
            logData.result = result;
            outlog.push(logData);
        }
    };

    report(toAddImportant, 1, true);
    report(toAdd, 1, true);
    // Exception filters contribute no data, they are only logged.
    if ( outlog !== undefined ) {
        report(toRemove, 2, false);
    }
};
|
|
|
|
|
|
|
|
|
|
/******************************************************************************/
|
|
|
|
|
|
2016-09-12 16:22:25 +02:00
|
|
|
|
// bucket: Map
|
|
|
|
|
// url: string
|
|
|
|
|
|
2014-12-28 16:07:43 +01:00
|
|
|
|
// Look for the first filter in `bucket` matching the current request.
//
// Lookup order: the hostname dictionary stored under the "dot" token hash,
// then the filter stored under each token of the tokenized URL, then the
// filter stored under the "no token" hash.
//
// On a hit, `thRegister` receives the token hash under which the filter was
// found, `fRegister` receives the filter, and true is returned. On a miss,
// false is returned and both registers are left untouched.
FilterContainer.prototype.matchTokens = function(bucket, url) {
    var candidate, tokens, hash, pos;

    // Hostname-only filters
    candidate = bucket.get(this.dotTokenHash);
    if ( candidate !== undefined && candidate.match() ) {
        this.thRegister = this.dotTokenHash;
        this.fRegister = candidate;
        return true;
    }

    // Tokenized filters: the token buffer holds (hash, offset) pairs and is
    // terminated by a zero hash.
    tokens = this.urlTokenizer.getTokens();
    for ( pos = 0; (hash = tokens[pos]) !== 0; pos += 2 ) {
        candidate = bucket.get(hash);
        if ( candidate === undefined ) { continue; }
        if ( candidate.match(url, tokens[pos + 1]) === true ) {
            this.thRegister = hash;
            this.fRegister = candidate;
            return true;
        }
    }

    // Untokenizable filters
    candidate = bucket.get(this.noTokenHash);
    if ( candidate !== undefined && candidate.match(url) === true ) {
        this.thRegister = this.noTokenHash;
        this.fRegister = candidate;
        return true;
    }

    return false;
};
|
|
|
|
|
|
|
|
|
|
/******************************************************************************/
|
|
|
|
|
|
2014-07-30 02:07:08 +02:00
|
|
|
|
// Specialized handlers
|
|
|
|
|
|
2016-11-08 13:13:26 +01:00
|
|
|
|
// https://github.com/gorhill/uBlock/issues/1477
|
|
|
|
|
// Special case: blocking-generichide filter ALWAYS exists, it is implicit --
|
|
|
|
|
// thus we always first check for exception filters, then for important block
|
|
|
|
|
// filter if and only if there was a hit on an exception filter.
|
|
|
|
|
// https://github.com/gorhill/uBlock/issues/2103
|
|
|
|
|
// User may want to override `generichide` exception filters.
|
|
|
|
|
|
|
|
|
|
// Evaluate `generichide` filters against a URL.
//
// Returns:
//   0: no `generichide` exception filter matches (`fRegister` is cleared);
//   1: an exception filter matches, but an important `generichide` block
//      filter overrides it;
//   2: an exception filter matches and nothing overrides it.
// For results 1 and 2, `cbRegister` holds the category which decided.
//
// `context` is not used by this implementation.
FilterContainer.prototype.matchStringGenericHide = function(context, requestURL) {
    var url = this.urlTokenizer.setURL(requestURL);

    // https://github.com/gorhill/uBlock/issues/2225
    //   Important: this is used by FilterHostnameDict.match().
    requestHostnameRegister = µb.URI.hostnameFromURI(url);

    var exceptions = this.categories.get(genericHideException);
    if ( exceptions && this.matchTokens(exceptions, url) !== false ) {
        // An exception applies: see whether the user overrides it.
        var overrides = this.categories.get(genericHideImportant);
        if ( overrides && this.matchTokens(overrides, url) ) {
            this.cbRegister = genericHideImportant;
            return 1;
        }
        this.cbRegister = genericHideException;
        return 2;
    }

    // No exception filter: the implicit blocking-generichide stands.
    this.fRegister = null;
    return 0;
};
|
|
|
|
|
|
|
|
|
|
/******************************************************************************/
|
|
|
|
|
|
2015-04-07 03:26:05 +02:00
|
|
|
|
// https://github.com/chrisaljoudi/uBlock/issues/116
|
2016-11-08 13:13:26 +01:00
|
|
|
|
// Some types of requests are exceptional: they need custom handling,
|
|
|
|
|
// not the generic handling.
|
2014-07-30 03:10:00 +02:00
|
|
|
|
|
2014-12-28 16:07:43 +01:00
|
|
|
|
// Match a URL against filters declared for exactly `requestType`: the
// "any type" categories are not consulted here.
//
// Returns:
//   0: no filter applies (also returned for an unknown request type);
//   1: the request is blocked;
//   2: a block filter matches but an allow filter overrides it.
// On a hit, `fRegister`, `thRegister` and `cbRegister` describe the filter
// which decided the result.
//
// The 'generichide' type is delegated to matchStringGenericHide().
FilterContainer.prototype.matchStringExactType = function(context, requestURL, requestType) {
    // Special cases.
    if ( requestType === 'generichide' ) {
        return this.matchStringGenericHide(context, requestURL);
    }

    var type = typeNameToTypeValue[requestType];
    if ( type === undefined ) { return 0; }

    // Prime tokenizer: we get a normalized URL in return.
    var url = this.urlTokenizer.setURL(requestURL);

    // These registers will be used by various filters
    pageHostnameRegister = context.pageHostname || '';
    requestHostnameRegister = µb.URI.hostnameFromURI(url);

    var party = ThirdParty;
    if ( isFirstParty(context.pageDomain, requestHostnameRegister) ) {
        party = FirstParty;
    }
    var categories = this.categories,
        catBits, bucket;

    this.fRegister = null;

    // https://github.com/chrisaljoudi/uBlock/issues/139
    //   Important block filters: a hit is final, allow filters are not
    //   consulted.
    catBits = BlockAnyParty | Important | type;
    bucket = categories.get(catBits);
    if ( bucket && this.matchTokens(bucket, url) ) {
        this.cbRegister = catBits;
        return 1;
    }
    catBits = BlockAction | Important | type | party;
    bucket = categories.get(catBits);
    if ( bucket && this.matchTokens(bucket, url) ) {
        this.cbRegister = catBits;
        return 1;
    }

    // Ordinary block filters: stop at the first category with a hit.
    catBits = BlockAnyParty | type;
    bucket = categories.get(catBits);
    if ( bucket && this.matchTokens(bucket, url) ) {
        this.cbRegister = catBits;
    }
    if ( this.fRegister === null ) {
        catBits = BlockAction | type | party;
        bucket = categories.get(catBits);
        if ( bucket && this.matchTokens(bucket, url) ) {
            this.cbRegister = catBits;
        }
    }

    // If there is no block filter, no need to test against allow filters
    if ( this.fRegister === null ) { return 0; }

    // Allow filters: a hit overrides the block filter found above.
    catBits = AllowAnyParty | type;
    bucket = categories.get(catBits);
    if ( bucket && this.matchTokens(bucket, url) ) {
        this.cbRegister = catBits;
        return 2;
    }
    catBits = AllowAction | type | party;
    bucket = categories.get(catBits);
    if ( bucket && this.matchTokens(bucket, url) ) {
        this.cbRegister = catBits;
        return 2;
    }

    return 1;
};
|
|
|
|
|
|
|
|
|
|
/******************************************************************************/
|
|
|
|
|
|
2014-12-28 16:07:43 +01:00
|
|
|
|
// Match the request described by `context` against the static filters.
//
// context: object providing requestType, requestURL, requestHostname,
//          pageHostname and pageDomain.
//
// Returns:
//   0: no filter applies;
//   1: the request is blocked;
//   2: a block filter matches but an allow filter overrides it.
// On a hit, `fRegister`, `thRegister` and `cbRegister` describe the filter
// which decided the result.
FilterContainer.prototype.matchString = function(context) {
    // https://github.com/chrisaljoudi/uBlock/issues/519
    //   Anything beyond `other` goes through exact type matching, while an
    //   unknown type is handled as `other`.
    var type = typeNameToTypeValue[context.requestType];
    if ( type !== undefined && (type === 0 || type > otherTypeBitValue) ) {
        return this.matchStringExactType(context, context.requestURL, context.requestType);
    }
    if ( type === undefined ) {
        type = otherTypeBitValue;
    }

    // The logic here is simple:
    //
    //   block = !whitelisted &&  blacklisted
    //   or equivalent
    //   allow =  whitelisted || !blacklisted
    //
    // Statistically, the most likely outcome for a URL is "no hit", then a
    // hit on a block filter, then a hit on an allow filter. Hence block
    // filters are tested first, and allow filters are tested *only* when a
    // block filter was hit: testing them upfront would mostly be wasted
    // work.

    // Prime tokenizer: we get a normalized URL in return.
    var url = this.urlTokenizer.setURL(context.requestURL);

    // These registers will be used by various filters
    pageHostnameRegister = context.pageHostname || '';
    requestHostnameRegister = context.requestHostname;

    this.fRegister = null;

    var party = ThirdParty;
    if ( isFirstParty(context.pageDomain, context.requestHostname) ) {
        party = FirstParty;
    }
    var categories = this.categories,
        catBits, bucket;

    // https://github.com/chrisaljoudi/uBlock/issues/139
    //   Important block filters are tested first and a hit is final: allow
    //   filters get no chance to override them.
    catBits = BlockAnyTypeAnyParty | Important;
    bucket = categories.get(catBits);
    if ( bucket && this.matchTokens(bucket, url) ) {
        this.cbRegister = catBits;
        return 1;
    }
    catBits = BlockAnyType | Important | party;
    bucket = categories.get(catBits);
    if ( bucket && this.matchTokens(bucket, url) ) {
        this.cbRegister = catBits;
        return 1;
    }
    catBits = BlockAnyParty | Important | type;
    bucket = categories.get(catBits);
    if ( bucket && this.matchTokens(bucket, url) ) {
        this.cbRegister = catBits;
        return 1;
    }
    catBits = BlockAction | Important | type | party;
    bucket = categories.get(catBits);
    if ( bucket && this.matchTokens(bucket, url) ) {
        this.cbRegister = catBits;
        return 1;
    }

    // Ordinary block filters, from least to most specific category: once a
    // category yields a hit, the remaining ones are skipped.
    catBits = BlockAnyTypeAnyParty;
    bucket = categories.get(catBits);
    if ( bucket && this.matchTokens(bucket, url) ) {
        this.cbRegister = catBits;
    }
    if ( this.fRegister === null ) {
        catBits = BlockAnyType | party;
        bucket = categories.get(catBits);
        if ( bucket && this.matchTokens(bucket, url) ) {
            this.cbRegister = catBits;
        }
    }
    if ( this.fRegister === null ) {
        catBits = BlockAnyParty | type;
        bucket = categories.get(catBits);
        if ( bucket && this.matchTokens(bucket, url) ) {
            this.cbRegister = catBits;
        }
    }
    if ( this.fRegister === null ) {
        catBits = BlockAction | type | party;
        bucket = categories.get(catBits);
        if ( bucket && this.matchTokens(bucket, url) ) {
            this.cbRegister = catBits;
        }
    }

    // If there is no block filter, no need to test against allow filters
    if ( this.fRegister === null ) { return 0; }

    // Allow filters: a hit overrides the block filter found above.
    catBits = AllowAnyTypeAnyParty;
    bucket = categories.get(catBits);
    if ( bucket && this.matchTokens(bucket, url) ) {
        this.cbRegister = catBits;
        return 2;
    }
    catBits = AllowAnyType | party;
    bucket = categories.get(catBits);
    if ( bucket && this.matchTokens(bucket, url) ) {
        this.cbRegister = catBits;
        return 2;
    }
    catBits = AllowAnyParty | type;
    bucket = categories.get(catBits);
    if ( bucket && this.matchTokens(bucket, url) ) {
        this.cbRegister = catBits;
        return 2;
    }
    catBits = AllowAction | type | party;
    bucket = categories.get(catBits);
    if ( bucket && this.matchTokens(bucket, url) ) {
        this.cbRegister = catBits;
        return 2;
    }

    return 1;
};
|
|
|
|
|
|
|
|
|
|
/******************************************************************************/
|
|
|
|
|
|
2017-05-12 16:35:11 +02:00
|
|
|
|
// Describe the outcome of the last match operation for logging purposes.
//
// Returns undefined when no filter is held in `fRegister`. Otherwise returns
// the object built by toLogDataInternal() from the three registers,
// completed with:
//   source:    'static'
//   tokenHash: the token hash register
//   result:    2 when bit 0 of the category bits register is set, else 1
FilterContainer.prototype.toLogData = function() {
    if ( this.fRegister === null ) { return; }

    var details = toLogDataInternal(this.cbRegister, this.thRegister, this.fRegister);
    details.source = 'static';
    details.tokenHash = this.thRegister;

    var outcome;
    if ( this.fRegister === null ) {
        outcome = 0;
    } else if ( this.cbRegister & 1 ) {
        outcome = 2;
    } else {
        outcome = 1;
    }
    details.result = outcome;

    return details;
};
|
|
|
|
|
|
|
|
|
|
/******************************************************************************/
|
|
|
|
|
|
|
|
|
|
// Number of filters held: accepted filters minus those discarded afterwards.
FilterContainer.prototype.getFilterCount = function() {
    var accepted = this.acceptedCount,
        discarded = this.discardedCount;
    return accepted - discarded;
};
|
|
|
|
|
|
|
|
|
|
/******************************************************************************/
|
|
|
|
|
|
|
|
|
|
return new FilterContainer();
|
|
|
|
|
|
|
|
|
|
/******************************************************************************/
|
|
|
|
|
|
|
|
|
|
})();
|