bypass-paywalls-firefox-clean/background.js

497 lines
14 KiB
JavaScript
Raw Normal View History

2017-07-08 19:40:29 +02:00
'use strict';
var defaultSites = {
'Algemeen Dagblad': 'ad.nl',
2017-07-08 19:40:29 +02:00
'Baltimore Sun': 'baltimoresun.com',
'Barron\'s': 'barrons.com',
2018-05-06 02:53:07 +02:00
'Bloomberg': 'bloomberg.com',
2019-10-06 19:28:35 +02:00
'Bloomberg Quint': 'bloombergquint.com',
2018-07-08 00:11:09 +02:00
'Business Insider': 'businessinsider.com',
'Caixin Global': 'caixinglobal.com',
2019-01-05 20:39:45 +01:00
'Chemical & Engineering News': 'cen.acs.org',
2017-07-08 19:40:29 +02:00
'Chicago Tribune': 'chicagotribune.com',
'Central Western Daily': 'centralwesterndaily.com.au',
'Crain\'s Chicago Business': 'chicagobusiness.com',
2018-04-06 08:22:58 +02:00
'Corriere Della Sera': 'corriere.it',
2017-07-08 19:40:29 +02:00
'Daily Press': 'dailypress.com',
'DeMorgen': 'demorgen.be',
2018-07-05 03:46:28 +02:00
'Denver Post': 'denverpost.com',
'De Tijd': 'tijd.be',
'De Groene Amsterdammer': 'groene.nl',
'de Volkskrant': 'volkskrant.nl',
2019-12-08 06:49:23 +01:00
'ET Prime': 'prime.economictimes.indiatimes.com',
2017-07-08 19:40:29 +02:00
'The Economist': 'economist.com',
'Eindhovens Dagblad': 'ed.nl',
2017-07-08 19:40:29 +02:00
'Financial Times': 'ft.com',
'Foreign Policy': 'foreignpolicy.com',
2017-07-08 19:40:29 +02:00
'Glassdoor': 'glassdoor.com',
'Haaretz': 'haaretz.co.il',
2018-04-23 11:20:40 +02:00
'Haaretz English': 'haaretz.com',
'Handelsblatt': 'handelsblatt.com',
'Harper\'s Magazine': 'harpers.org',
2017-07-08 19:40:29 +02:00
'Hartford Courant': 'courant.com',
'Harvard Business Review': 'hbr.org',
'Inc.com': 'inc.com',
2019-03-10 21:03:53 +01:00
'Investors Chronicle': 'investorschronicle.co.uk',
'L\'Echo': 'lecho.be',
2018-12-06 22:23:04 +01:00
'La Repubblica': 'repubblica.it',
'Le Monde': 'lemonde.fr',
'Le Parisien': 'leparisien.fr',
'Le Temps': 'letemps.ch',
'Les Echos': 'lesechos.fr',
'London Review of Books': 'lrb.co.uk',
2017-07-08 19:40:29 +02:00
'Los Angeles Times': 'latimes.com',
2018-01-31 06:08:11 +01:00
'Medium': 'medium.com',
2017-07-08 19:40:29 +02:00
'Medscape': 'medscape.com',
'MIT Technology Review': 'technologyreview.com',
2018-10-29 05:44:18 +01:00
'Mountain View Voice': 'mv-voice.com',
'National Post': 'nationalpost.com',
2018-07-23 03:55:35 +02:00
'New Statesman': 'newstatesman.com',
2019-02-19 02:25:35 +01:00
'New York Magazine': 'nymag.com',
2020-01-05 16:48:54 +01:00
'New Zealand Herald': 'nzherald.co.nz',
2020-01-05 16:52:24 +01:00
'Newcastle Herald': 'newcastleherald.com.au',
2017-07-08 19:40:29 +02:00
'Nikkei Asian Review': 'asia.nikkei.com',
2019-12-07 22:26:58 +01:00
'NK News': 'nknews.org',
2017-07-08 19:40:29 +02:00
'NRC': 'nrc.nl',
2018-10-29 05:44:18 +01:00
'Orange County Register': 'ocregister.com',
'Orlando Sentinel': 'orlandosentinel.com',
'Palo Alto Online': 'paloaltoonline.com',
'Parool': 'parool.nl',
2019-09-30 03:18:59 +02:00
'Quartz': 'qz.com',
2018-10-29 05:44:18 +01:00
'Quora': 'quora.com',
'Scientific American': 'scientificamerican.com',
2020-01-05 17:41:06 +01:00
'Scribd': 'scribd.com',
2019-07-11 19:48:40 +02:00
'Statista': 'statista.com',
2018-10-29 05:44:18 +01:00
'SunSentinel': 'sun-sentinel.com',
2020-01-05 16:31:22 +01:00
'Tech in Asia': 'techinasia.com',
'Telegraaf': 'telegraaf.nl',
2018-10-02 03:52:35 +02:00
'The Advocate': 'theadvocate.com.au',
'The Age': 'theage.com.au',
2020-01-05 13:02:44 +01:00
'The Athletic': 'theathletic.com',
2019-09-30 02:47:26 +02:00
'The Atlantic': 'theatlantic.com',
'The Australian': 'theaustralian.com.au',
2018-12-18 08:45:33 +01:00
'The Australian Financial Review': 'afr.com',
2019-09-30 02:27:24 +02:00
'The Boston Globe': 'bostonglobe.com',
2018-06-30 21:48:40 +02:00
'The Business Journals': 'bizjournals.com',
2019-05-13 01:40:27 +02:00
'The Diplomat': 'thediplomat.com',
2020-01-05 18:19:48 +01:00
'The Examiner': 'examiner.com.au',
'The Globe and Mail': 'theglobeandmail.com',
'The Herald': 'theherald.com.au',
2019-11-02 12:20:28 +01:00
'The Hindu': 'thehindu.com',
2018-09-09 22:21:36 +02:00
'The Japan Times': 'japantimes.co.jp',
2018-10-29 05:44:18 +01:00
'TheMarker': 'themarker.com',
2019-10-29 00:25:53 +01:00
'The Mercury Tasmania': 'themercury.com.au',
2018-01-31 06:08:11 +01:00
'The Mercury News': 'mercurynews.com',
2017-07-08 19:40:29 +02:00
'The Morning Call': 'mcall.com',
'The Nation': 'thenation.com',
'The New York Times': 'nytimes.com',
'The New Yorker': 'newyorker.com',
2019-01-05 20:39:45 +01:00
'The News-Gazette': 'news-gazette.com',
'The Philadelphia Inquirer': 'inquirer.com',
'The Saturday Paper': 'thesaturdaypaper.com.au',
2018-07-23 04:04:27 +02:00
'The Spectator': 'spectator.co.uk',
2017-07-08 19:40:29 +02:00
'The Seattle Times': 'seattletimes.com',
'The Sydney Morning Herald': 'smh.com.au',
'The Telegraph': 'telegraph.co.uk',
'The Times': 'thetimes.co.uk',
2018-08-29 01:15:23 +02:00
'The Toronto Star': 'thestar.com',
2017-07-08 19:40:29 +02:00
'The Washington Post': 'washingtonpost.com',
2018-06-03 20:23:04 +02:00
'The Wall Street Journal': 'wsj.com',
2019-12-05 21:32:20 +01:00
'Times Literary Supplement': 'the-tls.co.uk',
'Towards Data Science': 'towardsdatascience.com',
'Trouw': 'trouw.nl',
'Vanity Fair': 'vanityfair.com',
'Vrij Nederland': 'vn.nl',
'Wired': 'wired.com',
2017-07-08 19:40:29 +02:00
};
2018-01-31 06:08:11 +01:00
const restrictions = {
'barrons.com': /.+barrons\.com\/articles\/.+/,
'prime.economictimes.indiatimes.com': /.+prime\.economictimes\.indiatimes\.com\/news\/[0-9]{8}\/.+/,
'wsj.com': /.+wsj\.com\/articles\/.+/
2017-07-08 19:40:29 +02:00
}
// Don't remove cookies before page load
2018-01-31 06:08:11 +01:00
const allow_cookies = [
'ad.nl',
2017-07-08 19:40:29 +02:00
'asia.nikkei.com',
'barrons.com',
2019-09-30 02:27:24 +02:00
'bostonglobe.com',
'caixinglobal.com',
2019-10-29 14:05:40 +01:00
'cen.acs.org',
'chicagobusiness.com',
'demorgen.be',
2018-07-05 03:46:28 +02:00
'denverpost.com',
'economist.com',
'ed.nl',
2018-10-07 07:18:34 +02:00
'examiner.com.au',
'ft.com',
'haaretz.co.il',
'haaretz.com',
'hacked.com',
'harpers.org',
2019-02-11 00:43:12 +01:00
'hbr.org',
'lecho.be',
'lemonde.fr',
'lesechos.fr',
'letemps.ch',
'medium.com',
'mercurynews.com',
'newstatesman.com',
2019-02-19 02:25:35 +01:00
'nymag.com',
'nytimes.com',
'ocregister.com',
'parool.nl',
'quora.com',
2019-10-23 13:52:04 +02:00
'qz.com',
'scientificamerican.com',
2020-01-05 17:41:06 +01:00
'scribd.com',
'spectator.co.uk',
'telegraaf.nl',
'telegraph.co.uk',
'theadvocate.com.au',
2019-10-29 14:05:40 +01:00
'theage.com.au',
2020-01-05 13:02:44 +01:00
'theathletic.com',
2019-11-13 12:35:23 +01:00
'theatlantic.com',
'theaustralian.com.au',
2019-10-29 14:05:40 +01:00
'thediplomat.com',
'themarker.com',
2019-10-29 00:25:53 +01:00
'themercury.com.au',
'thestar.com',
'thetimes.co.uk',
'towardsdatascience.com',
'trouw.nl',
'vn.nl',
'volkskrant.nl',
'washingtonpost.com',
'wsj.com',
2017-07-08 19:40:29 +02:00
]
// Removes cookies after page load
2018-01-31 06:08:11 +01:00
const remove_cookies = [
'ad.nl',
2017-07-08 19:40:29 +02:00
'asia.nikkei.com',
'bloombergquint.com',
2019-09-30 02:27:24 +02:00
'bostonglobe.com',
'caixinglobal.com',
2019-10-29 14:05:40 +01:00
'cen.acs.org',
'chicagobusiness.com',
'demorgen.be',
2018-07-05 03:46:28 +02:00
'denverpost.com',
'economist.com',
'ed.nl',
'examiner.com.au',
'ft.com',
'hacked.com',
'harpers.org',
'hbr.org',
'lecho.be',
'lesechos.fr',
'letemps.ch',
'medium.com',
'mercurynews.com',
2018-07-23 04:04:27 +02:00
'newstatesman.com',
'nymag.com',
'ocregister.com',
2019-10-23 13:52:04 +02:00
'qz.com',
'scientificamerican.com',
'spectator.co.uk',
'telegraaf.nl',
2018-09-28 16:39:45 +02:00
'theadvocate.com.au',
2019-10-29 14:05:40 +01:00
'theage.com.au',
2019-11-13 12:35:23 +01:00
'theatlantic.com',
2019-10-29 14:05:40 +01:00
'thediplomat.com',
'thestar.com',
'towardsdatascience.com',
'vn.nl',
'washingtonpost.com',
2017-07-08 19:40:29 +02:00
]
// select specific cookie(s) to hold from remove_cookies domains
const remove_cookies_select_hold = {
'washingtonpost.com': ['wp_gdpr'],
'qz.com': ['gdpr']
}
// select only specific cookie(s) to drop from remove_cookies domains
const remove_cookies_select_drop = {
'ad.nl': ['temptationTrackingId'],
'bostonglobe.com': ['FMPaywall'],
'caixinglobal.com': ['CAIXINGLB_LOGIN_UUID'],
'demorgen.be': ['TID_ID'],
'economist.com': ['rvuuid'],
'ed.nl': ['temptationTrackingId'],
'nrc.nl': ['counter']
}
// Override User-Agent with Googlebot
const use_google_bot = [
'barrons.com',
2020-01-05 13:02:44 +01:00
'haaretz.co.il',
'haaretz.com',
'lemonde.fr',
2020-01-05 13:02:44 +01:00
'nknews.org',
'prime.economictimes.indiatimes.com',
'quora.com',
'telegraph.co.uk',
2020-01-05 13:02:44 +01:00
'theathletic.com',
'theaustralian.com.au',
2020-01-05 13:02:44 +01:00
'themarker.com',
2019-10-29 00:25:53 +01:00
'themercury.com.au',
'thetimes.co.uk',
2019-12-07 22:26:58 +01:00
'wsj.com',
]
2017-07-08 19:40:29 +02:00
function setDefaultOptions() {
browser.storage.sync.set({
sites: defaultSites
}, function() {
browser.runtime.openOptionsPage();
});
}
// to block external script also add domain to manifest.json (permissions)
const blockedRegexes = {
'chicagotribune.com': /.+:\/\/.+\.tribdss\.com\//,
'thenation.com': /thenation\.com\/.+\/paywall-script\.php/,
'haaretz.co.il': /haaretz\.co\.il\/htz\/js\/inter\.js/,
'nzherald.co.nz': /nzherald\.co\.nz\/.+\/headjs\/.+\.js/,
'economist.com': /.+\.tinypass\.com\/.+/,
'lrb.co.uk': /.+\.tinypass\.com\/.+/,
'bostonglobe.com': /meter\.bostonglobe\.com\/js\/.+/,
'foreignpolicy.com': /.+\.tinypass\.com\/.+/,
'inquirer.com': /.+\.tinypass\.com\/.+/,
2020-01-05 16:48:54 +01:00
'spectator.co.uk': /.+\.tinypass\.com\/.+/,
'newcastleherald.com.au': /.+cdn-au\.piano\.io\/api\/tinypass.+\.js/,
'afr.com': /afr\.com\/assets\/vendorsReactRedux_client.+\.js/,
'theglobeandmail.com': /theglobeandmail\.com\/pb\/resources\/scripts\/build\/chunk-bootstraps\/.+\.js/,
'leparisien.fr': /.+\.tinypass\.com\/.+/,
'lesechos.fr': /.+\.tinypass\.com\/.+/,
'nytimes.com': /(.+meter-svc\.nytimes\.com\/meter\.js.+|.+mwcm\.nyt\.com\/.+\.js)/
};
2017-07-08 19:40:29 +02:00
const userAgentDesktop = "Mozilla/5.0 (compatible; Googlebot/2.1; +http://www.google.com/bot.html)"
const userAgentMobile = "Chrome/41.0.2272.96 Mobile Safari/537.36 (compatible ; Googlebot/2.1 ; +http://www.google.com/bot.html)"
2017-07-08 19:40:29 +02:00
var enabledSites = [];
// Get the enabled sites
browser.storage.sync.get({
sites: {}
}, function(items) {
var sites = items.sites;
enabledSites = Object.keys(items.sites).map(function(key) {
return items.sites[key];
});
});
// Listen for changes to options
browser.storage.onChanged.addListener(function(changes, namespace) {
var key;
for (key in changes) {
var storageChange = changes[key];
if (key === 'sites') {
var sites = storageChange.newValue;
enabledSites = Object.keys(sites).map(function(key) {
return sites[key];
});
}
}
});
// Set and show default options on install
browser.runtime.onInstalled.addListener(function(details) {
2017-07-08 19:40:29 +02:00
if (details.reason == "install") {
setDefaultOptions();
} else if (details.reason == "update") {
// User updated extension
}
});
// Disable javascript for these sites
chrome.webRequest.onBeforeRequest.addListener(function(details) {
if (!isSiteEnabled(details) || details.url.indexOf("mod=rsswn") !== -1) {
return;
}
return {cancel: true};
},
{
urls: ["*://*.newstatesman.com/*"],
types: ["script"]
},
["blocking"]
);
2019-02-11 00:43:12 +01:00
browser.webRequest.onBeforeSendHeaders.addListener(function(details) {
var requestHeaders = details.requestHeaders;
var header_referer = '';
for (var n in requestHeaders) {
if (requestHeaders[n].name.toLowerCase() == 'referer') {
header_referer = requestHeaders[n].value;
continue;
}
}
// check for blocked regular expression: domain enabled, match regex, block on an internal or external regex
for (var domain in blockedRegexes) {
if ((isSiteEnabled({url: '.'+ domain}) || isSiteEnabled({url: header_referer})) && details.url.match(blockedRegexes[domain])) {
if (details.url.indexOf(domain) !== -1 || header_referer.indexOf(domain) !== -1) {
// allow BG paywall-script to set cookies in homepage/sections (else no article-text)
if (details.url.indexOf('meter.bostonglobe.com/js/') !== -1 && (header_referer === 'https://www.bostonglobe.com/'
|| header_referer.indexOf('/?p1=BGHeader_') !== -1 || header_referer.indexOf('/?p1=BGMenu_') !== -1)) {
break;
}
return { cancel: true };
}
}
2017-07-08 19:40:29 +02:00
}
if (!isSiteEnabled(details)) {
return;
2018-11-24 23:10:21 +01:00
}
2017-07-08 19:40:29 +02:00
var tabId = details.tabId;
var useUserAgentMobile = false;
2017-07-08 19:40:29 +02:00
var setReferer = false;
// if referer exists, set it to google
requestHeaders = requestHeaders.map(function(requestHeader) {
2017-07-08 19:40:29 +02:00
if (requestHeader.name === 'Referer') {
if (details.url.indexOf("cooking.nytimes.com/api/v1/users/bootstrap") !== -1) {
// this fixes images not being loaded on cooking.nytimes.com main page
// referrer has to be *nytimes.com otherwise returns 403
requestHeader.value = 'https://cooking.nytimes.com';
2019-02-21 04:37:08 +01:00
} else if (details.url.indexOf("wsj.com") !== -1 || details.url.indexOf("ft.com") !== -1) {
requestHeader.value = 'https://www.facebook.com/';
} else {
requestHeader.value = 'https://www.google.com/';
}
setReferer = true;
}
if (requestHeader.name === 'User-Agent') {
useUserAgentMobile = requestHeader.value.toLowerCase().includes("mobile");
}
return requestHeader;
});
2017-07-08 19:40:29 +02:00
// otherwise add it
if (!setReferer) {
if (details.url.indexOf("wsj.com") !== -1) {
requestHeaders.push({
name: 'Referer',
value: 'https://www.facebook.com/'
});
} else {
requestHeaders.push({
name: 'Referer',
value: 'https://www.google.com/'
});
}
}
2017-07-08 19:40:29 +02:00
// override User-Agent to use Googlebot
var useGoogleBot = use_google_bot.filter(function(item) {
return typeof item == 'string' && details.url.indexOf(item) > -1;
}).length > 0;
if (useGoogleBot) {
requestHeaders.push({
"name": "User-Agent",
"value": useUserAgentMobile ? userAgentMobile : userAgentDesktop
})
requestHeaders.push({
"name": "X-Forwarded-For",
"value": "66.249.66.1"
})
2017-07-08 19:40:29 +02:00
}
// remove cookies before page load
requestHeaders = requestHeaders.map(function(requestHeader) {
for (var siteIndex in allow_cookies) {
if (details.url.indexOf(allow_cookies[siteIndex]) !== -1) {
return requestHeader;
}
}
if (requestHeader.name === 'Cookie') {
requestHeader.value = '';
}
return requestHeader;
});
if (tabId !== -1) {
// run contentScript inside tab
browser.tabs.executeScript(tabId, {
file: 'contentScript.js',
runAt: 'document_start'
}, function(res) {
if (browser.runtime.lastError || res[0]) {
return;
}
});
}
return { requestHeaders: requestHeaders };
}, {
urls: ['<all_urls>']
}, ['blocking', 'requestHeaders']);
// remove cookies after page load
browser.webRequest.onCompleted.addListener(function(details) {
for (var domainIndex in remove_cookies) {
var domainVar = remove_cookies[domainIndex];
if (!enabledSites.includes(domainVar) || details.url.indexOf(domainVar) === -1) {
continue; // don't remove cookies
}
browser.cookies.getAll({domain: domainVar}, function(cookies) {
for (var i=0; i<cookies.length; i++) {
2018-10-19 06:28:29 +02:00
var cookie = {
url: (cookies[i].secure ? "https://" : "http://") + cookies[i].domain + cookies[i].path,
name: cookies[i].name,
storeId: cookies[i].storeId
};
if (cookies[i].firstPartyDomain !== undefined) {
cookie.firstPartyDomain = cookies[i].firstPartyDomain;
}
var cookie_domain = cookies[i].domain;
var rc_domain = cookie_domain.replace(/^(\.?www\.|\.)/, '');
// hold specific cookie(s) from remove_cookies domains
if ((rc_domain in remove_cookies_select_hold) && remove_cookies_select_hold[rc_domain].includes(cookies[i].name)){
continue; // don't remove specific cookie
}
// drop only specific cookie(s) from remove_cookies domains
if ((rc_domain in remove_cookies_select_drop) && !(remove_cookies_select_drop[rc_domain].includes(cookies[i].name))){
continue; // only remove specific cookie
}
2018-10-19 06:28:29 +02:00
browser.cookies.remove(cookie);
2017-07-08 19:40:29 +02:00
}
});
}
}, {
urls: ["<all_urls>"]
2018-08-29 01:15:23 +02:00
});
2019-02-11 00:43:12 +01:00
function isSiteEnabled(details) {
var isEnabled = enabledSites.some(function(enabledSite) {
var useSite = (details.url.indexOf("." + enabledSite) !== -1 || details.url.indexOf("/" + enabledSite) !== -1);
2019-02-11 00:43:12 +01:00
if (enabledSite in restrictions) {
return useSite && details.url.match(restrictions[enabledSite]);
2019-02-11 00:43:12 +01:00
}
return useSite;
});
return isEnabled;
}
function getParameterByName(name, url) {
if (!url) url = window.location.href;
name = name.replace(/[\[\]]/g, '\\$&');
var regex = new RegExp('[?&]' + name + '(=([^&#]*)|&|#|$)'),
results = regex.exec(url);
if (!results) return null;
if (!results[2]) return '';
return decodeURIComponent(results[2].replace(/\+/g, ' '));
}