From b696fbc25595063df3b05c73d7574c18450a8bed Mon Sep 17 00:00:00 2001 From: GlazerMann Date: Fri, 27 Dec 2024 08:34:47 -0600 Subject: [PATCH] add a bunch --- constants/bad_data.php | 18 ++++++++++++++++++ 1 file changed, 18 insertions(+) diff --git a/constants/bad_data.php b/constants/bad_data.php index 72b136aa05..7ad055c57a 100644 --- a/constants/bad_data.php +++ b/constants/bad_data.php @@ -569,6 +569,16 @@ const CANONICAL_PUBLISHER_URLS = [ '.acm.org', + 'archivespp.pl', + 'radicalphilosophy.com', + '.erudit.org', + 'metropolitics.org', + 'metropolitiques.eu', + 'revistas.upr.edu', + '.tci-thaijo.org', + 'tidsskrift.dk', + 'observatoria.rsl.ru', + 'britishartstudies.ac.uk', '.oup.com', 'academic.oup.com', 'aeaweb.org', @@ -616,10 +626,14 @@ 'psycnet.apa.org', 'publications.aap.org', 'pubs.geoscienceworld.org', + 'muse.jhu.edu', 'pubs.rsc.org', + 'xlink.rsc.org', 'sagepub.com', 'sagepublications.com', 'scholarpedia.org', + 'arc.aiaa.org', + 'bmcr.brynmawr.edu', 'schweizerbart.de', 'scielo.br', 'scielo.org', @@ -627,6 +641,7 @@ 'sciencemag.org', 'springer.com', 'tandfonline.com', + 'pyglobal.com', 'taylorandfrancis.com', 'thelancet.com', 'vertpala.ac.cn', @@ -653,6 +668,8 @@ 'perspectivia.net', 'shs.cairn.info', 'zaguan.unizar.es', + 'numdam.org', + 'works.bepress.com', ]; const PROXY_HOSTS_TO_ALWAYS_DROP = [ @@ -1134,6 +1151,7 @@ 'kijkcijferanalyse\.nl/', // highjacked ]; const NON_JOURNAL_WEBSITES = [ + 'ourworldindata.org/', '-news.co.uk/', '.ajc.com/', '.al.com/',