Skip to content

Commit

Permalink
Update bad_data.php
Browse files Browse the repository at this point in the history
  • Loading branch information
GlazerMann authored Dec 29, 2024
1 parent d7366f2 commit fa88eb5
Showing 1 changed file with 26 additions and 2 deletions.
28 changes: 26 additions & 2 deletions constants/bad_data.php
Original file line number Diff line number Diff line change
Expand Up @@ -574,6 +574,7 @@
'.ebscohost.com',
'.erudit.org',
'.ezproxy.',
'.hbr.org',
'.oup.com',
'.serialssolutions.com',
'.tci-thaijo.org',
Expand All @@ -597,8 +598,10 @@
'chestjournal.org',
'chestpubs.org',
'clinchem.org',
'computationalculture.net',
'degruyter.com',
'doi.apa.org',
'doi.library.ubc.ca',
'elsevier.com',
'emerald.com',
'emeraldinsight.com',
Expand All @@ -607,23 +610,25 @@
'frontiersin.org',
'fundacionmenteclara.org.ar',
'gsapubs.org',
'.hbr.org',
'heinonline.org/HOL/LandingPage?collection=journals',
'heinonline.org/HOL/LandingPage?handle=hein.journals',
'hindawi.com',
'hrcak.srce.hr',
'icce-ojs-tamu.tdl.org',
'ieeexplore.ieee.org',
'inderscience.com',
'interstices.ac.nz',
'iopscience.iop.org',
'iospress.com',
'iospress.nl',
'jamanetwork.com/journals',
'josis.org',
'journal.chestnet.org',
'journals.ametsoc.org',
'journals.ku.edu',
'journals.openedition.org',
'journals.royalsociety.org',
'journals.tdl.org',
'journals.uchicago.edu',
'journals.upress.ufl.edu',
'jwildlifedis.org',
Expand All @@ -634,11 +639,15 @@
'msptm.org',
'muse.jhu.edu',
'nature.com',
'neurology.org',
'noormags.com',
'noormags.ir',
'nrcresearchpress.',
'observatoria.rsl.ru',
'pensoft.net/journals',
'pipss.revues.org',
'placesjournal.org',
'plc.revues.org',
'pnas.org',
'polilog.pl',
'pressto.amu.edu.pl',
Expand All @@ -652,8 +661,10 @@
'pyglobal.com',
'qualitativecriminology.com',
'radicalphilosophy.com',
'recyt.fecyt.es',
'revistas.udd.cl',
'revistas.upr.edu',
'riviste.unimi.it',
'rjpn.org',
'sagepub.com',
'sagepublications.com',
Expand All @@ -668,6 +679,7 @@
'springer.com',
'tandfonline.com',
'taylorandfrancis.com',
'thebhs.org/publications',
'thelancet.com',
'tidsskrift.dk',
'umanisticadigitale.unibo.it',
Expand All @@ -680,7 +692,6 @@
'www.revistas.usp.br',
'xlink.rsc.org',
'zookeys.pensoft.net',
'doi.library.ubc.ca',
];

const JOURNAL_ARCHIVES_SITES = [
Expand All @@ -698,6 +709,7 @@
'perspectivia.net',
'works.bepress.com',
'zaguan.unizar.es',
'/doaj.org',
];

const PROXY_HOSTS_TO_ALWAYS_DROP = [
Expand Down Expand Up @@ -1211,9 +1223,11 @@
'.ft.com/',
'.google.com/',
'.hbw.com/',
'.healthaffairs.org/',
'.ietf.org/',
'.ign.com/',
'.jd.com/',
'.jove.com/',
'.lrb.co.uk/',
'.mic.com/',
'.muzines.co.uk/',
Expand All @@ -1226,6 +1240,7 @@
'.rt.com/',
'.svg.com/',
'.time.com/',
'.tnr.com/',
'.tvp.info/',
'.up.com/',
'.vk.com/',
Expand Down Expand Up @@ -1261,11 +1276,13 @@
'/ft.com/',
'/hbw.com/',
'/jd.com/',
'/jove.com/',
'/mic.com/',
'/nj.com/',
'/qq.com/',
'/rt.com/',
'/time.com/',
'/tnr.com/',
'/up.com/',
'/vk.com/',
'/x.com/',
Expand Down Expand Up @@ -1431,6 +1448,7 @@
'airspacemag.com/',
'airstream.com/',
'airvistara.com/',
'aisel.aisnet.org/',
'aisf.or.jp/',
'akasaair.com/',
'akitashoten.co.jp/',
Expand Down Expand Up @@ -1489,6 +1507,7 @@
'aparat.com/',
'apnews.com/',
'apple.com/',
'apress.com/',
'arabnews.com/',
'arcade-museum.com/',
'archdioceseofbombay.org/',
Expand Down Expand Up @@ -3113,6 +3132,7 @@
'curling.ca/',
'curling.org.nz/',
'curlingzone.com/',
'currentaffairs.org/',
'currentresults.com/',
'curtainup.com/',
'curtisbrown.co.uk/',
Expand Down Expand Up @@ -8769,6 +8789,7 @@
'politeianet.gr/',
'politicadigital.com.mx/',
'politicalgraveyard.com/',
'politicalresearch.org/',
'politicheagricole.it/',
'politico.com/',
'politics-prose.com/',
Expand Down Expand Up @@ -10645,6 +10666,7 @@
'taxfairnessabroad.org/',
'taxpolicycenter.org/',
'taxtimes.co.kr/',
'taylorfrancis.com/books/',
'tbheritage.com/',
'tbilisi.gov.ge/',
'tbs.co.jp/',
Expand All @@ -10662,6 +10684,7 @@
'tcpalm.com/',
'tcpipguide.com/',
'tdccolumbus.com/',
'tdcommons.org/',
'tdgarden.com/',
'tdplace.ca/',
'tdrsmusic.com/',
Expand Down Expand Up @@ -11895,6 +11918,7 @@
'watfordfc.com/',
'watson.de/',
'wba.co.uk/',
'wbc.poznan.pl/',
'weather-us.com/',
'weather.com/',
'weather.gov.sg/',
Expand Down

0 comments on commit fa88eb5

Please sign in to comment.