{-# LANGUAGE OverloadedStrings #-}
module Config.LinkLive where

import qualified Data.Text as T (isPrefixOf, isInfixOf, Text)

import Utils (setLike)

-- | Local relative path of the Markdown source file to which links are appended
-- via `writeLinkLiveTestcase`, so that they can be reviewed manually.
testPage :: FilePath
testPage = "lorem-link.md"

-- Domains excluded from link-live prioritization.
-- NOTE(review): the consumer of this list is not in this module; how entries are
-- matched (and what `setLike` from `Utils` enforces) should be confirmed there.
linkLivePrioritizeBlacklist :: [T.Text]
linkLivePrioritizeBlacklist =
  setLike
    [ "omega.albany.edu"
    ]
-- Minimum threshold used by link-live prioritization.
-- NOTE(review): presumably the minimum number of uses of a domain before it is
-- worth prioritizing for review — confirm against the caller.
linkLivePrioritizeMinimum :: Int
linkLivePrioritizeMinimum = 3

-- Hardwired per-URL overrides: URLs which should be live (currently none).
overrideLinkLive :: [T.Text]
overrideLinkLive = setLike []

-- Hardwired per-URL overrides: URLs which should not be live.
overrideLinkLiveNot :: [T.Text]
overrideLinkLiveNot =
  setLike
    [ "https://en.wikipedia.org/w/index.php?title=Genome-wide_complex_trait_analysis&oldid=871165308"
    ]

-- Domain pattern(s) identifying Wikipedia links.
-- NOTE(review): the leading dot suggests suffix matching on the host name, as
-- with the `*Sub` lists — confirm against the caller.
wikipediaURLs :: [T.Text]
wikipediaURLs =
  setLike
    [ ".wikipedia.org"
    ]

-- | Miscellaneous hand-written URL rules which cannot be expressed as a plain
-- domain lookup. Rules are tried in order; the first matching one wins.
--
-- Returns @Just True@ when the URL is known to work as a live popup,
-- @Just False@ when it is known not to, and @Nothing@ when no rule applies.
miscUrlRules :: T.Text -> Maybe Bool
miscUrlRules url
  -- YouTube embeds do not set X-FRAME options, which is why they work,
  -- while all other regular YouTube links do not:
  | startsWith "https://www.youtube.com/embed/" = Just True
  | startsWith "https://www.youtube.com/" = Just False
  -- Markdeep is a self-contained JS in-page-Markdown library, so the main
  -- homepage (regular HTML) works as a live popup, but the demos do not:
  -- they need to run JS, which live popup iframes don't allow.
  | startsWith "https://casual-effects.com" = Just (not isMarkdeepDemo)
  | otherwise = Nothing
  where
    -- Does the URL under test begin with the given prefix?
    startsWith :: T.Text -> Bool
    startsWith prefix = prefix `T.isPrefixOf` url

    -- Markdeep demo pages are recognizable by ".md.html" anywhere in the URL.
    isMarkdeepDemo :: Bool
    isMarkdeepDemo = ".md.html" `T.isInfixOf` url

-- All of these lists are tested using `isDomain` in `Test`; each list must contain only unique entries, and there must be no overlap within each pair: `goodDomainsSub`/`badDomainsSub`, `goodDomainsSimple`/`badDomainsSimple`, `goodLinks`/`badLinks`.
goodDomainsSub, goodDomainsSimple, badDomainsSub, badDomainsSimple, goodLinks, badLinks :: [T.Text]
-- Domain patterns with a leading dot, on the "good" side of the good/bad split.
-- NOTE(review): presumably matched as host-name suffixes (ie. any subdomain)
-- and treated as safe for live popups — confirm against the consumer.
goodDomainsSub =
  setLike
    [ ".allennlp.org"
    , ".archive.org"
    , ".archiveteam.org"
    , ".bandcamp.com"
    , ".eleuther.ai"
    , ".fandom.com"
    , ".github.io"
    , ".givewell.org"
    , ".greenspun.com"
    , ".imagemagick.org"
    , ".mementoweb.org"
    , ".metafilter.com"
    , ".nomeata.de"
    , ".obormot.net"
    , ".tumblr.com"
    , ".xkcd.com"
    , ".wordpress.com"
    , ".blogspot.com"
    ]
-- Exact host names (no leading dot, in contrast to `goodDomainsSub`) on the
-- "good" side of the good/bad split.
-- NOTE(review): presumably compared against the whole host name and treated as
-- safe for live popups — confirm against the consumer. Entry order is preserved
-- as-is, since what `setLike` does with ordering is not visible from here.
goodDomainsSimple = setLike
  [ "1dollarscan.com"
  , "humanprogress.org"
  , "6thfloor.blogs.nytimes.com"
  , "80000hours.org"
  , "abandonedfootnotes.blogspot.com"
  , "abcnews.go.com"
  , "abcnotation.com"
  , "about.google"
  , "academictorrents.com"
  , "aclanthology.org"
  , "ageing.oxfordjournals.org"
  , "ageofem.com"
  , "agtb.wordpress.com"
  , "ai.google"
  , "aiimpacts.org"
  , "aleph.se"
  , "alexanderetz.com"
  , "altjapan.typepad.com"
  , "andrewmayne.com"
  , "andymatuschak.org"
  , "andzuck.com"
  , "animekritik.wordpress.com"
  , "ansuz.sooke.bc.ca"
  , "apenwarr.ca"
  , "archinte.jamanetwork.com"
  , "architext.design"
  , "archivebox.io"
  , "archive.nytimes.com"
  , "archive.org"
  , "archive.seattletimes.com"
  , "arima.cylab.cmu.edu"
  , "arr.am"
  , "articles.latimes.com"
  , "asktog.com"
  , "bair.berkeley.edu"
  , "bam.kalzumeus.com"
  , "beepb00p.xyz"
  , "behavioralscientist.org"
  , "bellard.org"
  , "beza1e1.tuxen.de"
  , "bitcoin-otc.com"
  , "bits.blogs.nytimes.com"
  , "bldgblog.com"
  , "blog.8faces.com"
  , "blog.beeminder.com"
  , "blog.codinghorror.com"
  , "blog.cr.yp.to"
  , "blog.cryptographyengineering.com"
  , "blog.csdn.net"
  , "blog.ethereum.org"
  , "blog.google"
  , "blog.google.com"
  , "blog.nuclearsecrecy.com"
  , "blog.otoro.net"
  , "blog.pinboard.in"
  , "blog.regehr.org"
  , "blogs.lanecc.edu"
  , "blogs.wsj.com"
  , "blog.thinkst.com"
  , "blog.youtube"
  , "bmk.sh"
  , "boingboing.net"
  , "b-ok.cc"
  , "bwc.thelab.dc.gov"
  , "cacm.acm.org"
  , "caniuse.com"
  , "carbonplan.org"
  , "catonmat.net"
  , "cat-unbound.org" -- NOTE(review): possibly a typo of "cato-unbound.org" (cf. "www.cato-unbound.org" below) — confirm
  , "cdn.openai.com"
  , "cognitivemedium.com"
  , "commons.wikimedia.org"
  , "compdemocracy.org"
  , "complearn.org"
  , "conifer.rhizome.org"
  , "corpgov.law.harvard.edu"
  , "courses.csail.mit.edu"
  , "cran.r-project.org"
  , "crookedtimber.org"
  , "cs.stanford.edu"
  , "ctan.org"
  , "culture.org"
  , "daniellakens.blogspot.com"
  , "danluu.com"
  , "danwang.co"
  , "datacolada.org"
  , "dataprivacylab.org"
  , "davidepstein.com"
  , "dealbook.nytimes.com"
  , "defector.com"
  , "digital.library.unt.edu"
  , "distill.pub"
  , "diyhpl.us"
  , "docs.google.com"
  , "dominiccummings.com"
  , "donsbot.com"
  , "downloads.haskell.org"
  , "dresdencodak.com"
  , "dumps.wikimedia.org"
  , "dwarffortresswiki.org"
  , "e2eml.school"
  , "egamebook.com"
  , "eileenormsby.com"
  , "eli.thegreenplace.net"
  , "emilkirkegaard.dk"
  , "energycontrol.org"
  , "engineering.fb.com"
  , "en.wikibooks.org"
  , "en.wikichip.org"
  , "en.wikiquote.org"
  , "en.wikisource.org"
  , "en.wiktionary.org"
  , "eprint.iacr.org"
  , "equilibriabook.com"
  , "esolangs.org"
  , "etienne.se"
  , "eukaryotewritesblog.com"
  , "eva-fan.com"
  , "evaotaku.com"
  , "exac.broadinstitute.org"
  , "explorabl.es"
  , "extras.denverpost.com"
  , "familiarcycle.net"
  , "fastmoe.ai"
  , "fasttext.cc"
  , "files.eric.ed.gov"
  , "foreignpolicy.com"
  , "forre.st"
  , "forum.effectivealtruism.org"
  , "forum.evageeks.org"
  , "forum.quantifiedself.com"
  , "forums.animesuki.com"
  , "foundation.wikimedia.org"
  , "freedomdefined.org"
  , "fullfrontal.moe"
  , "futurism.com"
  , "galois.com"
  , "gamefaqs.gamespot.com"
  , "gameprogrammingpatterns.com"
  , "gaotianyu.xyz"
  , "gizmodo.com.au"
  , "globalguerrillas.typepad.com"
  , "globalvoices.org"
  , "gondwanaland.com"
  , "googleblog.blogspot.com"
  , "googleprojectzero.blogspot.com"
  , "google-summer-of-code-2009-haskell.googlecode.com"
  , "googlesystem.blogspot.com"
  , "gpt3demo.com"
  , "gradientscience.org"
  , "greaterwrong.com"
  , "ea.greaterwrong.com"
  , "arbital.greaterwrong.com"
  , "gutenberg.ca"
  , "gutenberg.net.au"
  , "guzey.com"
  , "gwern.net"
  , "hackage.haskell.org"
  , "hakaimagazine.com"
  , "handbook-5-1.cochrane.org"
  , "hapgood.us"
  , "harpers.org"
  , "hdsr.mitpress.mit.edu"
  , "healthland.time.com"
  , "herbsutter.com"
  , "highnoongmt.wordpress.com"
  , "historycooperative.org"
  , "hpmor.com"
  , "hub.darcs.net"
  , "ideas.repec.org"
  , "idlewords.com"
  , "ifdo.ca"
  , "iforcedabot.com"
  , "image-net.org"
  , "infoproc.blogspot.com"
  , "inhumanexperiment.blogspot.com"
  , "intelligence.org"
  , "iqcomparisonsite.com"
  , "isomerdesign.com"
  , "jakewestfall.org"
  , "jamesyu.org"
  , "japansociety.org"
  , "jasoncrawford.org"
  , "jaspervdj.be"
  , "jax.readthedocs.io"
  , "jaypsong.blog"
  , "jdlm.info"
  , "jessegalef.com"
  , "jetpress.org"
  , "jgeekstudies.org"
  , "joa.sh"
  , "johncwright.livejournal.com"
  , "jonmillward.com"
  , "journal.stuffwithstuff.com"
  , "jtauber.com"
  , "jtoomim.org"
  , "justgetflux.com"
  , "kajsotala.fi"
  , "kalzumeus.com"
  , "keras.io"
  , "kev.town"
  , "kk.org"
  , "knightcolumbia.org"
  , "kojimars.at.webry.info"
  , "komonews.com"
  , "krebsonsecurity.com"
  , "laion.ai"
  , "langsec.org"
  , "lavaan.ugent.be"
  , "learning.mpi-sws.org"
  , "ledge-cli.org" -- NOTE(review): possibly a typo of "ledger-cli.org" (next entry) — confirm
  , "ledger-cli.org"
  , "lesswrong.com"
  , "lettersofnote.com"
  , "libgen.li"
  , "lifescivc.com"
  , "lithub.com"
  , "longitudinal.blog"
  , "longtermrisk.org"
  , "lucumr.pocoo.org"
  , "magazine.atavist.com"
  , "magenta.tensorflow.org"
  , "mailchi.mp"
  , "mail.haskell.org"
  , "mako.cc"
  , "mason.gmu.edu"
  , "mathbabe.org"
  , "mathshistory.st-andrews.ac.uk"
  , "mathworld.wolfram.com"
  , "mattlakeman.org"
  , "mattmahoney.net"
  , "mc-stan.org"
  , "meta.wikimedia.org"
  , "meteuphoric.com"
  , "metropolitician.blogs.com"
  , "michaelnielsen.org"
  , "mikepower.pressfolios.com"
  , "milan.cvitkovic.net"
  , "minimaxir.com"
  , "mitpress.mit.edu"
  , "mkv25.net"
  , "ml.berkeley.edu"
  , "mmlab.ie.cuhk.edu.hk"
  , "mssv.net"
  , "my.pgp-hms.org"
  , "my.vanderbilt.edu"
  , "nautil.us"
  , "www.nbc-2.com"
  , "ncase.me"
  , "neurosciencenews.com"
  , "newcriterion.com"
  , "news.nationalgeographic.com"
  , "ngm.nationalgeographic.com"
  , "nickbostrom.com"
  , "nintil.com"
  , "nootropicsdepot.com"
  , "norvig.com"
  , "notes.pinboard.in"
  , "numinous.productions"
  , "nunosempere.com"
  , "nymag.com"
  , "ohtori.nu"
  , "okmij.org"
  , "online.wsj.com"
  , "ooo.ghostbows.ooo"
  , "opinionator.blogs.nytimes.com"
  , "originstamp.com"
  , "orionmagazine.org"
  , "orwell.ru"
  , "oscarbonilla.com"
  , "ourworldindata.org"
  , "packdeps.haskellers.com"
  , "palmerlab.org"
  , "pandoc.org"
  , "papers.ssrn.com"
  , "parahumans.wordpress.com"
  , "parametric.press"
  , "parti.research.google"
  , "patrickcollison.com"
  , "paulfchristiano.com"
  , "pdfs.semanticscholar.org"
  , "penelope.uchicago.edu"
  , "people.com"
  , "people.csail.mit.edu"
  , "people.idsia.ch"
  , "personalitytest.net"
  , "personal.math.ubc.ca"
  , "petertodd.org"
  , "pinboard.in"
  , "plato.stanford.edu"
  , "playground.tensorflow.org"
  , "politicalcalculations.blogspot.com"
  , "popcon.ubuntu.com"
  , "proceedings.mlr.press"
  , "programme.exordo.com"
  , "progressstudies.school"
  , "projects.jsonline.com"
  , "projects.tampabay.com"
  , "psychcentral.com"
  , "psych.hanover.edu"
  , "psychonautwiki.org"
  , "publishing.cdlib.org"
  , "pudding.cool"
  , "pytorch.org"
  , "qualiacomputing.com"
  , "quantifiedself.com"
  , "quantum.country"
  , "queue.acm.org"
  , "quillette.com"
  , "quinndunki.com"
  , "qwantz.com"
  , "r6.ca"
  , "racket-lang.org"
  , "radiolab.org"
  , "ralphmerkle.com"
  , "rationality.org"
  , "rdiff-backup.net"
  , "read-the-samples.netlify.app"
  , "reflectivedisequilibrium.blogspot.com"
  , "replicationindex.com"
  , "retractionwatch.com"
  , "ricon.dev"
  , "rjlipton.com"
  , "blog.rootsofprogress.org"
  , "row1.ca"
  , "safebooru.org"
  , "samoburja.com"
  , "scale.com"
  , "scarybeastsecurity.blogspot.com"
  , "scholars-stage.org"
  , "schoolgirlmilkycrisis.com"
  , "sciencebasedmedicine.org"
  , "sciencebulletin.org"
  , "science.ksc.nasa.gov"
  , "scientistatwork.blogs.nytimes.com"
  , "scottaaronson.blog"
  , "seths.blog"
  , "sevensecularsermons.org"
  , "sf-encyclopedia.com"
  , "shiny.app"
  , "shkspr.mobi"
  , "sifter.org"
  , "signalvnoise.com"
  , "slatestarcodex.com"
  , "slimemoldtimemold.com"
  , "socghop.appspot.com"
  , "socialsciences.mcmaster.ca"
  , "soranews24.com"
  , "spikejapan.wordpress.com"
  , "spp.fas.org"
  , "srconstantin.wordpress.com"
  , "sre.google"
  , "stats.grok.se"
  , "status451.com"
  , "stephenmalina.com"
  , "stevenson.lab.uconn.edu"
  , "story.californiasunday.com"
  , "stratechery.com"
  , "strategy.wikimedia.org"
  , "svilentodorov.xyz"
  , "synapse.koreamed.org"
  , "taooftea.com"
  , "teageegeepea.tripod.com"
  , "texample.net"
  , "text.npr.org"
  , "thebaffler.com"
  , "thebrowser.com"
  , "thegrandnarrative.com"
  , "thehardestscience.com"
  , "thelastpsychiatrist.com"
  , "the-liliquarium.livejournal.com"
  , "thenewstatistics.com"
  , "the-toast.net"
  , "thisanimedoesnotexist.ai"
  , "thiseyedoesnotexist.com"
  , "thisrentaldoesnotexist.com"
  , "thoughtcrime.crummy.com"
  , "threadreaderapp.com"
  , "time.com"
  , "tomcritchlow.com"
  , "tools.wmflabs.org"
  , "tosche.net"
  , "training.kalzumeus.com"
  , "transformer-circuits.pub"
  , "trixter.oldskool.org"
  , "tug.org"
  , "unenumerated.blogspot.com"
  , "unqualified-reservations.blogspot.com"
  , "unsongbook.com"
  , "upload.wikimedia.org"
  , "vasilishynkarenka.com"
  , "vastabrupt.com"
  , "vast.ai"
  , "vdfresearch.org"
  , "venturebeat.com"
  , "vfxblog.com"
  , "videolectures.net"
  , "vinoshipper.com"
  , "warontherocks.com"
  , "washingtonmonthly.com"
  , "w.atwiki.jp"
  , "wavemotioncannon.com"
  , "wayback.archive-it.org"
  , "web.archive.org"
  , "webcitation.org"
  , "web.media.mit.edu"
  , "web.stanford.edu"
  , "well.blogs.nytimes.com"
  , "whyevolutionistrue.com"
  , "wiki.haskell.org"
  , "wiki.lesswrong.com"
  , "wikimediafoundation.org"
  , "writeswith.com"
  , "writings.stephenwolfram.com"
  , "www6.austlii.edu.au"
  , "www.abcb.com"
  , "www.aboutamazon.com"
  , "www.adamsmith.org"
  , "www.adelaidenow.com.au"
  , "www.aging-us.com"
  , "www.aiweirdness.com"
  , "www.alcor.org"
  , "www.aleph.se"
  , "www.alessonislearned.com"
  , "www.alexirpan.com"
  , "www.alicemaz.com"
  , "www.alignmentforum.org"
  , "www.allencheng.com"
  , "www.antipope.org"
  , "archive-it.org"
  , "www.artnome.com"
  , "www.baka-tsuki.org"
  , "www.baltimoresun.com"
  , "www.becker-posner-blog.com"
  , "www.belfasttelegraph.co.uk"
  , "www.bemmu.com"
  , "www.benkuhn.net"
  , "www.bitsaboutmoney.com"
  , "www.bostonglobe.com"
  , "www.brainpreservation.org"
  , "www.brookings.edu"
  , "www.bu.edu"
  , "www.businessweek.com"
  , "www.buzzricksons.jp"
  , "www.c82.net"
  , "www.candyjapan.com"
  , "www.catalogtree.net"
  , "www.cato-unbound.org"
  , "www.cbsnews.com"
  , "www.cdc.gov"
  , "www.chicagotribune.com"
  , "www.chinadaily.com.cn"
  , "www.chrisplaysgames.com"
  , "www.chrisstucchio.com"
  , "www.cjas.org"
  , "www.cleveland.com"
  , "www.cnn.com"
  , "www.coderelay.io"
  , "www.cogmed.com"
  , "www.collectorsweekly.com"
  , "www.couriermail.com.au"
  , "www.cryonicscalculator.com"
  , "www.cs.dartmouth.edu"
  , "www-cs-faculty.stanford.edu"
  , "www.cs.odu.edu"
  , "www.cs.toronto.edu"
  , "www.cs.virginia.edu"
  , "www.culhwch.info"
  , "www.cylab.cmu.edu"
  , "www.daemonology.net"
  , "www.dafont.com"
  , "www.dailydot.com"
  , "www.dailymail.co.uk"
  , "www.dartmouth.edu"
  , "www.davidbordwell.net"
  , "www.davidbrin.com"
  , "www.deeplearningbook.org"
  , "www.deseret.com"
  , "www.discoverteas.com"
  , "www.doc88.com"
  , "www.drmaciver.com"
  , "www.e-codices.unifr.ch"
  , "www.ecologyandsociety.org"
  , "www.econlib.org"
  , "www.economist.com"
  , "www.econtalk.org"
  , "www.eduref.net"
  , "www.edwardtufte.com"
  , "www.equator-network.org"
  , "www.equestriadaily.com"
  , "www.eugenewei.com"
  , "www.evamonkey.com"
  , "www.evaotaku.com"
  , "www.explainxkcd.com"
  , "www.fadedpage.com"
  , "www.fast.ai"
  , "www.fhi.ox.ac.uk"
  , "www.filfre.net"
  , "www.find-more-books.com"
  , "www.freakonomicsexperiments.com"
  , "www.ft.com"
  , "www.galbithink.org"
  , "gawker.com"
  , "www.genealogy.math.ndsu.nodak.edu"
  , "www.ghibli.jp"
  , "www.globalsecurity.org"
  , "www.gnxp.com"
  , "www.gq.com"
  , "www.grandforksherald.com"
  , "www.greaterwrong.com"
  , "www.gutenberg.org"
  , "www.harrowell.org.uk"
  , "www.hbs.edu"
  , "www.heraldsun.com.au"
  , "www.hsx.com"
  , "www.html-tidy.org"
  , "www.independent.ie"
  , "www.infranken.de"
  , "www.inkandswitch.com"
  , "www.intechopen.com"
  , "www.itmedia.co.jp"
  , "www.jamesfadiman.com"
  , "www.japaninc.com"
  , "www.jdmoyer.com"
  , "www.jefftk.com"
  , "www.joelonsoftware.com"
  , "www.johndcook.com"
  , "www.johnsonessays.com"
  , "www.justinpinkney.com"
  , "www.kalzumeus.com"
  , "www.kooslooijesteijn.net"
  , "www.koreatimes.co.kr"
  , "www.lehighvalleylive.com"
  , "www.lesswrong.com"
  , "www.livestrong.com"
  , "www.mail-archive.com"
  , "www.math.uwaterloo.ca"
  , "www.mcall.com"
  , "www.mediawiki.org"
  , "www.mentalfloss.com"
  , "www.mercurynews.com"
  , "www.metafor-project.org"
  , "www.metopera.org"
  , "www.metzdowd.com"
  , "www.miamiherald.com"
  , "www.michaellight.net"
  , "www.microdose.me"
  , "www.moserware.com"
  , "www.motherjones.com"
  , "www.nationalgeographic.com"
  , "www.nbcnews.com"
  , "www.newsday.com"
  , "www.nextbigfuture.com"
  , "www.nextplatform.com"
  , "www.noisebridge.net"
  , "www.nplusonemag.com"
  , "www.npr.org"
  , "www.nps.gov"
  , "www.nyaa.eu"
  , "www.nydailynews.com"
  , "www.ohyouprettythings.com"
  , "www.orbuch.com"
  , "www.oregonlive.com"
  , "www.oricon.co.jp"
  , "www.orlandosentinel.com"
  , "www.owenstephens.co.uk"
  , "www.palladiummag.com"
  , "www.pcmag.com"
  , "www.pewresearch.org"
  , "www.poetryfoundation.org"
  , "www.popsci.com"
  , "www.pragmatic.ml"
  , "www.prolific.com"
  , "www.psychiatryinvestigation.org"
  , "www.punchlinedesign.net"
  , "www.rationaloptimist.com"
  , "www.r-bloggers.com"
  , "www.rdocumentation.org"
  , "www.reg.ru"
  , "www.rfreitas.com"
  , "www.ribbonfarm.com"
  , "www.richardcarrier.info"
  , "www.rifters.com"
  , "www.righto.com"
  , "www.ruder.io"
  , "www.rwagner.net"
  , "www.rxshop.md"
  , "www.sacbee.com"
  , "www.salon.com"
  , "news.sankakucomplex.com"
  , "www.sapa-project.org"
  , "www.schneier.com"
  , "www.scielo.br"
  , "www.scienceagogo.com"
  , "www.sciencemadness.org"
  , "www.sciencenews.org"
  , "www.scottaaronson.com"
  , "www.sfgate.com"
  , "www.shawlocal.com"
  , "www.shawwn.com"
  , "www.silverhandmeadery.com"
  , "www.simplify.so"
  , "www.sirlin.net"
  , "www.slate.com"
  , "www.sleep-journal.com"
  , "www.snpedia.com"
  , "www.spiegel.de"
  , "www.spiked-online.com"
  , "www.spring.org.uk"
  , "www.sqlite.org"
  , "www.ssc.wisc.edu"
  , "www.standard.co.uk"
  , "www.stat.columbia.edu"
  , "www.straighttalkonevidence.org"
  , "www.stripes.com"
  , "www.stuff.co.nz"
  , "www.sumsar.net"
  , "www.sun-modalert.com"
  , "www.syracuse.com"
  , "www.systutorials.com"
  , "talyarkoni.org"
  , "www.tarsnap.com"
  , "www.thebeliever.net"
  , "www.thecut.com"
  , "www.thedenverchannel.com"
  , "www.thefreelibrary.com"
  , "www.theindiaforum.in"
  , "www.themtank.org"
  , "www.theregister.com"
  , "www.thesmokinggun.com"
  , "www.thestranger.com"
  , "www.thisfursonadoesnotexist.com"
  , "www.thispersondoesnotexist.com"
  , "www.thiswaifudoesnotexist.net"
  , "www.thisworddoesnotexist.com"
  , "www.thriftbooks.com"
  , "www.tlmc.eu"
  , "tomodachi.de"
  , "www.tor.com"
  , "www.tranquiltuesdays.com"
  , "www.trentonbricken.com"
  , "www.trubrain.com"
  , "www.tt-forums.net"
  , "www.ubu.com"
  , "www.uk-anime.net"
  , "www.uliwestphal.de"
  , "www.unc.edu"
  , "www.unicode.org"
  , "www.unqualified-reservations.org"
  , "www.unz.com"
  , "www.urbandharma.org"
  , "www.urbandictionary.com"
  , "www.usnews.com"
  , "www.vanityfair.com"
  , "www.vesta.earth"
  , "www.vetta.org"
  , "www.vocativ.com"
  , "www.wakapoetry.net"
  , "www.washingtontimes.com"
  , "www.webmd.com"
  , "www.wheels.org"
  , "www.whichfaceisreal.com"
  , "www.winehq.org"
  , "www.wired.com"
  , "www.wired.co.uk"
  , "www.wolfewiki.com"
  , "www.writingroutines.com"
  , "www.yalelawjournal.org"
  , "www.yf.io"
  , "www.yourdictionary.com"
  , "www.yudkowsky.net"
  , "www.zeit.de"
  , "xkcd.com"
  , "xtools.wmflabs.org"
  , "zlkj.in"
  , "researchers.wls.wisc.edu"
  , "mitp-content-server.mit.edu"
  , "dialnet.unirioja.es"
  , "www.princeton.edu"
  , "sites.temple.edu"
  , "ai.stanford.edu"
  , "alexdanco.com"
  , "andyljones.com"
  , "bayesianinvestor.com"
  , "blog.samaltman.com"
  , "books.worksinprogress.co"
  , "carryiton.net"
  , "colinraffel.com"
  , "conversationswithtyler.com"
  , "cs.nyu.edu"
  , "danijar.com"
  , "dataverse.harvard.edu"
  , "geminiprotocol.net"
  , "gigamonkeys.com"
  , "internetshakespeare.uvic.ca"
  , "jack-clark.net"
  , "maggieappleton.com"
  , "nlp.stanford.edu"
  , "ocw.mit.edu"
  , "oeis.org"
  , "paulgraham.com"
  , "psychclassics.yorku.ca"
  , "senseis.xmp.net"
  , "verdagon.dev"
  , "waitbutwhy.com"
  , "wordcraft-writers-workshop.appspot.com"
  , "www.centauri-dreams.org"
  , "www.cerebras.net"
  , "www.cognition.ai"
  , "www.cryonicsarchive.org"
  , "www.cs.cmu.edu"
  , "www.feynmanlectures.caltech.edu"
  , "www.folger.edu"
  , "www.hustwit.com"
  , "www.icpsr.umich.edu"
  , "www.mattridley.co.uk"
  , "www.semafor.com"
  , "www.spencergreenberg.com"
  , "www8.austlii.edu.au"
  , "dynomight.net"
  , "sander.ai"
  , "www.chiark.greenend.org.uk"
  , "acoup.blog"
  , "static.googleusercontent.com"
  , "blondihacks.com"
  ]

-- Domain patterns with a leading dot, on the "bad" side of the good/bad split.
-- NOTE(review): presumably matched as host-name suffixes (ie. any subdomain)
-- and treated as unsuitable for live popups — confirm against the consumer.
badDomainsSub =
  setLike
    [ ".plos.org"
    , ".royalsocietypublishing.org"
    , ".substack.com"
    , ".stackexchange.com"
    , ".oxfordjournals.org"
    , ".medium.com"
    , ".translate.goog"
    ]
badDomainsSimple = setLike ["2chan.us"
   , "1d4chan.org"
   , "5onwnspjvuk7cwvk.tor2web.org"
   , "a16z.com"
   , "abebooks.com"
   , "about.netflix.com"
   , "academia.edu"
   , "adage.com"
   , "addons.mozilla.org"
   , "advancedfertility.com"
   , "aeon.co"
   , "ai-alignment.com"
   , "aidungeon.medium.com"
   , "ai.meta.com"
   , "ajcn.nutrition.org"
   , "ajph.aphapublications.org"
   , "ajp.psychiatryonline.org"
   , "aka.ms"
   , "almanac.httparchive.org"
   , "amstat.tandfonline.com"
   , "andrewbadr.com"
   , "anidb.net"
   , "animesuperhero.com"
   , "ankiweb.net"
   , "annals.org"
   , "answers.google.com"
   , "antilop.cc"
   , "apastyle.apa.org"
   , "api.research-repository.uwa.edu.au"
   , "app.inferkit.com"
   , "apps.ankiweb.net"
   , "apps.apple.com"
   , "apps.dtic.mil"
   , "arbital.com"
   , "archinte.ama-assn.org"
   , "archive.foolz.us"
   , "archive.ilr.cornell.edu"
   , "archive.is"
   , "archiveofourown.org"
   , "archive-ouverte.unige.ch"
   , "archive.recapthelaw.org"
   , "archives.haskell.org"
   , "archpsyc.ama-assn.org"
   , "arstechnica.com"
   , "artbreeder.com"
   , "arxiv.org"
   , "arxiv-vanity.com"
   , "ascii.textfiles.com"
   , "ase.uva.nl"
   , "www.astralcodexten.com"
   , "augmentingcognition.com"
   , "au.news.yahoo.com"
   , "aur.archlinux.org"
   , "aurellem.org"
   , "aws.amazon.com"
   , "azure.microsoft.com"
   , "babel.hathitrust.org"
   , "bactra.org"
   , "bakabt.me"
   , "bam-dataset.org"
   , "bartokdesign.com"
   , "bastiat.org"
   , "bayes.wustl.edu"
   , "beautifultaiwantea.com"
   , "beerconnoisseur.com"
   , "bellroy.com"
   , "benbest.com"
   , "berkshirehathaway.com"
   , "beta.openai.com"
   , "betsofbitco.in"
   , "betterhumans.coach.me"
   , "betterworldbooks.com"
   , "bgr.com"
   , "bibliophilly.library.upenn.edu"
   , "bifunctor.homelinux.net"
   , "bigquery.cloud.google.com"
   , "bioinfo.pl"
   , "biomedcentral.com"
   , "bitbucket.org"
   , "bitcoincharts.com"
   , "bitcoins-code.de"
   , "bitcointalk.org"
   , "bit-player.org"
   , "bjo.bmj.com"
   , "bjp.rcpsych.org"
   , "bjsm.bmj.com"
   , "blockchain.info"
   , "blog.23andme.com"
   , "blog.dansimons.com"
   , "blog.darcs.net"
   , "blog.darknedgy.net"
   , "blog.fc2.com"
   , "blog.johantibell.com"
   , "blog.ml.cmu.edu"
   , "blog.mozilla.org"
   , "blog.nuclino.com"
   , "blog.platypope.org"
   , "blog.sigfpe.com"
   , "blogs.microsoft.com"
   , "blogs.nature.com"
   , "blogs.nvidia.com"
   , "blogs.princeton.edu"
   , "blogs.scientificamerican.com"
   , "blog.torproject.org"
   , "blog.x.com"
   , "bluelight.org"
   , "bmcmedresmethodol.biomedcentral.com"
   , "bmcneurosci.biomedcentral.com"
   , "bmcpublichealth.biomedcentral.com"
   , "bmcvetres.biomedcentral.com"
   , "boardgamegeek.com"
   , "boa.unimib.it"
   , "boinngerionn.blog.fc2.com"
   , "book.realworldhaskell.org"
   , "books.google.com"
   , "book.webtypography.net"
   , "boston.conman.org"
   , "brainworkshop.sourceforge.net"
   , "bsapubs.onlinelibrary.wiley.com"
   , "buddhism-for-vampires.com"
   , "bugs.darcs.net"
   , "bugs.debian.org"
   , "bugs.launchpad.net"
   , "buttercupfestival.com"
   , "cabinetmagazine.org"
   , "caes.ucdavis.edu"
   , "calhoun.nps.edu"
   , "camelcamelcamel.com"
   , "capitalteas.com"
   , "capsuleconnection.com"
   , "case.edu"
   , "casetext.com"
   , "catb.org"
   , "catless.ncl.ac.uk"
   , "ccc.de"
   , "cdm16630.contentdm.oclc.org"
   , "cep.lse.ac.uk"
   , "cfa.org"
   , "chrome.google.com"
   , "chroniclingamerica.loc.gov"
   , "chronopause.com"
   , "ciechanow.ski"
   , "circ.ahajournals.org"
   , "cis.org"
   , "citeseerx.ist.psu.edu"
   , "clagnut.com"
   , "clarkesworldmagazine.com"
   , "clickotron.com"
   , "clinicalepigeneticsjournal.biomedcentral.com"
   , "clinicaltrials.gov"
   , "cloud.google.com"
   , "code.google.com"
   , "code.visualstudio.com"
   , "colab.research.google.com"
   , "collections.library.yale.edu"
   , "collider.com"
   , "comicsalliance.com"
   , "community.arm.com"
   , "community.haskell.org"
   , "console.aws.amazon.com"
   , "console.cloud.google.com"
   , "corante.com"
   , "core.ac.uk"
   , "cosmosmagazine.com"
   , "course.fast.ai"
   , "coveryourtracks.eff.org"
   , "creativecommons.org"
   , "creyos.com"
   , "cro.sagepub.com"
   , "cryptome.org"
   , "crypto.stackexchange.com"
   , "cse.google.com"
   , "csimq-journals.rtu.lv"
   , "csrc.nist.gov"
   , "ctc.usma.edu"
   , "cyber.harvard.edu"
   , "dailyvoice.com"
   , "dalspace.library.dal.ca"
   , "danbooru.donmai.us"
   , "danfrank.ca"
   , "darcs.net"
   , "darkdata.bc.edu"
   , "darknetlive.com"
   , "darwin-online.org.uk"
   , "datasetsearch.research.google.com"
   , "data.worldbank.org"
   , "de1.erowid.org"
   , "deadline.com"
   , "deadspin.com"
   , "dee.su"
   , "dept.wofford.edu"
   , "derpibooru.org"
   , "devblogs.microsoft.com"
   , "developer.mozilla.org"
   , "developer.nvidia.com"
   , "developer.x.com"
   , "dev.kanotype.net"
   , "dharmaoverground.org"
   , "digitalcommons.unl.edu"
   , "discord.com"
   , "disease-connect.org"
   , "dl.acm.org"
   , "dl.dropboxusercontent.com"
   , "dnd.wizards.com"
   , "docs.microsoft.com"
   , "donate.torproject.org"
   , "drive.google.com"
   , "droitwichstandard.co.uk"
   , "drugs-forum.com"
   , "dspace.mit.edu"
   , "dual-n-back.com"
   , "duckduckgo.com"
   , "duolingo.com"
   , "duplicity.nongnu.org"
   , "dzone.com"
   , "e621.net"
   , "eab.sagepub.com"
   , "economics.stanford.edu"
   , "econ.vt.edu"
   , "ec.toranoana.jp"
   , "ectoranoana.jp"
   , "eepurl.com"
   , "eg-2.hatenablog.com"
   , "ehp.niehs.nih.gov"
   , "eiga.com"
   , "ejlt.org"
   , "elifesciences.org"
   , "emacswiki.org"
   , "eml.berkeley.edu"
   , "en.chessbase.com"
   , "endlessvn.io"
   , "eng.uber.com"
   , "en.touhouwiki.net"
   , "environhealthprevmed.biomedcentral.com"
   , "en.wik%20ipedia.org"
   , "en.wikip%20edia.org"
   , "eprints.lincoln.ac.uk"
   , "eprints.nottingham.ac.uk"
   , "eprints.whiterose.ac.uk"
   , "ergodox-ez.com"
   , "eric.ed.gov"
   , "ero.sagepub.com"
   , "erowid.org"
   , "esajournals.onlinelibrary.wiley.com"
   , "escholarship.org"
   , "espace.library.uq.edu.au"
   , "esr.ibiblio.org"
   , "ethics.emory.edu"
   , "ethos.bl.uk"
   , "eth.wiki"
   , "eurekamag.com"
   , "eurfa.org.uk"
   , "eva.onegeek.org"
   , "everyoneishappy.com"
   , "everything2.com"
   , "every.to"
   , "evigio.com"
   , "examine.com"
   , "exrx.net"
   , "eztest.com"
   , "f1000research.com"
   , "faculty.virginia.edu"
   , "fdaaa.trialstracker.net"
   , "feeds.feedburner.com"
   , "fifteen.ai"
   , "fightaging.org"
   , "finance.yahoo.com"
   , "fis.fda.gov"
   , "fivethirtyeight.com"
   , "flatisjustice.moe"
   , "floatingleaves.com"
   , "fn.bmj.com"
   , "fnb.sagepub.com"
   , "folding.stanford.edu"
   , "folkrnn.org"
   , "fontsinuse.com"
   , "food52.com"
   , "fortune.com"
   , "forums.somethingawful.com"
   , "fred.stlouisfed.org"
   , "freedom-to-tinker.com"
   , "fs.blog"
   , "ftp.cs.ucla.edu"
   , "fursona.app"
   , "gainax.co.jp"
   , "gainax.fr"
   , "gallica.bnf.fr"
   , "gazette.com"
   , "gcta.freeforums.net"
   , "geneatlas.roslin.ed.ac.uk"
   , "genepi.qimr.edu.au"
   , "geneticalliance.org.uk"
   , "genius.com"
   , "genomebiology.biomedcentral.com"
   , "genomemedicine.biomedcentral.com"
   , "georgianjournal.ge"
   , "geroprotectors.org"
   , "getd.libs.uga.edu"
   , "getlamp.com"
   , "gettermario.dynamicforum.net"
   , "gigaom.com"
   , "gigascience.biomedcentral.com"
   , "gigazine.net"
   , "gist.github.com"
   , "gitcoin.co"
   , "gitgud.io"
   , "github.com"
   , "git.io"
   , "gitlab.com"
   , "gitlab.developers.cam.ac.uk"
   , "gitlab.haskell.org"
   , "gitlab.torproject.org"
   , "git-scm.com"
   , "gizmodo.com"
   , "glench.com"
   , "gmane.org"
   , "godanriver.com"
   , "goo.gl"
   , "goproblems.com"
   , "gptprompts.wikidot.com"
   , "granta.com"
   , "grantland.com"
   , "greekreporter.com"
   , "groups.google.com"
   , "groups.yahoo.com"
   , "gsejournal.biomedcentral.com"
   , "gwern.shinyapps.io"
   , "h01-dot-neuroglancer-demo.appspot.com"
   , "habr.com"
   , "hacks.mozilla.org"
   , "hal.science"
   , "handbook.cochrane.org"
   , "hansard.parliament.uk"
   , "hardcoresoftware.learningbyshipping.com"
   , "harmreductionjournal.biomedcentral.com"
   , "hashcat.net"
   , "haveibeenpwned.com"
   , "hazuma.hatenablog.com"
   , "hbr.org"
   , "hcommons.org"
   , "help.duckduckgo.com"
   , "history.nasa.gov"
   , "hivemind-repo.s3-us-west-2.amazonaws.com"
   , "hn.algolia.com"
   , "hn-sicp.pbworks.com"
   , "hoaxes.org"
   , "hollisarchives.lib.harvard.edu"
   , "home.inklingmarkets.com"
   , "homepage3.nifty.com"
   , "hoogle.haskell.org"
   , "host.robots.ox.ac.uk"
   , "hrcak.srce.hr"
   , "httparchive.org"
   , "huggingface.co"
   , "hum.sagepub.com"
   , "hutter1.net"
   , "icosahedron.website"
   , "ideas.4brad.com"
   , "ide.mit.edu"
   , "ieeexplore.ieee.org"
   , "if50.substack.com"
   , "ignorethecode.net"
   , "i.imgur.com"
   , "ije.oxfordjournals.org"
   , "ilovetypography.com"
   , "imagelibrary.bgu.ac.il"
   , "images.google.com"
   , "imgur.com"
   , "inews.co.uk"
   , "infidels.org"
   , "informallogic.ca"
   , "inklingmarkets.com"
   , "interviews.slashdot.org"
   , "intrade.com"
   , "iopscience.iop.org"
   , "iqout.com"
   , "iqtest.com"
   , "iqtest.dk"
   , "irs.princeton.edu"
   , "isfdb.org"
   , "iterative.capital"
   , "itre.cis.upenn.edu"
   , "it.slashdot.org"
   , "jacobsschool.ucsd.edu"
   , "jacurutu.com"
   , "jalopnik.com"
   , "jamestown.org"
   , "japanintercultural.com"
   , "jasbsci.biomedcentral.com"
   , "jcsm.aasm.org"
   , "jidinews.com"
   , "jigsaw.w3.org"
   , "jme.bmj.com"
   , "jnnp.bmj.com"
   , "jn.nutrition.org"
   , "johakyu.net"
   , "joshmitteldorf.scienceblog.com"
   , "jotengine.com"
   , "journals.ametsoc.org"
   , "journals.lww.com"
   , "journals.physiology.org"
   , "journals.sagepub.com"
   , "journaltimes.com"
   , "jpet.aspetjournals.org"
   , "jukebox.openai.com"
   , "justpaste.it"
   , "jwz.org"
   , "jyllands-posten.dk"
   , "kanzaki.sub.jp"
   , "kettl.co"
   , "kilthub.cmu.edu"
   , "knowyourmeme.com"
   , "koeln.ccc.de"
   , "kotaku.com"
   , "kyunghyuncho.me"
   , "lacbzxobeprssrfx.onion"
   , "lair.lighton.ai"
   , "lareviewofbooks.org"
   , "latanyasweeney.org"
   , "latimesblogs.latimes.com"
   , "latitude.io"
   , "ldsc.broadinstitute.org"
   , "leaderboard.allenai.org"
   , "leaps.org"
   , "learn.adafruit.com"
   , "learnyouahaskell.com"
   , "leme.me"
   , "letterformarchive.org"
   , "letters.temporarystate.net"
   , "libgen.org"
   , "library.bz"
   , "lichess.org"
   , "liebertpub.com"
   , "link.springer.com"
   , "linuxmafia.com"
   , "listserv.brown.edu"
   , "lists.urth.net"
   , "lists.wikimedia.org"
   , "listudy.org"
   , "lizadaly.com"
   , "lobste.rs"
   , "longbets.org"
   , "longnow.org"
   , "longreads.com"
   , "lostpinesyaupontea.com"
   , "lukemuehlhauser.com"
   , "lwn.net"
   , "machinelearning.apple.com"
   , "make.girls.moe"
   , "mangans.blogspot.com"
   , "marco.org"
   , "martinottaway.com"
   , "mathoverflow.net"
   , "math.stackexchange.com"
   , "mattsclancy.substack.com"
   , "mayoclinicproceedings.org"
   , "mbio.asm.org"
   , "meaningness.com"
   , "media.ccc.de"
   , "media.githubusercontent.com"
   , "media.nature.com"
   , "media.springernature.com"
   , "medicine.osu.edu"
   , "medieval.bodleian.ox.ac.uk"
   , "medium.com"
   , "medlineplus.gov"
   , "medsforbitcoin.com"
   , "meehl.umn.edu"
   , "mega.nz"
   , "meltingasphalt.com"
   , "messybeast.com"
   , "metacpan.org"
   , "metrics.torproject.org"
   , "millercenter.org"
   , "millionshort.com"
   , "mnemosyne-proj.org"
   , "money.cnn.com"
   , "mosaicscience.com"
   , "motherboard.vice.com"
   , "moz.com"
   , "mpra.ub.uni-muenchen.de"
   , "mru.org"
   , "mujoco.org"
   , "myanimelist.net"
   , "mymodafinil.net"
   , "mysbfiles.stonybrook.edu"
   , "naldc.nal.usda.gov"
   , "nansenundpiccard.de"
   , "nationalinterest.org"
   , "nces.ed.gov"
   , "nearcyan.com"
   , "nearlyfreespeech.net"
   , "nebia.com"
   , "nectarcreek.com"
   , "neomarxisme.com"
   , "neuralnetworksanddeeplearning.com"
   , "cognitivefun.net"
   , "newegg.com"
   , "newhumanist.org.uk"
   , "new.nubrain.com"
   , "newrepublic.com"
   , "news.bbc.co.uk"
   , "news.gallup.com"
   , "news.harvard.edu"
   , "news.mit.edu"
   , "newsroom.collegeboard.org"
   , "news.samsung.com"
   , "news.slashdot.org"
   , "news.yahoo.com"
   , "news.ycombinator.com"
   , "nicovideo.jp"
   , "nitro.biosci.arizona.edu"
   , "nitter.net"
   , "nixnote.org"
   , "nmteaco.com"
   , "n.neurology.org"
   , "nori.com"
   , "noscript.net"
   , "npc.people.com.cn"
   , "nrl.northumbria.ac.uk"
   , "nutritionj.biomedcentral.com"
   , "nypost.com"
   , "ods.od.nih.gov"
   , "oglaf.com"
   , "old.reddit.com"
   , "oll.libertyfund.org"
   , "omdia.tech.informa.com"
   , "omega0.xyz"
   , "omega.albany.edu:8008"
   , "onlinelibrary.wiley.com"
   , "openai.com"
   , "openaipublic.blob.core.windows.net"
   , "openreview.net"
   , "opensnp.org"
   , "opensource.org"
   , "orbis.stanford.edu"
   , "orbit.dtu.dk"
   , "osf.io"
   , "osnadocs.ub.uni-osnabrueck.de"
   , "otago.ourarchive.ac.nz"
   , "ourstarblazers.com"
   , "p2pfoundation.ning.com"
   , "packages.debian.org"
   , "pages.jh.edu"
   , "pain.wustl.edu"
   , "papers.nips.cc"
   , "paperswithcode.com"
   , "par.nsf.gov"
   , "partner.steamgames.com"
   , "pastebin.com"
   , "paste.laravel.io"
   , "patch.com"
   , "patch-tag.com"
   , "patents.google.com"
   , "pay.reddit.com"
   , "pcdb.santafe.edu"
   , "pcpartpicker"
   , "pcpartpicker.com"
   , "peerj.com"
   , "people.tamu.edu"
   , "perma.cc"
   , "permalink.gmane.org"
   , "phabricator.wikimedia.org"
   , "pharmacyreviewer.co"
   , "pharmrev.aspetjournals.org"
   , "philarchive.org"
   , "philsci-archive.pitt.edu"
   , "physics.aps.org"
   , "physicstoday.scitation.org"
   , "physoc.onlinelibrary.wiley.com"
   , "pingpong.ki.se"
   , "pioneer.app"
   , "pirate.london"
   , "pixelpoppers.com"
   , "pjreddie.com"
   , "play.aidungeon.io"
   , "player.vimeo.com"
   , "play.google.com"
   , "plaza.harmonix.ne.jp"
   , "plos"
   , "pluralsight.com"
   , "plus.google.com"
   , "pni.princeton.edu"
   , "poemanalysis.com"
   , "poets.org"
   , "pol.is"
   , "polisen.se"
   , "politicalscience.osu.edu"
   , "pone.dev"
   , "popcon.debian.org"
   , "popsych.org"
   , "poststar.com"
   , "pps.sagepub.com"
   , "practicaltypography.com"
   , "precedings.nature.com"
   , "predictionbook.com"
   , "press.etc.cmu.edu"
   , "priceonomics.com"
   , "prisons.org.uk"
   , "prize.hutter1.net"
   , "proceedings.neurips.cc"
   , "programmablesearchengine.google.com"
   , "projecteuclid.org"
   , "project-rainbowcrack.com"
   , "proofofexistence.com"
   , "psmag.com"
   , "pss.sagepub.com"
   , "psyarxiv.com"
   , "psychology.gatech.edu"
   , "psych.wustl.edu"
   , "psycnet.apa.org"
   , "publicdomainreview.org"
   , "publicsearch.ndcourts.gov"
   , "public.tableau.com"
   , "pubmed.ncbi.nlm.nih.gov"
   , "pubs.acs.org"
   , "pubs.aeaweb.org"
   , "pubsonline.informs.org"
   , "pulitzercenter.org"
   , "pure.au.dk"
   , "pure.tue.nl"
   , "pure.uva.nl"
   , "pure.uvt.nl"
   , "purse.io"
   , "qa.debian.org"
   , "qntm.org"
   , "quadrant.org.au"
   , "qualitysafety.bmj.com"
   , "quoteinvestigator.com"
   , "qz.com"
   , "rachelbythebay.com"
   , "radar.oreilly.com"
   , "radiopublic.com"
   , "raw.githubusercontent.com"
   , "rbej.biomedcentral.com"
   , "rd.springer.com"
   , "readonlymemory.vg"
   , "reason.com"
   , "repec.org"
   , "repository.si.edu"
   , "repository.uel.ac.uk"
   , "repository.upenn.edu"
   , "research.facebook.com"
   , "research.vu.nl"
   , "reset.me"
   , "r-inla.org"
   , "risk-engineering.org"
   , "ro.ecu.edu.au"
   , "royalsocietypublishing.org"
   , "rpubs.com"
   , "rss.onlinelibrary.wiley.com"
   , "runrepeat.com"
   , "samsaffron.com"
   , "scholar.google.com"
   , "scholar.harvard.edu"
   , "scienceblogs.com"
   , "science.nasa.gov"
   , "science.sciencemag.org"
   , "scp-wiki.wikidot.com"
   , "searchengineland.com"
   , "flickr.com"
   , "sembr.org"
   , "sensebridge.net"
   , "serendipityrecs.com"
   , "sethroberts.net"
   , "sgo.sagepub.com"
   , "siepr.stanford.edu"
   , "sigbovik.org"
   , "silkroad5v7dywlc.onion"
   , "silkroadvb5piz3r.onion"
   , "sites.google.com"
   , "sites.research.google"
   , "sive.rs"
   , "skeb.jp"
   , "skeptics.stackexchange.com"
   , "skift.com"
   , "skymind.ai"
   , "slashdot.org"
   , "slate.com"
   , "snopes.com"
   , "sociologicalscience.com"
   , "soundcloud.com"
   , "sourceforge.net"
   , "sparkfun.com"
   , "sparky.haskell.org"
   , "spectrum.ieee.org"
   , "spectrum.library.concordia.ca"
   , "spreadsheets.google.com"
   , "ssgac.org"
   , "sss.sagepub.com"
   , "stability.ai"
   , "stackexchange.com"
   , "stackoverflow.com"
   , "static-content.springer.com"
   , "stats.stackexchange.com"
   , "steamcommunity.com"
   , "stevecoast.com"
   , "store.steampowered.com"
   , "stripe.com"
   , "stroke.ahajournals.org"
   , "studenttheses.universiteitleiden.nl"
   , "subterraneanpress.com"
   , "suffolk.onthehub.com"
   , "summerofcode.withgoogle.com"
   , "sundhedsdatastyrelsen.dk"
   , "super.gluebenchmark.com"
   , "super-memory.com"
   , "superuser.com"
   , "support.google.com"
   , "support.mozilla.org"
   , "support.torproject.org"
   , "swombat.com"
   , "tails.boum.org"
   , "takimag.com"
   , "tasvideos.org"
   , "taylorandfrancis.com"
   , "teahabitat.com"
   , "tealet.com"
   , "techcrunch.com"
   , "tfhub.dev"
   , "thecatsite.com"
   , "thechineseteashop.com"
   , "thecleverest.com"
   , "thecodelesscode.com"
   , "theconversation.com"
   , "thecorrespondent.com"
   , "theeagle.com"
   , "thegradient.pub"
   , "thehub7dnl5nmcz5.onion"
   , "theintercept.com"
   , "themorningnews.org"
   , "thenextweb.com"
   , "thepiratebay.org"
   , "thesecatsdonotexist.com"
   , "thesession.org"
   , "thesocietypages.org"
   , "thessgac.org"
   , "thetakeout.com"
   , "thewebconf.org"
   , "thiscardoesnotexist"
   , "thismarketingblogdoesnotexist.com"
   , "thisponydoesnotexist.net"
   , "thisstorydoesnotexist.com"
   , "thisvesseldoesnotexist.com"
   , "thomasbarker.com"
   , "thoughtbot.com"
   , "tigersophia.blogspot.com"
   , "timarit.is"
   , "timesofindia.indiatimes.com"
   , "tineye.com"
   , "tinyletter.com"
   , "tinyurl.com"
   , "tl.net"
   , "t.ly"
   , "t.me"
   , "tobaccocontrol.bmj.com"
   , "today.yougov.com"
   , "tom7.org"
   , "top500.org"
   , "torch.ch"
   , "torservers.net"
   , "towardsdatascience.com"
   , "translate.google.com"
   , "treasurydirect.gov"
   , "trends.google.com"
   , "trialsjournal.biomedcentral.com"
   , "tribune.com.pk"
   , "truewetsuits.jp"
   , "tryhaskell.org"
   , "tuts4you.com"
   , "tvtropes.org"
   , "tweelingenregister.vu.nl"
   , "x.com"
   , "type-r.hatenablog.com"
   , "ubc-emotionlab.ca"
   , "uberty.org"
   , "uitspraken.rechtspraak.nl"
   , "uk.pi-supply.com"
   , "umichrl.pbworks.com"
   , "undark.org"
   , "understandinguncertainty.org"
   , "unesdoc.unesco.org"
   , "urth.net"
   , "uscourts.gov"
   , "us.dantelabs.com"
   , "usesthis.com"
   , "vanishingpoint.air-nifty.com"
   , "variety.com"
   , "vault.si.com"
   , "vgl.ucdavis.edu"
   , "vgmdb.net"
   , "vimeo.com"
   , "vinecon.ucdavis.edu"
   , "vision-explorer.allenai.org"
   , "vividness.live"
   , "vizhub.healthdata.org"
   , "vk.com"
   , "vndb.org"
   , "voxday.blogspot.com"
   , "waifu2x.udp.jp"
   , "waifulabs.com"
   , "wandb.ai"
   , "warosu.org"
   , "wcfcourier.com"
   , "wci.llnl.gov"
   , "web-archive-org.translate.goog"
   , "web-japan.org"
   , "web.maths.unsw.edu.au"
   , "web.mit.edu"
   , "websitedownloader.io"
   , "wellcomecollection.org"
   , "whatis.suburbansenshi.com"
   , "wiki.evageeks.org"
   , "wolframlpha.com"
   , "wordpress.org"
   , "works.bepress.com"
   , "worrydream.com"
   , "wudao.aminer.cn"
   , "ww2.arb.ca.gov"
   , "www0.us.ioccc.org"
   , "www.1001fonts.com"
   , "www108.lamp.le.ac.uk"
   , "www.1m.co"
   , "www2.bfi.org.uk"
   , "www2.ed.gov"
   , "www2.guidestar.org"
   , "www2.psy.uq.edu.au"
   , "www3.ntu.edu.sg"
   , "www.4nrx-uk.md"
   , "www.aaai.org"
   , "www.aaronsw.com"
   , "www.abbiotec.com"
   , "www.abc10.com"
   , "www.abc.net.au"
   , "www.abebooks.com"
   , "www.abetterpage.com"
   , "www.academia.edu"
   , "www.acpjournals.org"
   , "www.actionnewsnow.com"
   , "www.adafruit.com"
   , "www.advrider.com"
   , "www.aeaweb.org"
   , "www.aei.org"
   , "www.aera.net"
   , "www.afp.gov.au"
   , "www.afr.com"
   , "www.ahajournals.org"
   , "www.aiwriter.email"
   , "www.ajmadison.com"
   , "www.ajnr.org"
   , "www.alchemistowl.org"
   , "www.alljapaneseallthetime.com"
   , "www.alphagomovie.com"
   , "www.alternatehistory.com"
   , "www.alzchem.com"
   , "www.alzforum.org"
   , "www.ama-assn.org"
   , "www.amazon.co.jp"
   , "www.amazon.com"
   , "www.ams.org"
   , "www.anandtech.com"
   , "www.angelfire.com"
   , "www.animenewsnetwork.com"
   , "www.anime-planet.com"
   , "www.annualreviews.org"
   , "www.antonhowes.com"
   , "www.apa.org"
   , "www.arkansasonline.com"
   , "www.arknights.global"
   , "www.army.mil"
   , "www.artbreeder.com"
   , "www.artofmanliness.com"
   , "www.arxiv-vanity.com"
   , "www.atlasobscura.com"
   , "www.atsjournals.org"
   , "www.avalonmagicplants.com"
   , "www.avclub.com"
   , "www.awe.gov.au"
   , "www.backblaze.com"
   , "www.baen.com"
   , "www.baltcoffee.com"
   , "www.barnesandnoble.com"
   , "www.barnstormjournal.org"
   , "www.bartokdesign.com"
   , "www.bbc.com"
   , "www.bbc.co.uk"
   , "www.beelinereader.com"
   , "www.behance.net"
   , "www.belfastlive.co.uk"
   , "www.ben-evans.com"
   , "www.berkshireeagle.com"
   , "www.berkshirehathaway.com"
   , "www.berlin.de"
   , "www.betterworldbooks.com"
   , "www.bfi.org"
   , "www.bfmtv.com"
   , "www-biba.inrialpes.fr"
   , "www.biorxiv.org"
   , "www.birminghammail.co.uk"
   , "www.bizjournals.com"
   , "www.blender.org"
   , "www.blockchain.com"
   , "www.blog.sethroberts.net"
   , "www.bloomberg.com"
   , "www.bls.gov"
   , "www.bmj.com"
   , "www.bnlearn.com"
   , "www.brandonsanderson.com"
   , "www.broadinstitute.org"
   , "www.bronxbanterblog.com"
   , "www.bulletproof.com"
   , "www.businessinsider.com"
   , "www.businessinsider.jp"
   , "www.businesswire.com"
   , "www.buttercupfestival.com"
   , "www.buzzfeed.com"
   , "www.buzzfeednews.com"
   , "www.bvp.com"
   , "www.byrnehobart.com"
   , "www.cabinetmagazine.org"
   , "www.calnewport.com"
   , "www.cambridge.org"
   , "www.campbellrivermirror.com"
   , "www.cancer.gov"
   , "www.cancerresearchuk.org"
   , "www.cap-lore.com"
   , "www.carolinacoastonline.com"
   , "www.catb.org"
   , "www.cato.org"
   , "www.cebm.ox.ac.uk"
   , "www.cehd.umn.edu"
   , "www.cell.com"
   , "www.census.gov"
   , "www.change.org"
   , "www.channel4.com"
   , "www.chathamstartribune.com"
   , "www.chemistryworld.com"
   , "www.chessclub.com"
   , "www.chess.com"
   , "www.chicagobooth.edu"
   , "www.chinafile.com"
   , "www.chronicle.com"
   , "www.churchofjesuschrist.org"
   , "www.cisco.com"
   , "www.citizenaudit.org"
   , "www.city-journal.org"
   , "www.clippershipteaco.com"
   , "www.clubindustry.com"
   , "www.cmajopen.ca"
   , "www.cmu.edu"
   , "www.cnbc.com"
   , "wwwcn.cs.uni-duesseldorf.de"
   , "www.cnet.com"
   , "www.cochranelibrary.com"
   , "www.codespaces.com"
   , "www.collisiondetection.net"
   , "www.comicbox.co.jp"
   , "www.comicconnect.com"
   , "www.computerworld.com"
   , "www.consumerlab.com"
   , "www.copenhagenconsensus.com"
   , "www.copyright.gov"
   , "www.counterpunch.org"
   , "www.coursera.org"
   , "www.courtlistener.com"
   , "www.courts.mo.gov"
   , "www.courts.sa.gov.au"
   , "www.cracked.com"
   , "www.cram.com"
   , "www.crd.york.ac.uk"
   , "www.csail.mit.edu"
   , "www.cs.cornell.edu"
   , "www.cs.purdue.edu"
   , "www.csub.edu"
   , "www.cs.utexas.edu"
   , "www.cs.york.ac.uk"
   , "www.dailyfinance.com"
   , "www.dailystar.co.uk"
   , "www.dantelabs.com"
   , "www.darkowl.com"
   , "www.dcscience.net"
   , "www.dea.gov"
   , "www.deepmind.com"
   , "www.delawareonline.com"
   , "www.designboom.com"
   , "www.detectiveconanworld.com"
   , "www.devever.net"
   , "www.deviantart.com"
   , "www.dharmaoverground.org"
   , "www.dichtbij.nl"
   , "www.discovermagazine.com"
   , "www.ditext.com"
   , "www.dobuusagi.com"
   , "www.dr.dk"
   , "www.dropbox.com"
   , "www.drugs.com"
   , "www.drugsdata.org"
   , "www.dtic.mil"
   , "www.dummy-system.com"
   , "www.duolingo.com"
   , "www.ebay.com"
   , "www.ebay.co.uk"
   , "www.ecns.cn"
   , "www.ed.ac.uk"
   , "www.edge.org"
   , "www.eetimes.com"
   , "www.effectuation.org"
   , "www.elastic.co"
   , "www.elon.edu"
   , "www.emacswiki.org"
   , "www.emcdda.europa.eu"
   , "www.energy.gov"
   , "www.engadget.com"
   , "www.english.upenn.edu"
   , "www.enworld.org"
   , "www.eoht.info"
   , "www.epjournal.net"
   , "www.equilibretechnologies.com"
   , "www.eric.ed.gov"
   , "www.erowid.org"
   , "www.e-sanitas.edu.co"
   , "www.escholar.manchester.ac.uk"
   , "www.esquire.com"
   , "www.eurekalert.org"
   , "www.eurojust.europa.eu"
   , "www.eusprig.org"
   , "www.evalegend.com"
   , "www.ex.org"
   , "www.expert-reviews.com"
   , "www.expressandstar.com"
   , "www.express.co.uk"
   , "www.facebook.com"
   , "www.fanfiction.net"
   , "www.faqs.org"
   , "www.fasebj.org"
   , "www.fastcompany.com"
   , "www.fda.gov"
   , "www.ff7citadel.com"
   , "www.fightaging.org"
   , "www.fimfiction.net"
   , "www.fincen.gov"
   , "www.findagrave.com"
   , "www.firstthings.com"
   , "www.flashback.org"
   , "www.flashgamehistory.com"
   , "www.flickr.com"
   , "www.foliosociety.com"
   , "www.fool.com"
   , "www.forbes.com"
   , "www.fordfoundation.org"
   , "www.foreignaffairs.com"
   , "www.fox6now.com"
   , "www.foxcarolina.com"
   , "www.foxnews.com"
   , "www.frbsf.org"
   , "www.freehaven.net"
   , "www.frontiersin.org"
   , "www.fs.fed.us"
   , "www.fsigenetics.com"
   , "www.ftc.gov"
   , "www.garda.ie"
   , "www.genome.gov"
   , "www.genwaybio.com"
   , "www.getlamp.com"
   , "www.girlschase.com"
   , "www.girlscouts.org"
   , "www.globaltimes.cn"
   , "www.global.toshiba"
   , "www.gloucestershirelive.co.uk"
   , "www.gnu.org"
   , "www.goodreads.com"
   , "www.goodtherapy.org"
   , "www.google.com"
   , "www.goproblems.com"
   , "www.gov.uk"
   , "www.greenexercise.org"
   , "www.gsb.stanford.edu"
   , "www.guilford.com"
   , "www.hakalalabs.com"
   , "www.hanselman.com"
   , "www.harney.com"
   , "www.harvardmagazine.com"
   , "www.haskell.org"
   , "www.heraldnews.com"
   , "www.highbeam.com"
   , "www.highflightfoundation.org"
   , "www.hindustantimes.com"
   , "www.history.com"
   , "www.historytoday.com"
   , "www.holidaymead.com"
   , "www.hoover.org"
   , "www.hrw.org"
   , "www.htrnews.com"
   , "www.huffpost.com"
   , "www.ibtimes.co.uk"
   , "www.ice.gov"
   , "www.idnes.cz"
   , "www.ietf.org"
   , "www.iflscience.com"
   , "www.iherb.com"
   , "www.illumina.com"
   , "www.imagesco.com"
   , "www.imdb.com"
   , "www.imf.org"
   , "www.imminst.org"
   , "www.impactcybertrust.org"
   , "www.inc.com"
   , "www.independent.co.uk"
   , "www.indiana.edu"
   , "www.industrydocuments.ucsf.edu"
   , "www.infinitychess.com"
   , "www.infinityplus.co.uk"
   , "www.infoplease.com"
   , "www.informit.com"
   , "www.inputmag.com"
   , "www.insidehighered.com"
   , "www.instagram.com"
   , "www.instructables.com"
   , "www.intel.com"
   , "www.iqout.com"
   , "www.irishcentral.com"
   , "www.irishexaminer.com"
   , "www.irishtimes.com"
   , "www.irrodl.org"
   , "www.isfdb.org"
   , "www.ivfbabble.com"
   , "www.jacc.org"
   , "www.jackkinsella.ie"
   , "www.jacurutu.com"
   , "www.jameslindlibrary.org"
   , "www.janelia.org"
   , "www.japantimes.co.jp"
   , "www.jetbrains.com"
   , "www.jneurosci.org"
   , "www.joshdean.com"
   , "www.journalnow.com"
   , "www.jstage.jst.go.jp"
   , "www.jstatsoft.org"
   , "www.jstor.org"
   , "www.justice.gov"
   , "www.jwz.org"
   , "www.kadokawa.co.jp"
   , "www.kaggle.com"
   , "www.kctv5.com"
   , "www.kgw.com"
   , "www.khara.co.jp"
   , "www.kickstarter.com"
   , "www.kokos.cz"
   , "www.kptv.com"
   , "www.labone.tech"
   , "www.lanl.gov"
   , "www.laphamsquarterly.org"
   , "www.latimes.com"
   , "www.law.cornell.edu"
   , "www.lef.org"
   , "www.lemonde.fr"
   , "www.leontiadis.info"
   , "www.liebertpub.com"
   , "www.lightspeedmagazine.com"
   , "www.limeadery.com"
   , "www.linode.com"
   , "www.l-iz.de"
   , "www.loc.gov"
   , "www.locusmag.com"
   , "www.longecity.org"
   , "www.longevityhistory.com"
   , "www.loudountimes.com"
   , "www.lrb.co.uk"
   , "www.lshtm.ac.uk"
   , "www.lyrn.ai"
   , "www.maa.org"
   , "www.macrumors.com"
   , "www.madboa.com"
   , "www.manchestereveningnews.co.uk"
   , "www.mangauk.com"
   , "www.mangaupdates.com"
   , "www.mansfieldnewsjournal.com"
   , "www.marxists.org"
   , "www.mathematica.org"
   , "www.mayoclinic.org"
   , "www.mayoclinicproceedings.org"
   , "www.mcsweeneys.net"
   , "www.mdpi.com"
   , "www.mediafire.com"
   , "www.medicaldaily.com"
   , "www.medicines.org.uk"
   , "www.medrxiv.org"
   , "www.megaverse.info"
   , "www.mercatus.org"
   , "www.mesacc.edu"
   , "www.metaculus.com"
   , "www.mha.gov.sg"
   , "www.mhlw.go.jp"
   , "www.microsoft.com"
   , "www.millionshort.com"
   , "www.mindsparke.com"
   , "www.mining.com"
   , "www.mirror.co.uk"
   , "www.mit.edu"
   , "www.mja.com.au"
   , "www.mobihealthnews.com"
   , "www.moma.org"
   , "www.morinaga.co.jp"
   , "www.msri.org"
   , "www.muckrock.com"
   , "www.myfonts.com"
   , "www.nap.edu"
   , "www.nationaldefensemagazine.org"
   , "www.nato.int"
   , "www.nature.com"
   , "www.nausicaa.net"
   , "www.nba.com"
   , "www.nber.org"
   , "www.nbr.co.nz"
   , "www.ncbi.nlm.nih.gov"
   , "www.ndss-symposium.org"
   , "www.nearlyfreespeech.net"
   , "www.nejm.org"
   , "www.neuroscience.cam.ac.uk"
   , "www.newadvent.org"
   , "www.newegg.com"
   , "www.newscientist.com"
   , "www.newstatesman.com"
   , "www.newsweek.com"
   , "www.newyorker.com"
   , "www.newyorkfed.org"
   , "www.nextnewdeal.net"
   , "www.nicovideo.jp"
   , "www.nicvape.com"
   , "www.nimh.nih.gov"
   , "www.nitrd.gov"
   , "www.nlsinfo.org"
   , "www.nngroup.com"
   , "www.nobelprize.org"
   , "www.nola.com"
   , "www.northjersey.com"
   , "www.northwestgeorgianews.com"
   , "www.notion.so"
   , "www.nrdc.org"
   , "www.nsa.gov"
   , "www.ntticc.or.jp"
   , "nyaa.si"
   , "www.nybooks.com"
   , "www.nytimes.com"
   , "www.nzherald.co.nz"
   , "www.odt.co.nz"
   , "www.oglaf.com"
   , "www.ohri.ca"
   , "www.olin.edu"
   , "www.oliverwinery.com"
   , "www.om.nl"
   , "www.openphilanthropy.org"
   , "www.optimizely.com"
   , "www.optimox.com"
   , "www.oreilly.com"
   , "www.osti.gov"
   , "www.outsideonline.com"
   , "www.overcomingbias.com"
   , "www.overthinkingit.com"
   , "www.packtpub.com"
   , "www.patreon.com"
   , "www.pbs.org"
   , "www.pcworld.com"
   , "www.petcarerx.com"
   , "www.petco.com"
   , "www.peterbloem.nl"
   , "www.petforums.co.uk"
   , "www.phillymag.com"
   , "www.pixiv.net"
   , "www.pluralsight.com"
   , "www.plymouthherald.co.uk"
   , "www.pnas.org"
   , "www.poetrynook.com"
   , "www.politie.nl"
   , "www.polizei.bayern.de"
   , "www.polizei.sachsen.de"
   , "www.polygon.com"
   , "www.popularmechanics.com"
   , "www.postandcourier.com"
   , "www.preclinicaltrials.eu"
   , "www.pressandjournal.co.uk"
   , "www.prnewswire.com"
   , "www.progressive.org"
   , "www.projectrho.com"
   , "www.proofofexistence.com"
   , "www.propublica.org"
   , "www.prospecbio.com"
   , "www.protoculture.ca"
   , "www.psychologicalscience.org"
   , "www.psychologytoday.com"
   , "www.quantamagazine.org"
   , "www.quora.com"
   , "www.rand.org"
   , "www.ratbehavior.org"
   , "www.rbmojournal.com"
   , "www.rean-wings.net"
   , "www.rechem.ca"
   , "www.reddit.com"
   , "www.redliongrantchester.co.uk"
   , "www.replicatedtypo.com"
   , "www.repository.cam.ac.uk"
   , "www.rescuetime.com"
   , "www.researchandmarkets.com"
   , "www.researchgate.net"
   , "www.research.va.gov"
   , "www.rightstufanime.com"
   , "www.r-inla.org"
   , "www.roangelo.net"
   , "www.rocketpunk-manifesto.com"
   , "www.rollingstone.com"
   , "www.rrauction.com"
   , "www.rsm.nl"
   , "www.rte.ie"
   , "www.rug.nl"
   , "www.salesforce.com"
   , "www.samharris.org"
   , "www.sandia.gov"
   , "www.scholarpedia.org"
   , "www.sciencedaily.com"
   , "www.sciencedirect.com"
   , "www.sciencemag.org"
   , "www.science.org"
   , "www.scientificamerican.com"
   , "www.scifiscripts.com"
   , "www.scmp.com"
   , "www.scotthyoung.com"
   , "www.scq.ubc.ca"
   , "www.screendaily.com"
   , "www.sdfertility.com"
   , "www.seacoastonline.com"
   , "www.sebastianmarshall.com"
   , "www.sec.gov"
   , "www.seistronix.com"
   , "www.semanticscholar.org"
   , "www.sendspace.com"
   , "www.sequentialtart.com"
   , "www.sethroberts.net"
   , "www.sfawardswatch.com"
   , "www.shine.cn"
   , "www.shroomery.org"
   , "www.si.edu"
   , "www.simonsfoundation.org"
   , "www.slideshare.net"
   , "www.smarternootropics.com"
   , "www.smartpowders.com"
   , "www.smbc-comics.com"
   , "www.smh.com.au"
   , "www.smithsonianmag.com"
   , "www.snopes.com"
   , "www.snpp.com"
   , "www.soci.org"
   , "www.sophos.com"
   , "www.southwales-eveningpost.co.uk"
   , "www.spacedrepetition.com"
   , "www.sparkfun.com"
   , "www.spectator.co.uk"
   , "www.speedtest.net"
   , "www.spermbankcalifornia.com"
   , "www.spiceandtea.com"
   , "www.ssa.gov"
   , "www.ssi.shimadzu.com"
   , "www.startupschool.org"
   , "www.stat.colostate.edu"
   , "www.stats.govt.nz"
   , "www.stevepetersen.net"
   , "www.stroudnewsandjournal.co.uk"
   , "www.stuartcheshire.org"
   , "www.sudowrite.com"
   , "www.supermemo.com"
   , "www.tabletmag.com"
   , "www.tandfonline.com"
   , "www.taylorusa.com"
   , "www.teamten.com"
   , "www.teasetc.com"
   , "www.teavana.com"
   , "www.technologyreview.com"
   , "www.ted.com"
   , "www.teds.ac.uk"
   , "www.telegraph.co.uk"
   , "www.tennessean.com"
   , "www.tensorflow.org"
   , "www.tga.gov.au"
   , "www.theadvertiser.com"
   , "www.theage.com.au"
   , "www.theannals.com"
   , "www.theatlantic.com"
   , "www.thedailybeast.com"
   , "www.thediff.co"
   , "www.theguardian.com"
   , "www.thehomesecuritysuperstore.com"
   , "www.theladders.com"
   , "www.thelancet.com"
   , "www.thelocal.de"
   , "www.themarshallproject.org"
   , "www.thenewatlantis.com"
   , "www.theonion.com"
   , "www.theringer.com"
   , "www.theroot.com"
   , "www.the-scientist.com"
   , "www.thessgac.org"
   , "www.thestar.com"
   , "www.thetimes.co.uk"
   , "www.the-tls.co.uk"
   , "www.theverge.com"
   , "www.thisamericanlife.org"
   , "www.thisstorydoesnotexist.com"
   , "www.thoughtco.com"
   , "www.thv11.com"
   , "www.ti.com"
   , "www.timeanddate.com"
   , "www.timesofisrael.com"
   , "www.tinyletter.com"
   , "www.tn.gov"
   , "www.tomshardware.com"
   , "www.topic.com"
   , "www.toplessrobot.com"
   , "www.torproject.org"
   , "www.torservers.net"
   , "www.townandcountrymag.com"
   , "www.treasurydirect.gov"
   , "www.trixietracker.com"
   , "www.tryhaskell.org"
   , "www.tuftandneedle.com"
   , "www.tweaktown.com"
   , "www.twitch.tv"
   , "www.typografie.info"
   , "www.typography.com"
   , "www.uber.com"
   , "www.ukbiobank.ac.uk"
   , "www.unitedpharmacies-uk.md"
   , "www.upi.com"
   , "www.upjohn.org"
   , "www.uptontea.com"
   , "www.urth.net"
   , "www.usagi.org"
   , "www.uscourts.gov"
   , "www.usenix.org"
   , "www.usgs.gov"
   , "www.uso.org"
   , "www.uv.es"
   , "www.verywellhealth.com"
   , "www.vg.no"
   , "www.vice.com"
   , "www.vitacost.com"
   , "www.vox.com"
   , "www.wahpetondailynews.com"
   , "www.walesonline.co.uk"
   , "www.walmart.com"
   , "www.wangafu.net"
   , "www.washingtonexaminer.com"
   , "www.washingtonpost.com"
   , "www.watercoolertrivia.com"
   , "www.wcscanada.org"
   , "www.wdaz.com"
   , "www.wdrb.com"
   , "www.webcitation.org"
   , "www.weidai.com"
   , "www.weizmann.ac.il"
   , "www.welt.de"
   , "www.whio.com"
   , "www.whirlpool.com"
   , "www.who.int"
   , "www.wickedlocal.com"
   , "wikiwix.com"
   , "www.willatworklearning.com"
   , "www.williamsburgmarketplace.com"
   , "www.williamsondailynews.com"
   , "www.wine-searcher.com"
   , "www.winonadailynews.com"
   , "www.wireheading.com"
   , "www.wnycstudios.org"
   , "www.wolframalpha.com"
   , "worksinprogress.co"
   , "www.worldcat.org"
   , "www.wunderground.com"
   , "www.wzzm13.com"
   , "www.xilinx.com"
   , "www.xinhuanet.com"
   , "www.xn--4dbcyzi5a.com"
   , "www.ycombinator.com"
   , "wyclif.substack.com"
   , "yourmorals.org"
   , "yp.flutterguy.org"
   , "yunnansourcing.com"
   , "yunnansourcing.us"
   , "zerocoin.org"
   , "z-lib.is"
   , "academic.oup.com"
   , "journals.biologists.com"
   , "github.blog"
   , "diabetesjournals.org"
   , "boards.fireden.net"
   , "archive.ph"
   , "pediatrics.aappublications.org"
   , "incompleteideas.net"
   , "www.incompleteideas.net"
   , "www.harvey.ai"
   , "www.reuters.com"
   , "www.biology.ualberta.ca"
   , "cvm.missouri.edu"
   , "data.bls.gov"
   , "jov.arvojournals.org"
   , "discoverbooks.com"
   , "www.fathomevents.com"
   , "www.iarpa.gov"
   , "www.rosebud.ai"
   , "karger.com"
   , "www.davidsongifted.org"
   , "www.project-imas.com"
   , "vitalik.eth.limo"
   , "memteaimports.com"
   , "garote.bdmonkeys.net"
   , "diff.wikimedia.org"
   , "animate-your-word.github.io"
   , "iodineresearch.com"
   , "members.madasafish.com"
   , "3quarksdaily.com"
   , "blog.daviskedrosky.com"
   , "civitai.com"
   , "classic.clinicaltrials.gov"
   , "cwe.mitre.org"
   , "deepmind.google"
   , "figshare.com"
   , "fonts.google.com"
   , "learn.microsoft.com"
   , "nap.nationalacademies.org"
   , "news.microsoft.com"
   , "platform.openai.com"
   , "psychology.wvu.edu"
   , "pubs.aip.org"
   , "shs.hal.science"
   , "solar.lowtechmagazine.com"
   , "supp.apa.org"
   , "tim.blog"
   , "training.cochrane.org"
   , "www.anthropic.com"
   , "www.clinicaltrialsregister.eu"
   , "www.crunchbase.com"
   , "www.daviddarling.info"
   , "www.genecards.org"
   , "www.henrikkarlsson.xyz"
   , "www.inverse.com"
   , "www.journals.uchicago.edu"
   , "www.linkedin.com"
   , "www.noahpinion.blog"
   , "www.robots.ox.ac.uk"
   , "www.theinformation.com"
   , "www.theintrinsicperspective.com"
   , "www.tiktok.com"
   , "www.whitehouse.gov"
   , "www.yahoo.com"
   , "zenodo.org"
   , "apnews.com"
   , "research.com"
   , "research.google"
   , "allenai.org"
   , "dnstats.net"
   , "en.bitcoin.it"
   , "humanvarieties.org"
   , "kill-the-newsletter.com"
   , "marginalrevolution.com"
   , "philpapers.org"
   , "readwrite.com"
   , "statmodeling.stat.columbia.edu"
   , "www.otakustudy.com"
   , "www.politico.com"
   , "www.theparisreview.org"
   , "www.axios.com"
   , "mhooten.github.io"
   , "blog.novelai.net"
   , "medicalxpress.com"
   , "phys.org"
   , "www.bartleby.com"
   , "ki.se"
   , "pmc.ncbi.nlm.nih.gov"
   , "www.manifold1.com"
   , "www.dwarkesh.com"
   , "jamanetwork.com"
   , "www.midjourney.com"
   , "www.mrc-epid.cam.ac.uk"
   , "wiki.c2.com"
   , "www.wsj.com"
   , "scholarship.law.upenn.edu"
   , "neojaponisme.com"
   , "www.larryniven.net"
   , "www.cs.ox.ac.uk"
   , "www.librarything.com"
   , "www.cia.gov"
   , "www.lifeview.com"
   , "www.statnews.com"
   , "www.dhammawiki.com"
   , "docs.midjourney.com"
   , "reactormag.com"
   , "www.w3.org"
   , "en.wikifur.com"
   , "ew.com"
   , "fibery.io"
   , "freakonomics.com"
   , "antifandom.com"
   ]

-- The full-URL lists below are tested using `isURL` in `LinkLive`, and each is a list of unique entries:
goodLinks = setLike
          [ "https://aleph.se/andart2/neuroscience/energetics-of-the-brain-and-ai/"
            , "https://beza1e1.tuxen.de/articles/accidentally_turing_complete.html"
            , "https://courses.csail.mit.edu/6.857/2012/files/nash.py"
            , "https://datacolada.org/"
            , "https://diyhpl.us/wiki/transcripts/hgp-write/2016-05-10/ultra-safe-cell-line/"
            , "https://dwarffortresswiki.org/index.php/User:BaronW#The_Almighty_Dwarven_Calculator"
            , "https://evaotaku.com/html/programbooks.html"
            , "https://forre.st/storage#hdd"
            , "https://google-summer-of-code-2009-haskell.googlecode.com/files/Niklas_Broberg.tar.gz"
            , "https://inhumanexperiment.blogspot.com/2009/03/increasing-intelligence-by-playing.html"
            , "https://jakewestfall.org/"
            , "https://langsec.org/"
            , "https://libgen.li/scimag/"
            , "https://mattmahoney.net/dc/dce.html"
            , "https://norvig.com/norvigs-law.html"
            , "https://ohtori.nu/creators/contributors.html"
            , "https://programme.exordo.com/isir2017/delegates/presentation/29/"
            , "https://blondihacks.com/furiosas-cat-feeder/"
            , "https://r6.ca/blog/20090522T015739Z.html"
            -- , "https://1dollarscan.com/"
            , "https://80000hours.org/podcast/episodes/brian-christian-algorithms-to-live-by/"
            , "https://abandonedfootnotes.blogspot.com/2011/04/qaddafis-chickens.html"
            , "https://abcnews.go.com/Business/steve-jobs-death-billions-remain-private-topic/story?id=14682218"
            , "https://abcnotation.com/wiki/abc:standard:v2.1#comments_and_remarks"
            , "https://about.google/"
            , "https://academictorrents.com/details/0d366035664fdf51cfbe9f733953ba325776e667/tech"
            , "https://aclanthology.org/D15-1002/"
            , "https://ageofem.com/"
            , "https://agtb.wordpress.com/2012/02/17/john-nashs-letter-to-the-nsa/#comment-5458"
            , "https://static.googleusercontent.com/media/research.google.com/en//pubs/archive/46180.pdf"
            , "https://aiimpacts.org/wp-content/uploads/2019/02/image2.png"
            , "https://alexanderetz.com/2015/08/30/the-bayesian-reproducibility-project/"
            -- , "https://altjapan.typepad.com/my_weblog/2007/05/better_stronger.html" -- spoofing fake 403 errors
            , "https://andrewmayne.com/2020/07/08/openai-api-alchemy-turn-a-script-into-a-novel-and-vice-versa/"
            , "https://andymatuschak.org/"
            , "https://andzuck.com/blog/sfw/"
            , "https://animekritik.wordpress.com/2011/12/03/imperialism-translation-gunbuster-episode-five/"
            , "https://ansuz.sooke.bc.ca/entry/23"
            , "https://apenwarr.ca/log/?m=201707#04"
            , "https://arbtt.nomeata.de/"
            , "https://web.archive.org/web/20250126173106/https://architext.design/about/"
            , "https://archivebox.io/"
            , "https://archive.nytimes.com/6thfloor.blogs.nytimes.com/2013/03/20/a-sham-procedure-leads-to-disappointing-m-s-news/"
            , "https://archive.nytimes.com/bits.blogs.nytimes.com/2012/06/07/good-night-moon-good-night-little-bird/"
            , "https://archive.nytimes.com/dealbook.nytimes.com/2011/09/03/the-survivor-who-saw-the-future-for-cantor-fitzgerald/"
            , "https://archive.nytimes.com/opinionator.blogs.nytimes.com/2009/11/24/the-end-of-music/"
            , "https://archive.nytimes.com/scientistatwork.blogs.nytimes.com/2012/09/06/lost-in-time-in-the-antarctic-ice-age/"
            , "https://archive.nytimes.com/well.blogs.nytimes.com/2009/06/08/worries-about-antioxidant-use-by-breast-cancer-patients/"
            , "https://archive.nytimes.com/www.nytimes.com/books/first/b/budiansky-lion.html"
            , "https://archive.seattletimes.com/archive/?date=19930513&slug=1701067"
            , "https://arima.cylab.cmu.edu/markets/cybercrime.php"
            , "https://arr.am/2020/07/14/elon-musk-by-dr-seuss-gpt-3/"
            , "https://asktog.com/atc/the-third-user/"
            , "https://bair.berkeley.edu/blog/2020/07/11/auction/"
            , "https://beepb00p.xyz/pkm-search.html#appendix_cloudmacs"
            , "https://behavioralscientist.org/mindware-the-high-cost-of-not-doing-experiments/"
            , "https://bellard.org/jslinux/tech.html"
            , "https://bitcoin-otc.com/"
            , "https://bldgblog.com/2017/01/the-season-of-burning-trucks/"
            , "https://blog.8faces.com/post/132017260619/eric-gill-advance"
            , "https://blog.beeminder.com/hieroglyphs/"
            , "https://blog.codinghorror.com/why-cant-programmers-program/"
            , "https://blog.cr.yp.to/20151120-batchattacks.html"
            , "https://blog.cryptographyengineering.com/2013/04/11/zerocoin-making-bitcoin-anonymous/"
            , "https://blog.csdn.net/DLW__/article/details/104243506"
            , "https://blog.eleuther.ai/factored-cognition/"
            , "https://blog.ethereum.org/2014/07/05/stake"
            , "https://blog.google/outreach-initiatives/small-business/google-ads-helping-businesses/"
            , "https://blog.nuclearsecrecy.com/2013/05/17/the-price-of-the-manhattan-project/"
            , "https://blog.otoro.net/2017/11/12/evolving-stable-strategies/"
            , "https://blog.regehr.org/archives/861"
            , "https://blogs.lanecc.edu/dhatthecc/wp-content/uploads/sites/28/2015/06/Moretti-Slaughterhouse-of-Lit.pdf"
            , "https://blog.thinkst.com/p/if-nsa-has-been-hacking-everything-how.html?m=1"
            , "https://blog.youtube/news-and-events/five-stars-dominate-ratings/"
            , "https://bmk.sh/2020/08/17/Building-AGI-Using-Language-Models/"
            -- , "https://boingboing.net/2012/08/09/make-yourself-healthy-searchi.html" -- spoofing fake 403 errors
            , "https://bwc.thelab.dc.gov/"
            , "https://cacm.acm.org/research/the-science-of-brute-force/"
            , "https://caniuse.com/?search=hyphenate"
            , "https://carbonplan.org/research/forest-offsets"
            , "https://casual-effects.com/markdeep/"
            , "https://catonmat.net/proof-that-sed-is-turing-complete"
            , "https://cdn.openai.com/API/English_Bash_Python.mp4"
            , "https://cognitivemedium.com/vme"
            , "https://commons.wikimedia.org/wiki/Category:Variations_on_the_national_flag_of_Japan"
            , "https://compdemocracy.org/algorithms/"
            , "https://complearn.org/thesis.html"
            , "https://conifer.rhizome.org/"
            , "https://corpgov.law.harvard.edu/2017/01/31/the-common-law-corporation-the-power-of-the-trust-in-anglo-american-business-history/"
            , "https://cran.r-project.org/web/packages/BradleyTerry2/index.html"
            , "https://crookedtimber.org/2012/05/30/in-soviet-union-optimization-problem-solves-you/#comment-415931"
            , "https://cs.stanford.edu/people/karpathy/reinforcejs/gridworld_dp.html"
            , "https://ctan.org/pkg/yinit"
            , "https://daniellakens.blogspot.com/2017/07/impossibly-hungry-judges.html"
            , "https://danluu.com/input-lag/"
            , "https://danwang.co/college-girardian-terror/"
            , "https://dataprivacylab.org/dataprivacy/projects/ssnwatch/index.html"
            , "https://davidepstein.com/david-epstein-the-sports-gene/"
            , "https://defector.com/in-the-future-of-collecting-is-anyone-having-fun"
            , "https://demos.obormot.net/these-waifus-do-not-exist-v2-alt"
            , "https://digital.library.unt.edu/explore/partners/TAMS/browse/?q=%22Julian+Stanley%22+OR+%22SMPY%22&sort=date_a&t=fulltext"
            , "https://distill.pub/2017/aia/"
            , "https://docs.google.com/document/d/1MhA3M5ucBD7ZXcWk57_MKZ5jEgPX6_YiKye_EFP-adg/edit"
            , "https://dominiccummings.com/2019/03/01/on-the-referendum-31-project-maven-procurement-lollapalooza-results-nuclear-agi-safety/"
            , "https://donsbot.com/2007/05/17/roll-your-own-window-manager-tracking-focus-with-a-zipper/"
            , "https://hackage.haskell.org/package/base-4.19.1.0/docs/Prelude.html#v:until"
            , "https://dresdencodak.com/2009/09/22/caveman-science-fiction/"
            , "https://dumps.wikimedia.org/enwiki/latest/"
            , "https://e2eml.school/transformers.html"
            , "https://egamebook.com/lochness/"
            , "https://eileenormsby.com/2013/09/26/the-fall-of-atlantis-a-moderator-tells/"
            , "https://eli.thegreenplace.net/2007/06/28/sicp-section-122/"
            , "https://emilkirkegaard.dk/en/2015/10/polygenic-traits-and-the-distribution-of-effect-sizes-years-of-education-from-rietveld-et-al-2013/"
            , "https://energycontrol.org/quienes-somos/proyectos/"
            , "https://engineering.fb.com/2017/06/14/ml-applications/deal-or-no-deal-training-ai-bots-to-negotiate/"
            , "https://enki2.tumblr.com/stories"
            , "https://en.wikibooks.org/wiki/Category:Book:Accountancy"
            , "https://en.wikichip.org/wiki/intel/core_i9/i9-7900x"
            , "https://en.wikipedia.org/wiki/Talk:Small_caps"
            , "https://en.wikipedia.org/wiki/User:Gwern"
            , "https://en.wikiquote.org/wiki/Tao_Te_Ching"
            , "https://en.wikisource.org/wiki/Meditation_XVII"
            , "https://en.wiktionary.org/wiki/steward#Etymology"
            , "https://eprint.iacr.org/2021/1273"
            , "https://equilibriabook.com/molochs-toolbox/"
            , "https://esolangs.org/wiki/Linear_bounded_automaton"
            , "https://etienne.se/cfnse/"
            , "https://eukaryotewritesblog.com/2017/06/30/book-review-barriers/"
            , "https://eva-fan.com/blog-entry-1198.html"
            , "https://exac.broadinstitute.org/faq"
            , "https://explorabl.es/"
            , "https://extras.denverpost.com/stateofhope/"
            , "https://familiarcycle.net/2020/how-to-finetune-gpt2-on-podcast-transcripts"
            , "https://fastmoe.ai/"
            , "https://fasttext.cc/blog/2017/10/02/blog-post.html"
            , "https://files.eric.ed.gov/fulltext/EJ746292.pdf"
            , "https://files.givewell.org/files/conversations/Stanley%20Young%20slides%20on%20multiple%20testing.pdf"
            , "https://foreignpolicy.com/2012/09/28/aircraft-carriers-in-space/"
            , "https://forum.evageeks.org/post/500631/Who-Can-Be-The-Seele-Children/#500631"
            , "https://web.archive.org/web/20150331014003/https://forum.quantifiedself.com/thread-zeo-shutting-down-export-your-data?pid=3412#pid3412"
            , "https://forums.animesuki.com/showpost.php?p=3584198"
            , "https://foundation.wikimedia.org/wiki/Privacy_policy"
            , "https://freedomdefined.org/Licenses/NC"
            , "https://fullfrontal.moe/interview-mahiro-maeda/"
            , "https://futurism.com/neural-network-draw-doom-guy-high-res"
            , "https://galois.com/blog/2008/9/17/parsing-the-linux-kernel-with-haskell-experience-with-langua.html"
            , "https://gamefaqs.gamespot.com/boards"
            , "https://gameprogrammingpatterns.com/dirty-flag.html"
            , "https://gaotianyu.xyz/prompting/"
            , "https://gizmodo.com.au/2020/05/the-internet-furry-drama-raising-big-questions-about-artificial-intelligence/"
            -- , "https://globalguerrillas.typepad.com/" -- excluded due to spoofing fake errors
            , "https://globalvoices.org/2011/11/05/japans-it-exodus-a-personal-perspective-part-2/print/"
            , "https://gondwanaland.com/mlog/2011/10/21/almost-innovation/"
            , "https://googleblog.blogspot.com/2011/10/fall-sweep.html"
            , "https://googleprojectzero.blogspot.com/2017/07/trust-issues-exploiting-trustzone-tees.html"
            , "https://googlesystem.blogspot.com/2013/07/google-alerts-drops-rss-feeds.html"
            , "https://gpt3demo.com/apps/magicemail-io"
            , "https://gradientscience.org/data_rep_bias/"
            , "https://gutenberg.ca/ebooks/smithcordwainer-onthegemplanet/smithcordwainer-onthegemplanet-00-h.html"
            , "https://gutenberg.net.au/ebooks03/0300151h.html"
            , "https://guzey.com/books/why-we-sleep/#no-shorter-sleep-does-not-imply-shorter-life-span"
            , "https://hackage.haskell.org/package/archiver"
            , "https://hakaimagazine.com/features/can-we-really-be-friends-octopus/"
            , "https://handbook-5-1.cochrane.org/chapter_8/8_assessing_risk_of_bias_in_included_studies.htm"
            , "https://hapgood.us/2019/03/28/network-heuristics/"
            , "https://harpers.org/archive/2013/09/the-devils-bait/?single=1"
            , "https://hdsr.mitpress.mit.edu/pub/wi9yky5c/release/2"
            , "https://healthland.time.com/2012/04/05/frozen-assets-why-u-s-sperm-is-a-hot-commodity/"
            , "https://herbsutter.com/welcome-to-the-jungle/"
            , "https://highnoongmt.wordpress.com/2015/08/13/deep-learning-for-assisting-the-process-of-music-composition-part-3/"
            , "https://historycooperative.org/a-short-history-on-sleep-before-the-industrial-revolution/"
            , "https://hpmor.com/chapter/64"
            , "https://hub.darcs.net/simon/darcsden"
            , "https://ideas.repec.org/a/eee/ecolet/v91y2006i3p395-401.html"
            , "https://idlewords.com/2010/03/scott_and_scurvy.htm"
            , "https://ifdo.ca/~seymour/runabc/abcguide/abc2midi_guide.html"
            , "https://iforcedabot.com/what-can-a-fake-news-detector-do/"
            , "https://image-net.org/challenges/beyond_ilsvrc.php"
            , "https://infoproc.blogspot.com/2010/10/wigner-recollections.html"
            , "https://intelligence.org/2016/09/12/new-paper-logical-induction/"
            , "https://iqcomparisonsite.com/"
            , "https://isomerdesign.com/pihkal/read/tk/35"
            , "https://it.wikipedia.org/wiki/Gualtiero_Cannarsi"
            , "https://jamesyu.org/about/"
            , "https://japansociety.org/resources/content/2/0/5/4/documents/azuma_mcgray%20interview.pdf"
            , "https://jasoncrawford.org/"
            , "https://jaspervdj.be/files/2011-gsoc-text-utf8-proposal.html"
            , "https://jax.readthedocs.io/en/latest/en/latest/notebooks/xmap_tutorial.html"
            , "https://jaypsong.blog/2011/11/15/poverty-by-moon-byung-ran/"
            , "https://jdlm.info/articles/2018/03/18/markov-decision-process-2048.html"
            , "https://jessegalef.com/2013/01/27/messing-with-time-why-the-flash-is-in-hell/"
            , "https://jetpress.org/volume1/moravec.htm"
            , "https://jgeekstudies.org/2016/05/19/great-attractor-ttgl/"
            , "https://joa.sh/posts/2015-09-14-prerender-mathjax.html"
            , "https://johncwright.livejournal.com/117818.html"
            , "https://jonmillward.com/blog/studies/deep-inside-a-study-of-10000-porn-stars/"
            , "https://journal.stuffwithstuff.com/2020/04/05/crafting-crafting-interpreters/"
            , "https://jtauber.com/blog/2004/11/26/programmed_vocabulary_learning_as_a_travelling_salesman_problem/"
            , "https://justgetflux.com/"
            , "https://kajsotala.fi/2012/10/technology-will-destroy-human-nature/"
            , "https://keras.io/"
            , "https://kev.town/2013/04/30/why-did-why-the-lucky-stiff-quit/"
            , "https://kk.org/thetechnium/the-shirky-prin/"
            , "https://knightcolumbia.org/content/the-case-for-digital-public-infrastructure"
            , "https://kojimars.at.webry.info/201004/article_16.html"
            , "https://komonews.com/news/local/indictment-washington-teen-drug-dealers-thrived-on-darknet"
            , "https://krebsonsecurity.com/"
            , "https://laion.ai/laion-400-open-dataset/"
            , "https://lavaan.ugent.be/"
            , "https://learning.mpi-sws.org/memorize/"
            , "https://ledger-cli.org/"
            , "https://legacy.imagemagick.org/Usage/crop/#crop"
            , "https://lettersofnote.com/2012/03/28/the-skills-of-leonardo-da-vinci/"
            , "https://lifescivc.com/2011/03/academic-bias-biotech-failures/"
            , "https://lithub.com/here-are-the-biggest-fiction-bestsellers-of-the-last-100-years/?single=true"
            , "https://longitudinal.blog/co2-series-part-2-co2-removal/"
            , "https://longtermrisk.org/the-importance-of-wild-animal-suffering/"
            , "https://lucumr.pocoo.org/2013/7/23/licensing/"
            , "https://magazine.atavist.com/an-arrogant-way-of-killing/"
            , "https://magenta.tensorflow.org/piano-transformer"
            , "https://mailchi.mp/459b1e4f860d/an-152how-weve-overestimated-few-shot-learning-capabilities"
            , "https://mail.haskell.org/pipermail/haskell-cafe/2011-February/089183.html"
            , "https://mail.haskell.org/pipermail/haskell-cafe/2013-April/107389.html"
            , "https://mako.cc/copyrighteous/revisiting-the-rise-and-decline"
            , "https://mason.gmu.edu/~rhanson/greatfilter.html"
            , "https://mathbabe.org/2012/11/20/columbia-data-science-course-week-12-predictive-modeling-data-leakage-model-evaluation/"
            , "https://mathshistory.st-andrews.ac.uk/Extras/Keynes_Newton/"
            , "https://mathworld.wolfram.com/FermatsLastTheorem.html"
            , "https://mattlakeman.org/2020/01/22/the-new-epidemic-my-experience-of-losing-a-friend-to-heroin/"
            , "https://mc-stan.org/"
            , "https://meta.wikimedia.org/wiki/Research:Wiki_Participation_Challenge#Dissemination"
            , "https://meteuphoric.com/2010/08/08/on-the-hostility-of-wives/#comment-1427"
            , "https://web.archive.org/web/20230401050010/https://metropolitician.blogs.com/scribblings_of_the_metrop/2010/06/facebook-taking-over-korea-as-predicted.html"
            , "https://michaelnielsen.org/blog/three-myths-about-scientific-peer-review/"
            , "https://mikepower.pressfolios.com/"
            , "https://milan.cvitkovic.net/writing/things_youre_allowed_to_do/"
            , "https://minimaxir.com/2017/06/imgur-decline/"
            , "https://mitp-content-server.mit.edu/books/content/sectbyfn/books_pres_0/6515/sicp.zip/sicp.html"
            , "https://mkv25.net/dfma/map-8269"
            , "https://mlp.fandom.com/wiki/The_Perfect_Pear"
            , "https://mmlab.ie.cuhk.edu.hk/projects/CelebA.html"
            , "https://mssv.net/2020/08/02/what-args-can-teach-us-about-qanon/"
            , "https://my.pgp-hms.org/users"
            , "https://my.vanderbilt.edu/smpy/publications/camilla-benbow/"
            , "https://nautil.us/will-90-become-the-new-60-235929/"
            , "https://www.nbc-2.com/news/crime/2022/01/04/man-arrested-in-desoto-county-drug-bust-on-new-years-eve"
            , "https://ncase.me/"
            , "https://neurosciencenews.com/brain-connectome-artificial-neural-networks/"
            , "https://newcriterion.com/article/a-good-list/"
            , "https://nickbostrom.com/papers/astronomical-waste/"
            , "https://nintil.com/science-ending-frontier"
            , "https://nootropicsdepot.com/bacopa/"
            , "https://notes.pinboard.in/u:vitorio/05dec9f04909d9b6edff"
            , "https://numinous.productions/ttft/"
            , "https://nunosempere.com/blog/2023/01/30/an-in-progress-experiment-to-test-how-laplace-s-rule-of/"
            , "https://nymag.com/news/features/70830/#print"
            , "https://okmij.org/ftp/Streams.html"
            , "https://ooo.ghostbows.ooo/"
            , "https://originstamp.com/s/7306a744a285474742f4f9ae8ddae8214fb7625348d578fb3077fb0bae92b8f1"
            , "https://orionmagazine.org/article/interviews-with-an-octopus/"
            , "https://orwell.ru/library/articles/nose/english/e_nose"
            , "https://oscarbonilla.com/2009/05/visualizing-bayes-theorem/"
            , "https://ourworldindata.org/happiness-and-life-satisfaction"
            , "https://palmerlab.org/neuroticism-and-depression-gwas-consortium-paper-accepted-for-publication-in-jama-psychiatry-abraham-palmer-harriet-de-wit-and-amy-hart-are-co-authors/"
            , "https://pandoc.org/"
            , "https://papers.ssrn.com/sol3/papers.cfm?abstract_id=3819317"
            , "https://parahumans.wordpress.com/2011/06/21/gestation-1-4/"
            , "https://parametric.press/issue-01/unraveling-the-jpeg/"
            , "https://parti.research.google/"
            , "https://paulfchristiano.com/ea/"
            , "https://penelope.uchicago.edu/hydrionoframes/hydrion.html"
            , "https://people.com/movies/frankie-muniz-memory-loss-doesnt-bother-him/"
            , "https://people.csail.mit.edu/mrub/VisualMic/"
            , "https://people.idsia.ch/~juergen/creativity.html"
            , "https://personalitytest.net/ipip/index.html"
            , "https://personal.math.ubc.ca/~cass/Euclid/byrne.html"
            , "https://petertodd.org/2016/opentimestamps-announcement"
            , "https://philip.greenspun.com/teaching/teaching-software-engineering"
            , "https://plato.stanford.edu/entries/moral-anti-realism/index.html"
            , "https://playground.tensorflow.org/"
            , "https://politicalcalculations.blogspot.com/2011/07/how-much-are-geezers-displacing-teens.html"
            , "https://poniesatdawn.bandcamp.com/album/dreamwalkerstrack/peace-at-last"
            , "https://popcon.ubuntu.com/"
            , "https://proceedings.mlr.press/v119/huang20f.html"
            , "https://progressstudies.school/"
            , "https://projects.jsonline.com/news/2016/12/11/the-price-of-being-wrong.html"
            , "https://projects.tampabay.com/projects/2016/food/farm-to-fable/restaurants/"
            , "https://psychcentral.com/pro/sparlon-and-adhd-the-power-of-a-7-year-old/002889.html"
            , "https://psych.hanover.edu/JavaTest/CLE/Cognition/Cognition/MentalRotation.html"
            , "https://psychonautwiki.org/wiki/Wake_initiated_lucid_dream"
            , "https://publishing.cdlib.org/ucpressebooks/view?docId=ft8489p25j&chunk.id=d0e2683&toc.id=d0e2575&brand=eschol"
            , "https://pudding.cool/2021/03/love-and-ai/"
            , "https://pytorch.org/"
            , "https://qualiacomputing.com/2019/11/15/break-out-of-the-simulation-day-televised-entity-contact-injection-pulling-experiments-and-the-brain-as-a-game-engine/"
            , "https://quantifiedself.com/blog/spaced-repetition-and-learning/"
            , "https://quantum.country/qcvc"
            , "https://queue.acm.org/detail.cfm?ref=rss&id=2856460"
            , "https://quillette.com/2021/11/29/the-universal-structure-of-storytelling/"
            , "https://qwantz.com/index.php?comic=2366"
            , "https://racket-lang.org/"
            , "https://radiolab.org/podcast/122291-in-running/transcript"
            , "https://ralphmerkle.com/cryo/techFeas.html"
            , "https://rationality.org/"
            , "https://rdiff-backup.net/"
            , "https://read-the-samples.netlify.app/sample_1353/"
            , "https://reflectivedisequilibrium.blogspot.com/"
            , "https://replicationindex.com/"
            , "https://retractionwatch.com/2014/07/08/sage-publications-busts-peer-review-and-citation-ring-60-papers-retracted/"
            , "https://ricon.dev/"
            , "https://rjlipton.com/2014/07/21/shifts-in-algorithm-design/"
            , "https://rjlipton.com/the-gdel-letter/"
            , "https://blog.rootsofprogress.org/nuclear-physics"
            , "https://row1.ca/pixels-and-their-neighbors"
            , "https://safebooru.org/index.php?page=post&s=list&tags=heterochromia"
            , "https://samoburja.com/the-youtube-revolution-in-knowledge-transfer/"
            , "https://scale.com/blog/chatgpt-vs-claude"
            , "https://scarybeastsecurity.blogspot.com/2016/11/0day-exploit-compromising-linux-desktop.html"
            , "https://scholars-stage.org/reflections-on-chinas-stalinist-heritage-ii-just-how-totalitarian-is-modern-china/"
            , "https://schoolgirlmilkycrisis.com/2011/10/10/get-lost/#comment-236173"
            , "https://sciencebasedmedicine.org/antioxidants-and-exercise-more-harm-than-good/"
            , "https://sciencebulletin.org/archives/9946.html"
            , "https://scottaaronson.blog/?p=346"
            , "https://seths.blog/2005/03/dont_shave_that/"
            , "https://sevensecularsermons.org/about/"
            , "https://sf-encyclopedia.com/entry/smith_cordwainer"
            , "https://shkspr.mobi/blog/2013/03/preparing-for-the-collapse-of-digital-civilization/"
            , "https://sifter.org/iqtest/"
            , "https://signalvnoise.com/posts/2942-exit-interview-founders-look-back-at-acquisitions-by-google-aol-microsoft-and-more"
            , "https://slatestarcodex.com/2015/09/23/vegetarianism-for-meat-eaters/"
            , "https://slimemoldtimemold.com/2022/01/27/like-a-lemon-to-a-lime-a-lime-to-a-lemon/"
            , "https://socghop.appspot.com/gsoc/student_project/show/google/gsoc2009/haskell/t124022467805"
            , "https://socialsciences.mcmaster.ca/econ/ugcm/3ll3/menger/money.txt"
            , "https://soranews24.com/2019/02/14/video-shows-off-hundreds-of-beautiful-ai-created-anime-girls-in-less-than-a-minute%E3%80%90video%E3%80%91/"
            , "https://spikejapan.wordpress.com/about/"
            , "https://sites.temple.edu/immerman/address-to-the-nation-on-national-security-by-president-ronald-reagan-march-23-1983/"
            , "https://srconstantin.wordpress.com/2014/05/07/beyond-the-one-percent-categorizing-extreme-elites/"
            , "https://sre.google/sre-book/eliminating-toil/"
            , "https://status451.com/2017/01/20/days-of-rage/"
            , "https://stephenmalina.com/post/2021-07-01-energetic-aliens-among-us/"
            , "https://stevenson.lab.uconn.edu/scaling/"
            , "https://story.californiasunday.com/cosmic-crisp-apple-launch/"
            , "https://stratechery.com/2019/the-google-squeeze/"
            , "https://strategy.wikimedia.org/wiki/Editor_Trends_Study/Results#Cohort_Analysis"
            , "https://svilentodorov.xyz/blog/gpt-15b-chat-finetune/"
            , "https://synapse.koreamed.org/articles/1101514"
            , "https://taooftea.com/product/frozen-summit/"
            , "https://stats.grok.se/en/201109/Talk%3ABarack_Obama"
            , "https://teageegeepea.tripod.com/maumau.html"
            -- , "https://texample.net/tikz/examples/hydrogen-splitting/"
            , "https://text.npr.org/974534021"
            , "https://thebaffler.com/latest/stick-to-the-plan-james"
            , "https://thebrowser.com/"
            , "https://thegrandnarrative.com/about-2/"
            , "https://thehardestscience.com/2011/09/29/does-psilocybin-cause-changes-in-personality-maybe-but-not-so-fast/"
            , "https://thelastpsychiatrist.com/2011/09/how_to_be_mean_to_your_kids.html"
            , "https://the-liliquarium.livejournal.com/1482.html"
            , "https://thenewstatistics.com/itns/2018/04/03/weve-been-here-before-the-replication-crisis-over-the-pygmalion-effect/"
            , "https://gwern.net/doc/fiction/humor/2013-09-03-danielmalleryortberg-thetoast-anotheremptylifelessplanetfound.html"
            , "https://thisanimedoesnotexist.ai/"
            , "https://thisrentaldoesnotexist.com/"
            , "https://thoughtcrime.crummy.com/2009/Error.html"
            , "https://threadreaderapp.com/thread/1187161460033458177.html"
            , "https://time.com/time/printout/0,8816,1893946,00.html"
            , "https://tomcritchlow.com/2020/06/09/quotebacks/"
            , "https://tosche.net/blog/ink-traps-and-pals"
            , "https://training.kalzumeus.com/newsletters/archive/saas_pricing"
            , "https://transformer-circuits.pub/2021/framework/index.html#anthropic"
            , "https://trixter.oldskool.org/2014/06/19/8088-domination-post-mortem-part-1/"
            , "https://tug.org/FontCatalogue/otherfonts.html#initials"
            , "https://unenumerated.blogspot.com/2011/05/bitcoin-what-took-ye-so-long.html"
            , "https://unqualified-reservations.blogspot.com/2008/01/how-i-stopped-believing-in-democracy.html"
            , "https://unsongbook.com/chapter-4-tools-were-made-and-born-were-hands/"
            , "https://vasilishynkarenka.com/gpt-3/"
            , "https://vastabrupt.com/2018/08/07/time-war-briefing-for-neolemurian-agents/"
            , "https://vast.ai/"
            , "https://vdfresearch.org/"
            , "https://venturebeat.com/2017/10/01/globalfoundries-next-generation-chip-factories-will-cost-at-least-10-billion/view-all/"
            , "https://vfxblog.com/2017/08/23/the-tech-of-terminator-2-an-oral-history/"
            , "https://vinoshipper.com/shop/silver_hand_meadery/raspberry_passion_22,497"
            , "https://warontherocks.com/2021/08/foreign-fighters-and-cheese-bells/"
            , "https://washingtonmonthly.com/features/2007/0709.careycascadia.html"
            , "https://w.atwiki.jp/toho/pages/727.html"
            , "https://wavemotioncannon.com/2017/01/03/yoh-yoshinari-interview-animestyle-032013-part-33/"
            , "https://web.archive.org/web/20100126083055/https://www.unc.edu/courses/2008spring/psyc/270/001/counterbalancing.html"
            , "https://web.archive.org/web/20140314232216/https://www.zeit.de/2014/12/drogenhandel-silk-road-pfandleiher"
            , "https://web.archive.org/web/20150211211107/https://support.google.com/news/answer/1638638"
            , "https://web.archive.org/web/20150816235023/https://www.thedenverchannel.com/news/colorado-springs-area/air-force-academy-cadet-3rd-class-nathaniel-penalosa-accused-of-using-and-distributing-drugs-on-base"
            , "https://web.archive.org/web/20160205133519/https://www.baka-tsuki.org/project/index.php?title=Utsuro_no_Hako:Volume_1"
            , "https://web.archive.org/web/20171020041641/http://nitro.biosci.arizona.edu/zbook/NewVolume_2/newvol2.html"
            , "https://web.archive.org/web/20190415123208/https://thiscardoesnotexist.glitch.me/"
            , "https://web.archive.org/web/20230604002332/https://thiseyedoesnotexist.com/story/"
            , "https://webcitation.org/5mYown8VS"
            , "https://web.media.mit.edu/~minsky/papers/Why%20programming%20is--.html"
            , "https://what-if.xkcd.com/76/"
            , "https://whyevolutionistrue.com/2018/03/04/a-human-chimera/"
            , "https://wiki.archiveteam.org/index.php/Google_Reader"
            , "https://wiki.haskell.org/index.php?title=&search=&fulltext=Search"
            , "https://foundation.wikimedia.org/wiki/Archive:Planned_Spending_Distribution_2008-2009"
            , "https://writeswith.com/"
            , "https://writings.stephenwolfram.com/2012/03/the-personal-analytics-of-my-life/"
            , "https://www.aboutamazon.com/news/company-news/2016-letter-to-shareholders"
            , "https://www.adamsmith.org/research/back-in-the-ussr"
            , "https://www.adelaidenow.com.au/news/south-australia/man-arrested-after-220000-worth-of-wizard-drug-25inbome-intercepted/story-fni6uo1m-1227075205971"
            , "https://www.aging-us.com/article/100415/text"
            , "https://www.aiweirdness.com/this-is-the-openai-api-it-makes-spookily-20-06-11/"
            , "https://www.alexirpan.com/2015/09/24/how-an-audio-play-about-a-time-traveling-pony-turned-me-into-a-fanboy.html"
            , "https://www.alicemaz.com/writing/minecraft.html"
            , "https://www.alignmentforum.org/posts/Haawpd5rZrzkzvYRC/an-162-foundation-models-a-paradigm-shift-within-ai"
            , "https://www.allencheng.com/starting-a-business-around-gpt-3-is-a-bad-idea/"
            , "https://www.antipope.org/charlie/blog-static/2011/08/usenix-2011-keynote-network-se.html"
            , "https://archive-it.org/"
            , "https://www.artnome.com/news/2019/3/27/why-is-ai-art-copyright-so-complicated"
            , "https://www.baka-tsuki.org/project/index.php?title=Interview_with_Tanigawa_Nagaru"
            , "https://www.baltimoresun.com/2013/11/07/silk-road-employee-pleads-guilty-in-maryland/"
            -- , "https://www.becker-posner-blog.com/2006/12/charitable-foundations--posners-comment.html" -- spoofing fake 403 errors
            , "https://www.belfasttelegraph.co.uk/news/republic-of-ireland/article30724056.ece"
            , "https://www.bemmu.com/first-year-of-candy-japan"
            , "https://www.benkuhn.net/11/"
            , "https://www.bitsaboutmoney.com/archive/financial-innovation-is-happening/"
            , "https://www.bostonglobe.com/ideas/2014/03/15/the-poor-neglected-gifted-child/rJpv8G4oeawWBBvXVtZyFM/story.html"
            , "https://www.brainpreservation.org/?path=prize"
            , "https://www.brookings.edu/articles/federal-programs-for-youth-more-of-the-same-wont-work/"
            , "https://www.bu.edu/globalbeat/nuclear/Kristensen1097.html"
            , "https://www.buzzricksons.jp/"
            , "https://www.c82.net/euclid/"
            , "https://www.candyjapan.com/results-from-box-design-ab-test"
            , "https://www.catalogtree.net/about"
            , "https://www.cato-unbound.org/2007/09/10/robin-hanson/cut-medicine-half/"
            , "https://www.cbsnews.com/news/food-prices-increase-most-in-36-years/"
            , "https://www.cdc.gov/trendstatement/"
            , "https://www.chicagotribune.com/1989/02/28/booze-and-the-muse/"
            , "https://www.chrisplaysgames.com/gadgets/2019/02/25/how-i-learned-to-stop-worrying-and-love-transfer-learning/"
            , "https://www.chrisstucchio.com/blog/2014/equal_weights.html"
            , "https://www.cleveland.com/lifestyles/2008/01/some_girl_scout_cookies_change.html"
            , "https://www.cnn.com/2009/WORLD/asiapcf/06/05/japan.herbivore.men/index.html"
            , "https://www.coderelay.io/fontemon.html"
            , "https://www.cogmed.com/"
            , "https://www.collectorsweekly.com/articles/cast-iron-doorstops/"
            , "https://www.couriermail.com.au/news/queensland/gladstone/gladstone-man-arrested-in-worldwide-firearms-bust/news-story/f5bd03cfa834aad581b828fba8c07af2"
            , "https://www.cryonicscalculator.com/"
            , "https://www.cs.dartmouth.edu/~sergey/wm/"
            , "https://www-cs-faculty.stanford.edu/~knuth/faq.html"
            , "https://www.cs.odu.edu/~mln/pubs/widm-2006/lazyp-widm06.pdf"
            , "https://www.cs.toronto.edu/~kriz/cifar.html"
            , "https://www.cs.virginia.edu/~robins/YouAndYourResearch.html"
            , "https://www.cylab.cmu.edu/"
            , "https://www.daemonology.net/blog/2011-06-03-insecurity-in-the-jungle.html"
            , "https://www.dafont.com/deutsche-zierschrif.font"
            , "https://www.dailydot.com/unclick/dark-web-black-market-reloaded-adam-bunger-gun-sales-arrest/"
            , "https://www.dailymail.co.uk/health/article-2126761/Bertold-Wiesner-British-scientist-fathered-600-children-donating-sperm-fertility-clinic.html"
            , "https://www.dartmouth.edu/~milton/reading_room/conscience/text.shtml"
            , "https://www.deeplearningbook.org/contents/rnn.html"
            , "https://www.deseret.com/1995/7/20/19183190/teller-regrets-failure-to-seek-a-demonstration-option/"
            , "https://www.discoverteas.com/246/218/tea/oolong-teas/p-glenburn-moonshine-oolong"
            , "https://www.doc88.com/p-397166703921.html"
            , "https://www.drmaciver.com/2019/05/how-to-do-hard-things/"
            , "https://www.e-codices.unifr.ch/en/vad/0296/093v"
            , "https://www.ecologyandsociety.org/vol9/iss1/art6/main.html"
            , "https://www.econlib.org/archives/2012/03/the_roots_of_le.html"
            , "https://www.economist.com/science-and-technology/2009/04/08/wired?story_id=13437729"
            , "https://www.econtalk.org/matt-ridley-on-how-innovation-works/"
            , "https://www.edwardtufte.com/bboard/q-and-a-fetch-msg?msg_id=0003wk#bboard_content"
            , "https://www.equator-network.org/reporting-guidelines/"
            , "https://www.equestriadaily.com/search/label/Music"
            , "https://www.eugenewei.com/blog/2017/5/11/jpeg-your-ideas"
            , "https://www.evamonkey.com/ask-john/has-evangelion-influenced-contemporary-gundam-anime.php"
            , "https://www.explainxkcd.com/wiki/index.php/Randall"
            , "https://www.fadedpage.com/link.php?file=20160325.html#Page_107"
            , "https://www.fast.ai/2018/08/10/fastai-diu-imagenet/"
            , "https://www.fhi.ox.ac.uk/"
            , "https://www.filfre.net/2020/01/master-of-orion/"
            , "https://www.find-more-books.com/"
            , "https://www.freakonomicsexperiments.com/"
            , "https://www.ft.com/content/da7b86a3-a8a7-4a0b-a26f-38abda7e7f86"
            , "https://gawker.com/5926440/are-authorities-closing-in-on-the-online-drug-market-silk-road"
            , "https://www.genealogy.math.ndsu.nodak.edu/id.php?id=42477"
            , "https://www.ghibli.jp/kazetachinu/character.html"
            , "https://www.globalsecurity.org/wmd/world/russia/arzamas_nuc.htm"
            , "https://www.gnxp.com/WordPress/2017/12/12/most-people-say-they-think-nurture-is-more-important-than-nature-especially-white-americans/"
            , "https://www.gq.com/story/fake-hitman-murder-for-hire"
            , "https://www.grandforksherald.com/news/crime-and-courts/3704033-oregon-man-indicted-fatal-grand-forks-overdose-case"
            , "https://www.gutenberg.org/files/5978/5978-h/5978-h.htm#c15"
            , "https://www.harrowell.org.uk/blog/2018/01/31/in-the-eternal-inferno-fiends-torment-ronald-coase-with-the-fate-of-his-ideas/"
            , "https://www.heraldsun.com.au/news/law-order/man-faces-jail-after-2700-drug-tablets-on-notorious-site-silk-road/news-story/4ec3a87919d9d591057f3d7494336dd0"
            , "https://www.hsx.com/security/feature.php?type=opening"
            , "https://www.html-tidy.org/"
            , "https://humanprogress.org/"
            , "https://www.independent.ie/irish-news/suspected-online-international-drugs-ring-smashed-by-gardai/30724000.html"
            , "https://www.infranken.de/lk/forchheim/im-darknet-mit-drogen-gehandelt-kripo-entlarvt-neun-maenner-aus-franken-art-1355609"
            , "https://www.inkandswitch.com/index.html"
            , "https://www.intechopen.com/source/html/17370/media/image3.jpeg"
            , "https://www.itmedia.co.jp/news/articles/1711/28/news020.html"
            , "https://www.jamesfadiman.com/"
            , "https://www.japaninc.com/cpj/magazine/issues/1998/mar98/ohsuga.html"
            , "https://www.jdmoyer.com/2010/03/04/sleep-experiment-a-month-with-no-artificial-light/"
            , "https://www.jefftk.com/p/breaking-down-cryonics-probabilities"
            , "https://www.joelonsoftware.com/2000/11/22/20001122/"
            , "https://www.johndcook.com/blog/2011/11/22/norris-number/"
            , "https://www.johnsonessays.com/the-rambler/no-21-the-anxieties-of-literature-not-less-than-those-of-publick-stations-the-inequality-of-authors-writings/"
            , "https://www.justinpinkney.com/blog/2020/stylegan-network-blending/"
            , "https://www.kalzumeus.com/2012/08/13/doubling-saas-revenue/"
            , "https://www.kooslooijesteijn.net/blog/semantic-sidenotes"
            , "https://www.lehighvalleylive.com/bethlehem/2015/02/west_bethlehem_drugraid_prompt.html"
            , "https://www.lesswrong.com/posts/GytPrQ9cT46k9etoz/living-forever-is-hard-or-the-gompertz-curve"
            , "https://www.lesswrong.com/posts/wTKjRFeSjKLDSWyww/possible-takeaways-from-the-coronavirus-pandemic-for-slow-ai"
            , "https://www.lesswrong.com/tag/adding-up-to-normality"
            , "https://web.archive.org/web/20241007111601/https://www.livestrong.com/article/283811-vitamin-d-deficiency-heart-palpitations/"
            , "https://www.mail-archive.com/cryptography@metzdowd.com/msg09975.html"
            , "https://www.math.uwaterloo.ca/tsp/pla85900/index.html"
            -- , "https://www.mattridley.co.uk/blog/the-wealth-of-urban-biodiversity/"
            , "https://www.mcall.com/2016/05/06/esu-student-busted-buying-lsd-on-the-dark-web-police-say/"
            , "https://www.mediawiki.org/wiki/Multilingual_MediaWiki"
            , "https://www.mentalfloss.com/article/94569/clair-patterson-scientist-who-determined-age-earth-and-then-saved-it"
            , "https://www.mercurynews.com/2016/01/27/san-jose-former-postal-inspector-to-serve-3-years-for-possessing-stolen-mail-marijuana-trafficking/"
            , "https://www.metafilter.com/91797/working-working-memory-with-dual-nback#3108845"
            , "https://www.metopera.org/season/in-cinemas/2019-20-season/akhnaten-live-in-hd/"
            , "https://www.metzdowd.com/pipermail/cryptography/2015-January/024433.html"
            -- , "https://www.miamiherald.com/news/local/community/miami-dade/article199044679.html"
            , "https://www.microdose.me/"
            , "https://www.motherjones.com/politics/2016/06/cca-private-prisons-corrections-corporation-inmates-investigation-bauer/"
            , "https://www.nationalgeographic.com/magazine/article/evolution-genetics-medicine-brain-technology-cyborg"
            , "https://www.nbcnews.com/storyline/isis-terror/isis-head-baghdadi-wife-fell-love-line-say-sources-n260291"
            , "https://www.newsday.com/news/region-state/robert-c-cardillo-jr-picked-up-12-pounds-of-pot-worth-50-000-from-post-office-cops-say-a50126"
            , "https://www.nextbigfuture.com/2011/03/global-health-risks.html"
            , "https://www.nextplatform.com/2019/08/20/big-blue-open-sources-power-chip-instruction-set/"
            , "https://www.noisebridge.net/wiki/Compass_Vibro_Anklet"
            , "https://www.nplusonemag.com/issue-3/reviews/adventures-of-a-man-of-science/"
            , "https://www.npr.org/sections/alltechconsidered/2017/06/08/531796329/eager-to-burst-his-own-bubble-a-techie-made-apps-to-randomize-his-life"
            , "https://www.nps.gov/subjects/bears/safety.htm"
            , "https://www.nydailynews.com/2016/09/20/texas-man-arrested-after-dark-web-attempt-to-buy-explosives-and-blow-up-building/"
            , "https://www.ohyouprettythings.com/free"
            , "https://www.orbuch.com/nets-reading-list/"
            , "https://www.oregonlive.com/portland/2015/08/players_in_biggest_silk_road_m.html"
            , "https://www.oricon.co.jp/news/2075319/full/"
            , "https://www.orlandosentinel.com/2015/02/16/ucf-student-had-marijuana-shipped-to-campus-apartment-cops-say/"
            , "https://www.owenstephens.co.uk/blog/2011/09/03/gsoc_darcs_bridge__results.html"
            , "https://www.palladiummag.com/2018/11/29/a-week-in-xinjiangs-absolute-surveillance-state/"
            , "https://www.pcmag.com/archive/how-a-chip-fab-is-built-249666"
            , "https://www.pewresearch.org/social-trends/2012/02/16/the-rise-of-intermarriage/"
            , "https://www.poetryfoundation.org/poems/45173/jubilate-agno"
            , "https://www.popsci.com/woolly-mammoth-dna-brought-life-elephant-cells/"
            , "https://www.pragmatic.ml/a-survey-of-methods-for-incorporating-long-term-context/"
            , "https://www.princeton.edu/~graphicarts/2012/04/feuillets_dart.html"
            , "https://www.prolific.com/"
            , "https://www.psychiatryinvestigation.org/journal/view.php?number=865"
            , "https://www.punchlinedesign.net/pun_generator"
            , "https://www.r-bloggers.com/2014/01/visualization-series-using-scatterplots-and-models-to-understand-the-diamond-market-so-you-dont-get-ripped-off/"
            , "https://www.rdocumentation.org/packages/EnvStats/versions/2.1.0/topics/evNormOrdStats"
            -- , "https://www.reg.ru/blog/anime-generation-with-stylegan/" -- bizarre infinite-redirect-loop problem only with curl
            , "https://www.richardcarrier.info/archives/14522"
            , "https://www.rifters.com/crawl/?p=791"
            , "https://www.ruder.io/recent-advances-lm-fine-tuning/"
            , "https://www.rwagner.net/libretti/parsifal/e-pars-a3.html"
            , "https://www.rxshop.md/products/antinarcoleptic/buy-modafinil-online-order-modvigil/"
            -- , "https://www.sacbee.com/news/local/crime/article2598075.html"
            , "https://www.salon.com/2007/04/12/castaneda/"
            , "https://news.sankakucomplex.com/2011/11/01/which-are-worse-the-seiyuu-or-their-creepy-fans/"
            , "https://www.sapa-project.org/"
            , "https://www.schneier.com/blog/archives/2008/10/the_seven_habit.html"
            , "https://www.scielo.br/j/rbp/a/fCXVCnz7PGRpbwNgX6DkJwC/?format=pdf"
            , "https://www.sciencenews.org/view/generic/id/65600/title/Fish_oil_fails_to_hold_off_heart_arrhythmia"
            , "https://www.scottaaronson.com/democritus/"
            , "https://www.sfgate.com/news/article/viral-video-bear-dogs-terriers-california-home-16104193.php"
            , "https://www.shawlocal.com/northwest-herald/2016/06/27/kane-county-sheriffs-deputy-wife-of-ex-mchenry-county-undersheriff-faces-drug-charges/axibe17/"
            , "https://www.shawwn.com/swarm"
            , "https://www.simplify.so/"
            , "https://www.sirlin.net/articles/playing-to-win"
            , "https://www.slate.com/articles/health_and_science/the_mouse_trap/2011/11/lab_mice_are_they_limiting_our_understanding_of_human_disease_.html"
            , "https://www.snpedia.com/index.php/Genomes"
            , "https://www.spiegel.de/panorama/ermittler-zerschlagen-internationalen-drogenring-a-910221.html"
            , "https://www.spiked-online.com/2014/11/18/a-colourful-history-of-progress/"
            , "https://www.spring.org.uk/2014/11/autism-new-studies-identify-dozens-more-associated-genes.php"
            , "https://www.sqlite.org/fasterthanfs.html"
            , "https://researchers.wls.wisc.edu/about/history/"
            , "https://www.standard.co.uk/news/crime/drugdealing-prison-librarian-bought-gun-on-the-dark-web-a3259961.html"
            , "https://www.straighttalkonevidence.org/2017/09/22/disappointing-findings-on-conditional-cash-transfers-as-a-tool-to-break-the-poverty-cycle-in-the-united-states/"
            , "https://www.stripes.com/news/pet-cloning-lab-in-s-korea-starts-military-dog-program-1.425640"
            , "https://www.stuff.co.nz/national/crime/10232509/Doing-time-for-drugs-bought-online"
            , "https://www.sumsar.net/blog/2015/04/the-non-parametric-bootstrap-as-a-bayesian-model/"
            , "https://www.sun-modalert.com/faq.php#shipping"
            , "https://www.syracuse.com/crime/2015/05/cops_seize_809_pills_170k_in_cash_in_raid_suny_oswego_student_charged.html"
            , "https://www.systutorials.com/docs/linux/man/1-midi2abc/"
            , "https://talyarkoni.org/blog/2011/01/10/the-psychology-of-parapsychology-or-why-good-researchers-publishing-good-articles-in-good-journals-can-still-get-it-totally-wrong/"
            , "https://www.thebeliever.net/oulipo-ends-where-the-work-begins/"
            , "https://www.thecut.com/2019/05/the-tinder-hacker.html"
            , "https://www.thefreelibrary.com/Sleep+debt+exacts+deceptive+cost.+%28Behavior%29.-a0100110931"
            , "https://www.theindiaforum.in/article/revolt-upper-castes"
            , "https://www.themtank.org/a-year-in-computer-vision"
            , "https://www.theregister.com/2001/01/10/nsa_runs_best_fab/"
            , "https://www.thestranger.com/features/2012/11/21/15337239/the-lying-disease"
            , "https://www.thisfursonadoesnotexist.com/"
            , "https://www.thisworddoesnotexist.com/"
            , "https://www.thriftbooks.com/"
            , "https://www.tranquiltuesdays.com/product/white-peony-white-tea/"
            , "https://www.trentonbricken.com/Tail-Free-Sampling/"
            , "https://www.trubrain.com/"
            , "https://www.tt-forums.net/viewtopic.php?f=29&t=37902&view=print"
            , "https://www.ubu.com/concept/racter.html"
            , "https://www.uk-anime.net/articles/The_Takeshi_Honda_interview/3"
            , "https://www.uliwestphal.de/elephas-anthropogenus/index.html"
            , "https://www.unicode.org/history/publicationdates.html"
            , "https://www.unqualified-reservations.org/2007/08/james-burnhams-dante-politics-as-wish/"
            , "https://www.unz.com/gnxp/the-cost-of-inbreeding-in-terms-of-health/"
            -- , "https://www.urbandictionary.com/define.php?term=Death%20flag" -- bizarre infinite-redirect issue in curl
            -- , "https://www.usnews.com/news/articles/2015/05/29/fewer-pot-packages-found-in-mail-as-legalization-takes-hold"
            , "https://www.vanityfair.com/culture/2010/02/exile-201002"
            , "https://www.vesta.earth/"
            , "https://www.vocativ.com/interactive/underworld/drugs/darknet-arrests-map/"
            , "https://www.wakapoetry.net/mys-viii-1426/"
            -- , "https://www.washingtontimes.com/news/2018/jun/2/minnesota-girl-who-cant-feel-pain-battles-insuranc/" -- spoofing fake 403 errors
            , "https://www.webmd.com/prostate-cancer/news/20090324/fatty-fish-may-cut-prostate-cancer-risk"
            , "https://www.wheels.org/spacewar/stone/rolling_stone.html"
            , "https://www.whichfaceisreal.com/"
            , "https://www.winehq.org/pipermail/wine-devel/2002-February/003912.html"
            , "https://www.wired.com/story/sleep-no-more-crusade-genetic-killer/"
            , "https://www.wired.com/story/lsd-microdosing-drugs-silicon-valley/"
            , "https://www.wolfewiki.com/pmwiki/pmwiki.php?n=WolfeWiki.Introduction"
            , "https://www.writingroutines.com/routines/"
            , "https://www.yalelawjournal.org/note/amazons-antitrust-paradox"
            , "https://www.yourdictionary.com/articles/examples-acrostic-poems"
            , "https://www.youtube.com/embed/gaMuet_ibWE"
            , "https://www.yudkowsky.net/"
            , "https://xkcd.com/481/"
            -- , "https://xtools.wmcloud.org/pages/en.wikipedia.org/Rhwawn"
            , "https://zlkj.in/"
            , "https://timetravel.mementoweb.org/"
            , "https://videolectures.net/videos/rldm2015_silver_reinforcement_learning"
            , "https://www6.austlii.edu.au/cgi-bin/viewdoc/au/cases/vic/VSCA/2015/35.html"
            , "https://www.abcb.com/newspaper/1999-12-30_asahi_01.htm"
            , "https://www.aleph.se/andart/archives/2012/09/flaws_in_the_perfection.html"
            , "https://www.alessonislearned.com/index.php?comic=14"
            , "https://www.chinadaily.com.cn/opinion/2011-09/17/content_13725092.htm"
            , "https://www.cjas.org/~leng/anno-ikuhara.txt"
            , "https://www.culhwch.info/index.html#footnote349-ref"
            , "https://www.davidbordwell.net/blog/2012/02/13/pandoras-digital-box-pix-and-pixels/"
            , "https://www.davidbrin.com/starwarsontrial.html"
            , "https://www.galbithink.org/names/agnames.htm"
            , "https://www.koreatimes.co.kr/www/news/nation/2008/05/117_24521.html"
            , "https://www.metafor-project.org/doku.php"
            , "https://www.michaellight.net/suns-intro/"
            , "https://www.moserware.com/2008/04/towards-moores-law-software-part-3-of-3.html"
            , "https://www.nyaa.eu/?page=torrentinfo&tid=255825"
            , "https://www.rfreitas.com/Astro/Xenopsychology.htm"
            , "https://www.righto.com/2015/11/macbook-charger-teardown-surprising.html#ref8"
            , "https://www.sciencemadness.org/talk/viewthread.php?tid=6401"
            , "https://www.tarsnap.com/scrypt.html"
            , "https://www.thesmokinggun.com/documents/silk-road-dealer-cooperating-567432"
            , "https://www.tlmc.eu/"
            , "https://tomodachi.de/"
            , "https://www.urbandharma.org/udharma4/mpe.html"
            , "https://www.vetta.org/2009/12/tick-tock-tick-tock-bing/"
            , "https://dialnet.unirioja.es/descarga/articulo/6084963.pdf"
            , "https://ai.stanford.edu/blog/in-context-learning/"
            , "https://alexdanco.com/2019/11/27/the-social-subsidy-of-angel-investing/"
            , "https://andyljones.com/"
            , "https://bayesianinvestor.com/amm/"
            , "https://blog.samaltman.com/black-swan-seed-rounds"
            , "https://books.worksinprogress.co/book/maintenance-of-everything/communities-of-practice/the-soul-of-maintaining-a-new-machine/1"
            , "https://carryiton.net/chain-letter/TOOMCL.html"
            , "https://colinraffel.com/"
            , "https://conversationswithtyler.com/episodes/fareed-zakaria/"
            , "https://cs.nyu.edu/~davise/papers/GPT3CompleteTests.html"
            , "https://danijar.com/project/director/"
            , "https://dataverse.harvard.edu/dataset.%C3%97html?persistentId=doi:10.7910/DVN/MVDWCS"
            , "https://geminiprotocol.net/docs/best-practices.gmi"
            , "https://gigamonkeys.com/"
            , "https://internetshakespeare.uvic.ca/doc/Ham_F1/complete/index.html"
            , "https://jack-clark.net/"
            , "https://maggieappleton.com/bidirectionals"
            , "https://nlp.stanford.edu/sentiment/index.html"
            , "https://ocw.mit.edu/courses/18-01sc-single-variable-calculus-fall-2010/"
            , "https://oeis.org/"
            , "https://paulgraham.com/airbnbs.html"
            , "https://psychclassics.yorku.ca/Ebbinghaus/index.htm"
            , "https://senseis.xmp.net/?Dame"
            , "https://verdagon.dev/blog/linear-types-borrowing"
            , "https://waitbutwhy.com/2017/03/elon-musk-post-series.html"
            , "https://wordcraft-writers-workshop.appspot.com/"
            , "https://www.centauri-dreams.org/2006/11/24/barnards-star-and-the-wait-equation/"
            , "https://www.cerebras.net/blog/beyond-ai-for-wafer-scale-compute-setting-records-in-computational-fluid-dynamics/"
            , "https://www.cognition.ai/"
            , "https://www.cryonicsarchive.org/library/chemical-brain-preservation/"
            , "https://www.cs.cmu.edu/~./yiming/"
            , "https://www.feynmanlectures.caltech.edu/II_09.html"
            , "https://www.folger.edu/explore/shakespeares-works/hamlet/read/"
            , "https://www.hustwit.com/"
            , "https://www.icpsr.umich.edu/web/ICPSR/studies/37932"
            , "https://www.mattridley.co.uk/blog/gene-editing-and-eugenics/"
            , "https://www.semafor.com/article/01/09/2023/microsoft-eyes-10-billion-bet-on-chatgpt"
            , "https://www.spencergreenberg.com/"
            , "https://www8.austlii.edu.au/cgi-bin/viewdoc/au/cases/vic/VCC/2013/70.html"
            , "https://dynomight.net/automated/"
            , "https://sander.ai/2020/09/01/typicality.html"
            , "https://www.chiark.greenend.org.uk/~martinh/poems/complete_housman.html"
            , "https://acoup.blog/2020/06/19/collections-the-battle-of-helms-deep-part-viii-the-mind-of-saruman/"
            , "https://ea.greaterwrong.com/posts/123z5mgQdiv57wabc/ingredients-for-creating-disruptive-research-teams?format=preview&theme=classic"
            , "https://arbital.greaterwrong.com/p/fake_url/?format=preview&theme=classic"
            ]

badLinks =  setLike ["https://1d4chan.org/wiki/Tale_of_an_Industrious_Rogue,_Part_I"
            , "http://2chan.us/wordpress/2012/07/12/c82-genre-stats/"
            , "https://ascii.textfiles.com/archives/1717"
            , "https://augmentingcognition.com/ltm.html"
            , "http://aurellem.org/vba-clojure/html/total-control.html"
            , "http://bactra.org/weblog/algae-2012-09.html"
            , "https://bakabt.me/torrent/159362/umineko-no-naku-koro-ni-music-collection-flac.html"
            , "http://bastiat.org/en/twisatwins.html"
            , "http://betsofbitco.in/list?status=available&category=All&sorting=-moderationTime"
            , "http://bit-player.org/2021/three-months-in-monte-carlo"
            , "http://blog.dansimons.com/2013/03/what-effect-size-would-you-expect.html"
            , "http://blog.darcs.net/2010/11/coming-in-darcs-28-new-features.html"
            , "http://blog.platypope.org/2012/4/5/restore-features/"
            , "http://blog.sigfpe.com/2012/12/shuffles-bayes-theorem-and-continuations.html"
            , "https://boinngerionn.blog.fc2.com/blog-entry-203.html"
            , "https://bugs.darcs.net/issue346"
            , "https://buttercupfestival.com/green/index.htm"
            , "http://catb.org/~esr/writings/taoup/html/ch05s01.html"
            , "https://catless.ncl.ac.uk/risks/16.41.html"
            , "http://chronopause.com/chronopause.com/index.php/2011/02/11/thus-spake-curtis-henderson-part-5/"
            , "http://clickotron.com/"
            , "http://colab.research.google.com/"
            , "https://danfrank.ca/the-most-loved-and-hated-classics-according-to-goodreads-users/"
            , "https://darcs.net/GSoC/2010-Cache"
            , "https://darkdata.illinois.edu/"
            , "https://darwin-online.org.uk/content/frameset?pageseq=1&itemID=F1548.1&viewtype=text"
            , "http://dev.kanotype.net:8003/deepdanbooru/"
            , "https://duplicity.nongnu.org/"
            , "http://eepurl.com/cGAN7L"
            , "https://eprints.lincoln.ac.uk/id/eprint/1932/1/MetaAnalysisPaper.pdf"
            , "http://eprints.nottingham.ac.uk/439/1/Willmot_NO_synthase_JFRBM.pdf"
            , "http://esr.ibiblio.org/?p=7183"
            , "http://eurfa.org.uk/pangur_ban.php"
            , "https://eztest.com/ez-test-tubes/"
            , "https://feeds.feedburner.com/longbets"
            , "http://folding.stanford.edu/English/FAQ-Diseases"
            , "https://ftp.cs.ucla.edu/pub/stat_ser/r414.pdf"
            , "http://gainax.fr/"
            , "http://geneatlas.roslin.ed.ac.uk/"
            , "http://geroprotectors.org/?page=8&q%5Bs%5D=organism_name+asc"
            , "http://gettermario.dynamicforum.net/t974p15-entretien-go-nagai-hideaki-anno"
            , "http://glench.com/closed-source/dictionaryofnumbers/"
            , "https://gptprompts.wikidot.com/linguistics:word-in-context"
            , "https://grantland.com/one-hundred-years-arm-bars-gracie-jiu-jitsu-mma/"
            , "https://hn-sicp.pbworks.com/w/page/9077106/FrontPage"
            , "https://hoaxes.org/archive/permalink/the_great_moon_hoax"
            , "http://homepage3.nifty.com/mana/miyazaki-annno.html"
            , "http://host.robots.ox.ac.uk/pascal/VOC/"
            , "https://ignorethecode.net/blog/2010/04/20/footnotes/"
            , "http://images.google.com/images?amp;q=henry+darger&gbv=2&biw=1218&bih=673"
            , "http://itre.cis.upenn.edu/~myl/languagelog/archives/005526.html"
            , "http://jidinews.com/innernews/innernews/event/1204.html"
            , "https://kanzaki.sub.jp/archives/000282.html"
            , "https://ldsc.broadinstitute.org/about/"
            , "https://learnyouahaskell.com/functors-applicative-functors-and-monoids#monoids"
            , "http://libgen.org/search.php?req=%22wheel+of+time%22"
            , "http://linuxmafia.com/faq/Essays/marriage.html"
            , "http://lists.urth.net/pipermail/urth-urth.net/2010-December/019137.html"
            , "https://www.baen.com/Chapters/1439133476/1439133476___5.htm"
            , "https://medsforbitcoin.com/"
            , "http://messybeast.com/cats-meat-man.htm"
            , "https://nectarcreek.com/"
            , "https://neomarxisme.com/biography.html"
            , "http://neuralnetworksanddeeplearning.com/"
            , "https://new.nubrain.com/shop/index.php?route=product/product&keyword=modafinil&category_id=0&product_id=58"
            , "https://news.bbc.co.uk/2/hi/uk_news/3723839.stm"
            , "http://npc.people.com.cn/n1/2020/1227/c14576-31980014.html"
            , "https://nrl.northumbria.ac.uk/id/eprint/875/1/Scholey_Consumption%20of%20cocoa%20flavanols.pdf"
            , "https://p2pfoundation.ning.com/forum/topics/bitcoin-open-source"
            , "https://people.tamu.edu/~stevesmith/SmithMemory/SmithRothkopf1984.pdf"
            , "http://permalink.gmane.org/gmane.science.linguistics.wikipedia.english/110790"
            , "https://philsci-archive.pitt.edu/5314/1/Griffiths_%26_Wilkins.doc"
            , "http://plaza.harmonix.ne.jp/~onizuka/literal/EVA26.txt"
            , "http://popsych.org/should-psychological-neuroscience-research-be-funded/"
            , "http://precedings.nature.com/documents/3697/version/1"
            , "http://prize.hutter1.net/"
            , "https://publicsearch.ndcourts.gov/default.aspx"
            , "http://radar.oreilly.com/2011/05/anonymize-data-limits.html"
            , "https://econwpa.ub.uni-muenchen.de/econ-wp/dev/papers/0507/0507004.pdf"
            , "https://5onwnspjvuk7cwvk.tor2web.org/"
            , "https://a16z.com/author/scott-kupor/"
            , "https://about.netflix.com/en/news/2017-on-netflix-a-year-in-bingeing"
            , "https://adage.com/node/1206366/printable/print"
            , "https://addons.mozilla.org/en-US/firefox/addon/lastpass-password-manager/"
            , "https://advancedfertility.com/2020/08/17/weight-bmi-and-fertility-and-ivf-success/"
            , "https://aeon.co/essays/why-fake-miniatures-depicting-islamic-science-are-everywhere"
            , "https://ai-alignment.com/"
            , "https://aidungeon.medium.com/ai-dungeon-dragon-model-upgrade-7e8ea579abfe"
            , "https://ai.meta.com/blog/harmful-content-can-evolve-quickly-our-new-ai-system-adapts-to-tackle-it/"
            , "https://ajcn.nutrition.org/content/69/5/842.full"
            , "https://ajph.aphapublications.org/cgi/content/abstract/94/9/1580"
            , "https://ajp.psychiatryonline.org/doi/abs/10.1176/appi.ajp.2020.19080834"
            , "https://aka.ms/beit" -- is actually GitHub underneath
            , "https://almanac.httparchive.org/en/2019/"
            , "https://andrewbadr.com/log/11/anonymizing-bitcoin/"
            , "https://anidb.net/tag/385/chartb"
            , "https://animesuperhero.com/forums/install/index.php?upgrade/"
            , "https://answers.google.com/answers/threadview/id/777105.html"
            , "https://antilop.cc/sr/vendors/24bb54ca7e.htm"
            , "https://apastyle.apa.org/products/publication-manual-7th-edition"
            , "https://api.repository.cam.ac.uk/server/api/core/bitstreams/7820cc59-9363-48fa-802e-a23aa2d8778d/content"
            , "https://api.research-repository.uwa.edu.au/ws/portalfiles/portal/11790041/Flematti_MS.pdf"
            , "https://inferkit.com/"
            , "https://apps.apple.com/us/app/ankimobile-flashcards/id373493387"
            , "https://apps.dtic.mil/dtic/tr/fulltext/u2/a224049.pdf"
            , "https://apps.dtic.mil/sti/pdfs/ADA099503.pdf"
            , "https://arbital.com/p/edge_instantiation/"
            , "https://archive.foolz.us/a/thread/77196171/#77207238"
            , "https://archive.ilr.cornell.edu/download/9851"
            , "https://archive.is/"
            , "https://archiveofourown.org/works/3673335"
            , "https://archive-ouverte.unige.ch/files/downloads/0/0/0/2/5/6/4/3/unige_25643_attachment01.pdf"
            , "https://archives.haskell.org/code.haskell.org/monadius/Monadius/Demo.hs"
            , "https://arstechnica.com/information-technology/2013/04/the-rise-and-fall-of-amd-how-an-underdog-stuck-it-to-intel/3/"
            , "https://ase.uva.nl/binaries/content/assets/subsites/amsterdam-school-of-economics/research/uva-econometrics/dp-2013/1303.pdf"
            , "https://www.astralcodexten.com/"
            , "https://aur.archlinux.org/packages/anki20-bin"
            , "https://aws.amazon.com/blogs/opensource/keeping-open-source-open-open-distro-for-elasticsearch/"
            , "https://azure.microsoft.com/en-us/blog/microsoft-showcases-the-azure-cloud-switch-acs/"
            , "https://babel.hathitrust.org/cgi/pt?id=mdp.39015039380632&view=1up&seq=333"
            , "https://bam-dataset.org/"
            , "https://bartokdesign.com/"
            , "https://bayes.wustl.edu/etj/articles/general.background.ps.gz"
            , "https://beautifultaiwantea.com/"
            , "https://beerconnoisseur.com/articles/schlitz-how-milwaukees-famous-beer-became-infamous"
            , "https://bellroy.com/"
            , "https://benbest.com/nutrceut/melatonin.html#negative"
            , "https://berkshirehathaway.com/letters/2016ltr.pdf"
            , "https://bgr.com/general/google-services-shut-down-study/"
            , "https://bibliophilly.library.upenn.edu/viewer.php?id=Ms.%20Codex%201248#page/244/mode/2up"
            , "https://bigquery.cloud.google.com/table/fh-bigquery:reddit_comments.2015_05"
            , "https://bioinfo.pl/pmid:17597168"
            , "https://bitbucket.org/djhshih/argparser"
            , "https://bitcoincharts.com/charts/mtgoxUSD#rg180zczsg2013-07-23zeg2013-07-23ztgSzm1g10zm2g25zv"
            , "https://bitcoins-code.de/"
            , "https://bitcointalk.org/index.php?topic=14828.0"
            , "https://bjo.bmj.com/content/93/8/997"
            , "https://bjsm.bmj.com/content/46/16/1144.2.abstract"
            , "https://blog.23andme.com/articles/chocolate-its-complicated"
            , "https://blog.darknedgy.net/technology/2020/05/02/0/"
            , "https://blog.johantibell.com/2011/08/results-from-state-of-haskell-2011.html"
            , "https://blog.ml.cmu.edu/2022/01/21/why-spectral-normalization-stabilizes-gans-analysis-and-improvements/"
            , "https://blog.mozilla.org/security/2010/03/31/plugging-the-css-history-leak/"
            , "https://blog.nuclino.com/the-simple-genius-of-checklists-from-b-17-to-the-apollo-missions"
            , "https://blogs.nature.com/news/2011/09/reliability_of_new_drug_target.html"
            , "https://blogs.nvidia.com/blog/gaugan-photorealistic-landscapes-nvidia-research/"
            , "https://blogs.princeton.edu/notabilia/2020/05/20/what-could-be-better-pairing-and-comparing-the-scheide-and-kane-copies-of-fifteenth-century-books/"
            , "https://www.scientificamerican.com/blog/observations/what-the-history-of-math-can-teach-us-about-the-future-of-ai/"
            , "https://blog.torproject.org/trip-report-october-fbi-conference/"
            , "https://blog.x.com/en_us/topics/company/2021/imperfect-by-design"
            , "https://bluelight.org/"
            , "https://bmcmedresmethodol.biomedcentral.com/articles/10.1186/1471-2288-4-13"
            , "https://bmcneurosci.biomedcentral.com/articles/10.1186/1471-2202-6-23"
            , "https://bmcpublichealth.biomedcentral.com/articles/10.1186/1471-2458-7-159#B28"
            , "https://bmcvetres.biomedcentral.com/articles/10.1186/s12917-017-0987-6"
            , "https://boardgamegeek.com/boardgame/148931/coup-reformation"
            , "https://boa.unimib.it/retrieve/handle/10281/23046/29556/Watching_alone_relational_goods.pdf"
            , "https://book.realworldhaskell.org/read/data-structures.html#id637702"
            , "https://books.google.com/books?id=Cr251kFBy5QC"
            , "https://book.webtypography.net/"
            , "https://boston.conman.org/2013/01/22.2"
            , "https://brainworkshop.sourceforge.net/tutorial.html"
            , "https://bsapubs.onlinelibrary.wiley.com/doi/full/10.2307/2656597"
            , "https://buddhism-for-vampires.com/"
            , "https://bugs.debian.org/cgi-bin/bugreport.cgi?bug=217243"
            , "https://bugs.launchpad.net/ubuntu/+source/unity-greeter/+bug/1538615"
            , "https://cabinetmagazine.org/issues/64/lucas.php"
            , "https://caes.ucdavis.edu/news/articles/2018/february/isolating-embryonic-stem-cells-in-cows-just-got-easier"
            , "https://camelcamelcamel.com/"
            , "https://capitalteas.com/Himalayan_Golden_Monkey_organic_p/23495.htm"
            , "https://capsuleconnection.com/"
            , "https://case.edu/ech/articles/r/rowfant-club"
            , "https://casetext.com/case/united-states-v-5044-bitcoins"
            , "https://casual-effects.com/markdeep/features.md.html#basicformatting/admonitions"
            , "https://cdm16630.contentdm.oclc.org/digital/collection/p16630coll2/id/534"
            , "https://cep.lse.ac.uk/pubs/download/dp1490.pdf"
            , "https://cfa.org/about-cfa/"
            , "https://chrome.google.com/webstore/detail/singlefile/mpiodijhokgodhhofbcjdecpffjipkle"
            , "https://chroniclingamerica.loc.gov/newspapers/"
            , "https://ciechanow.ski/lights-and-shadows/"
            , "https://cis.org/articles/2010/teen-study.pdf"
            , "https://citeseerx.ist.psu.edu/viewdoc/download?doi=10.1.1.108.7127&rep=rep1&type=pdf"
            , "https://clagnut.com/blog/2395"
            , "https://clarkesworldmagazine.com/watts_01_10/"
            , "https://clinicalepigeneticsjournal.biomedcentral.com/articles/10.1186/s13148-021-01218-y#Tab1"
            , "https://classic.clinicaltrials.gov/ct2/show/NCT03548935"
            , "https://cloud.google.com/tpu/pricing"
            , "https://code.google.com/archive/p/amphetype"
            , "https://code.visualstudio.com/blogs/2021/09/29/bracket-pair-colorization"
            , "https://colab.research.google.com/drive/1LiWxqJJMR5dg4BxwUgighaWp2U_enaFd#offline=true&sandboxMode=true"
            , "https://collections.library.yale.edu/catalog/2037169"
            , "https://collider.com/hideaki-anno-evangelion-interview/"
            , "https://comicsalliance.com/ask-chris-45-my-little-pony-meets-the-justice-league/"
            , "https://community.arm.com/arm-community-blogs/b/high-performance-computing-blog/posts/deep-learning-episode-4-supercomputer-vs-pong-ii"
            , "https://community.haskell.org/~gwern/hcorpus/"
            , "https://console.cloud.google.com/bigquery?project=danbooru1"
            , "https://corante.com/drug-prices/erooms-law/"
            , "https://core.ac.uk/download/pdf/160476861.pdf"
            , "https://cosmosmagazine.com/biology/don-t-believe-the-mice"
            , "https://course.fast.ai/videos/?lesson=7"
            , "https://coveryourtracks.eff.org/static/browser-uniqueness.pdf"
            , "https://creativecommons.org/licenses/by-nc/3.0/us/"
            , "https://creyos.com/"
            , "https://cro.sagepub.com/content/15/5/252.full.pdf+html"
            , "https://cryptome.org/2013/10/sadler-white-complaint.pdf"
            , "https://crypto.stackexchange.com/questions/5831/what-is-the-progress-on-the-mit-lcs35-time-capsule-crypto-puzzle"
            , "https://csimq-journals.rtu.lv/article/download/csimq.2019-21.04/1744"
            , "https://csrc.nist.gov/csrc/media/publications/conference-paper/1998/10/08/proceedings-of-the-21-nissc-1998/documents/early-cs-papers/karg74.pdf"
            , "https://ctc.usma.edu/wp-content/uploads/2016/11/Cradle-to-Grave2.pdf"
            , "https://cyber.harvard.edu/events/luncheon/2011/10/makohill"
            , "https://dailyvoice.com/connecticut/norwalk/police-fire/norwalk-police-bust-major-marijuana-operation-after-finding-pot-in-mail/582175/"
            , "https://dalspace.library.dal.ca/bitstream/handle/10222/56021/Heffernan-Amy-MSc-KINE-Nov-14.pdf?sequence=1"
            , "https://danbooru.donmai.us/wiki_pages/34230"
            , "https://darknetlive.com/post/ncidetf-adds-another-vendor-to-their-arrested-vendor-list/"
            , "https://datasetsearch.research.google.com/search?query=poem+OR+poetry&docid=T3haTlmLU9Dl6xqYAAAAAA%3D%3D"
            , "https://data.worldbank.org/indicator/NY.GNP.PCAP.PP.CD"
            , "https://deadline.com/2011/02/scott-rudin-closes-la-office-is-sony-move-imminent-105993/#comment-709877"
            , "https://deadspin.com/the-myth-of-the-myth-of-the-hot-hand-1588112937/"
            , "https://dee.su/liberte"
            , "https://dept.wofford.edu/neuroscience/neuroseminar/pdffall2006/rusted-mem3.pdf"
            , "https://derpibooru.org/tags/generator-colon-thisponydoesnotexist"
            , "https://devblogs.microsoft.com/oldnewthing/"
            , "https://developer.mozilla.org/en-US/docs/Web/CSS/@media/prefers-color-scheme"
            , "https://developer.nvidia.com/cuda-downloads"
            , "https://developer.x.com/en/docs/x-api/v1/rules-and-filtering/search-operators"
            , "https://dharmaoverground.org/web/guest/discussion/-/message_boards/message/2718243#_com_liferay_message_boards_web_portlet_MBPortlet_message_2718243"
            , "https://digitalcommons.unl.edu/cgi/viewcontent.cgi?article=1024&context=vpc15"
            , "https://discord.com/invite/7RgdJZy"
            , "https://disease-connect.org/"
            , "https://dl.dropboxusercontent.com/u/85192141/music/surreacheese-feta-magicalcolorbossa.ogg"
            , "https://dnd.wizards.com/articles/news/dungeons-dragons-teams-my-little-pony"
            , "https://docs.ankiweb.net/filtered-decks.html#filtered-decks--cramming"
            , "https://donate.torproject.org/"
            , "https://droitwichstandard.co.uk/news/droitwich-student-jailed-two-years-importing-cocaine-costa-rica/"
            , "https://drugs-forum.com/threads/116671/"
            , "https://dspace.mit.edu/handle/1721.1/10589"
            , "https://dual-n-back.com/nback.html"
            , "https://duckduckgo.com/bangs#bangs-list"
            , "https://dzone.com/articles/mechanical-sympathy"
            , "https://e621.net/posts"
            , "https://eab.sagepub.com/content/23/1/3.short"
            , "https://economics.stanford.edu/sites/default/files/economics_of_scaleup_20180316.pdf"
            , "https://ec.toranoana.jp/joshi_r/ec/item/040030048682/"
            , "https://effectuation.org/hubfs/Journal%20Articles/2017/05/Do-serial-entrepreneurs-1.pdf"
            , "https://eg-2.hatenablog.com/"
            , "https://ehp.niehs.nih.gov/1104789/"
            , "https://ehp.niehs.nih.gov/doi/full/10.1289/ehp.1510037"
            , "https://eiga.com/news/20110830/11/"
            , "https://elifesciences.org/articles/66920"
            , "https://en.chessbase.com/post/a-history-of-cheating-in-chess-4"
            , "https://endlessvn.io/"
            , "https://en.touhouwiki.net/wiki/%E5%87%8B%E5%8F%B6%E6%A3%95"
            , "https://environhealthprevmed.biomedcentral.com/articles/10.1186/s12199-020-00865-6"
            , "https://en.wik%20ipedia.org/wiki/Va%20nishing_bird_cage"
            , "https://en.wikip%20edia.org/wiki/The_%20Prestige_(film)"
            , "https://en.wikipedia.org/wiki/Special:Random"
            , "https://en.wikipedia.org/w/index.php?title=Genome-wide_complex_trait_analysis&oldid=871165308"
            , "https://eprints.whiterose.ac.uk/97780/"
            , "https://serendipityrecs.com/"
            , "https://ergodox-ez.com/"
            , "https://ero.sagepub.com/content/1/3/2332858415599972?full"
            , "https://esajournals.onlinelibrary.wiley.com/doi/pdf/10.1890/ES10-00142.1"
            , "https://escholarship.org/uc/item/5bv8c7p3"
            , "https://espace.library.uq.edu.au/view/UQ:281052"
            , "https://ethics.emory.edu/who-we-are/our-people/director.html"
            , "https://www.bl.uk/OrderDetails.do?uin=uk.bl.ethos.486142"
            , "https://ethereum.org/en/developers/docs/consensus-mechanisms/pos/faqs/"
            , "https://eurekamag.com/"
            , "https://eusprig.org/horror-stories.htm"
            , "https://everyoneishappy.com/"
            , "https://everything2.com/title/A+crow+shook+down+on+me"
            , "https://every.to/cybernaut/caught-in-the-study-web"
            , "https://evigio.com/post/generating-new-watch-designs-with-stylegan"
            , "https://examine.com/supplements/Piracetam/"
            , "https://exrx.net/Nutrition/Antioxidants/Antioxidants"
            , "https://f1000research.com/articles/3-82/v1"
            , "https://fdaaa.trialstracker.net/"
            , "https://fifteen.ai/"
            , "https://finance.yahoo.com/"
            , "https://fiscaldata.treasury.gov/datasets/historical-debt-outstanding/"
            , "https://fis.fda.gov/sense/app/d10be6bb-494e-4cd2-82e4-0135608ddc13/sheet/45beeb74-30ab-46be-8267-5756582633b4/state/analysis"
            , "https://fivethirtyeight.com/features/the-complicated-legacy-of-a-panda-who-was-really-good-at-sex/"
            , "https://flatisjustice.moe/TADNE"
            , "https://floatingleaves.com/index.php?main_page=index&cPath=29"
            , "https://fn.bmj.com/content/93/1/F45.short"
            , "https://fnb.sagepub.com/content/24/4_suppl2/S129.full.pdf"
            , "https://folkrnn.org/"
            , "https://fontsinuse.com/typefaces/40498/ed-interlock"
            , "https://food52.com/blog/15159-we-taste-tested-17-types-of-sparkling-water-here-s-what-happened"
            , "https://fortune.com/2013/05/15/dirty-medicine/"
            , "https://forums.somethingawful.com/showthread.php?threadid=3882695"
            , "https://fred.stlouisfed.org/series/JPNURYNAA"
            , "https://freedom-to-tinker.com/2011/05/24/you-might-also-privacy-risks-collaborative-filtering/"
            , "https://fs.blog/decision-journal/"
            , "https://colab.research.google.com/drive/1O5XbpMRU9i83mLAiTrMufCqmImgTRI7A/"
            , "https://gallica.bnf.fr/ark:/12148/bpt6k851127r/"
            , "https://gazette.com/military/witnesses-cadet-got-drugs-from-online-black-market-and-sold-them-in-dorms/article_0c8b524b-99f5-5c9e-ae44-cb57e4d7234e.html"
            , "https://gcta.freeforums.net/thread/213/analysis-greml-results-multiple-cohorts"
            , "https://genepi.qimr.edu.au/general/TwinPowerCalculator/"
            , "https://geneticalliance.org.uk/information/services-and-testing/how-can-i-access-preimplantation-genetic-diagnosis/#Question6"
            , "https://genius.com/The-notorious-big-ten-crack-commandments-lyrics"
            , "https://genomebiology.biomedcentral.com/articles/10.1186/s13059-018-1506-1"
            , "https://genomemedicine.biomedcentral.com/articles/10.1186/s13073-014-0091-5"
            , "https://georgianjournal.ge/society/34644-michel-houellebecq-a-french-author-shares-his-views-with-georgian-audience.html"
            , "https://getd.libs.uga.edu/pdfs/sutherland_pierre_201212_ma.pdf"
            , "https://gigascience.biomedcentral.com/articles/10.1186/2047-217X-3-10"
            , "https://gigazine.net/news/20190812-death-note-anonymity-entropy/"
            , "https://gist.github.com/SigridK/c16ddc7b0f2a5bc01ea23d69569c6c0b"
            , "https://gitgud.io/AuroraPurgatio/aurorapurgatio"
            , "https://github.com/google-research/google-research/tree/master/supcon"
            , "https://github.com/lightonai/akronomicon"
            , "https://github.com/microsoft/unadversarial"
            , "https://gitlab.com/cryptsetup/cryptsetup/-/issues/19"
            , "https://gitlab.developers.cam.ac.uk/cst/dtg/trvedata/local-first/-/commit/7a8819e817a85173af7033e64bcdcc5054b9af50?expanded=1#e74ca419c79e4a87cb170f6eb8a6c0d2719e1c73_0_726"
            , "https://gitlab.haskell.org/ghc/ghc/-/issues/2143"
            , "https://git-scm.com/book/en/v2/Customizing-Git-Git-Hooks"
            , "https://gizmodo.com/generation-cryo-fighting-death-in-the-frozen-unknown-1786446378"
            , "https://godanriver.com/news/danville/three-suspects-arrested-charged-with-mailing-meth-into-county/article_d73f9598-c839-11e4-9dbd-974577bb449e.html"
            , "https://granta.com/the-man-with-two-heads/"
            , "https://greekreporter.com/2010/12/19/inside-the-minds-of-the-parlapanides-brothers/"
            , "https://groups.google.com/g/brain-training/c/DdeZzeXEMyE"
            , "https://groups.yahoo.com/neo/groups/catsandkittens/conversations/messages/188981"
            , "https://gsejournal.biomedcentral.com/articles/10.1186/s12711-016-0280-3"
            , "https://gwern.shinyapps.io/orderStatisticsIncreasedVariance/"
            , "https://h01-dot-neuroglancer-demo.appspot.com/#!gs://h01-release/assets/library_state.json"
            , "https://habr.com/en/articles/429602/"
            , "https://hacks.mozilla.org/2021/05/improving-firefox-stability-on-linux/"
            , "https://hal.science/hal-00904097/document#pdf"
            , "https://hansard.parliament.uk/Lords/1986-06-12/debates/56392d7a-e823-45be-80b6-26711300c7aa/GruinardIslandCostOfDecontamination"
            , "https://hardcoresoftware.learningbyshipping.com/p/061-bsod-to-watson-the-reliability"
            , "https://harmreductionjournal.biomedcentral.com/articles/10.1186/s12954-019-0308-4"
            , "https://hashcat.net/wiki/doku.php?id=mask_attack"
            , "https://haveibeenpwned.com/"
            , "https://hazuma.hatenablog.com/entry/20090511/1242018681"
            , "https://hbr.org/2019/12/can-you-know-too-much-about-your-organization"
            , "https://hcommons.org/deposits/objects/hc:20220/datastreams/CONTENT/content?download=true#pdf"
            , "https://help.duckduckgo.com/duckduckgo-help-pages/results/syntax/"
            , "https://www.nasa.gov/history/rogersrep/v2appf.htm"
            , "https://hivemind-repo.s3-us-west-2.amazonaws.com/twdne3/twdne3.onnx"
            , "https://hivemind-repo.s3-us-west-2.amazonaws.com/twdne3/twdne3.pt"
            , "https://hn.algolia.com/?query=%22Long%20Bets%22&sort=byDate&prefix&page=0&dateRange=all&type=all"
            , "https://hollisarchives.lib.harvard.edu/repositories/4/archival_objects/1033884"
            , "https://home.inklingmarkets.com/recent/markets"
            , "https://hoogle.haskell.org/?hoogle=IO_a_-%3E_IO_ThreadId"
            , "https://hrcak.srce.hr/file/210"
            , "https://huggingface.co/spaces/teven-projects/calculator"
            , "https://hum.sagepub.com/content/30/5/431.full.pdf+html"
            , "https://icosahedron.website/@halcy/101654023952557254"
            , "https://ideas.4brad.com/has-uber-already-beaten-private-ownership-cost"
            , "https://ide.mit.edu/sites/default/files/publications/Multi-Sided%20Platform%20Strategy,%20Taxation%20and%20Regulation%20October%202019.pdf#page=14"
            , "https://ieeexplore.ieee.org/xpls/abs_all.jsp?arnumber=602492"
            , "https://if50.substack.com/p/1999-king-of-dragon-pass"
            , "https://sigbovik.org/2019/"
            , "https://i.imgur.com/jzZKreU.png"
            , "https://ilovetypography.com/2019/03/14/the-first-printed-math-books/"
            , "https://imagelibrary.bgu.ac.il/pf.tlx/O6ORSOx-nut"
            , "https://imgur.com/a/LE80ogv"
            , "https://inews.co.uk/opinion/why-i-donate-my-sperm-over-facebook-and-have-fathered-23-children-194142"
            , "https://infidels.org/library/modern/richard-carrier-kooks/"
            , "https://interviews.slashdot.org/story/11/09/06/1458254/Kevin-Kelly-Answers-Your-Questions"
            , "https://intrade.com/jsp/intrade/common/c_cd.jsp?conDetailID=702407&z=1285870999458"
            , "https://iopscience.iop.org/article/10.1088/1748-3190/ac253a"
            , "https://iqtest.com/"
            , "https://irs.princeton.edu/sites/g/files/toruqf276/files/event/uploads/economics_of_scaleup_20171004.pdf"
            , "https://isfdb.org/cgi-bin/pl.cgi?261005"
            , "https://iterative.capital/thesis/"
            , "https://it.slashdot.org/comments.pl?sid=2679325&cid=39089165"
            , "https://jacobsschool.ucsd.edu/news/release/791?id=791"
            , "https://jalopnik.com/you-have-no-idea-how-insanely-complex-modern-headlights-1840509448"
            , "https://jamestown.org/wp-content/uploads/2021/05/The-Prize-Why-Taiwan-and-its-Place-in-the-Global-Semiconductor-Supply-Chian-Matter-to-the-United-States.pdf#page=21"
            , "https://japanintercultural.com/free-resources/articles/over-worked-and-underpaid-japanese-employees-feel-the-burden-of-sabisu-zangyo/"
            , "https://jasbsci.biomedcentral.com/articles/10.1186/s40104-018-0304-7"
            , "https://jcsm.aasm.org/doi/10.5664/jcsm.7132"
            , "https://jigsaw.w3.org/css-validator/#validate-by-input"
            , "https://jme.bmj.com/content/37/4/249.abstract"
            , "https://jnnp.bmj.com/content/72/2/179.full"
            , "https://jn.nutrition.org/content/141/2/261"
            , "https://joshdean.com/sites/default/files/articles/feat_clones44.pdf"
            , "https://joshmitteldorf.scienceblog.com/2014/03/25/life-extension-supplements-a-reality-check/"
            , "https://jotengine.com/transcriptions/Q0I0i33TaqCa9w4In0ZQCg"
            , "https://journalnow.com/business/business_news/local/targacept-sale-to-catalyst-is-complete/article_8a0008c4-4dc2-5770-81db-758e527f177b.html"
            , "https://journals.ametsoc.org/view/journals/clim/18/23/jcli3593.1.xml"
            , "https://journals.asm.org/doi/10.1128/mbio.00036-12"
            , "https://journals.le.ac.uk/index.php/pst/issue/archive"
            , "https://journals.lww.com/greenjournal/fulltext/2003/03000/a_randomized_trial_of_docosahexaenoic_acid.11.aspx"
            , "https://journals.physiology.org/doi/full/10.1152/ajpregu.2000.278.4.r905"
            , "https://journals.plos.org/plosone/article?id=10.1371/journal.pone.0201246"
            , "https://journals.sagepub.com/doi/full/10.1177/2515245920919667"
            , "https://journaltimes.com/news/local/crime-and-courts/woman-accused-of-receiving-pot-by-mail/article_3da750f2-96f9-53e9-b771-b1d88bb27368.html"
            , "https://jpet.aspetjournals.org/content/296/3/849"
            , "https://jukebox.openai.com/"
            , "https://justpaste.it/7eovk"
            , "https://jyllands-posten.dk/indland/ECE7542044/To-m%C3%A6nd-afsl%C3%B8ret-med-over-et-ton-doping/"
            , "https://kettl.co/"
            , "https://kilthub.cmu.edu/articles/What_Went_Wrong_Reflections_on_Science_by_Observation_and_The_Bell_Curve/6493139/files/11937863.pdf#page=2"
            , "https://knowyourmeme.com/memes/tendies-stories"
            , "https://koeln.ccc.de/archiv/cyphernomicon/chapter14/14.5.html"
            , "https://kotaku.com/dont-let-a-little-thing-like-a-sex-video-slow-you-down-5856321"
            , "https://kyunghyuncho.me/brief-summary-of-the-panel-discussion-at-dl-workshop-icml-2015/"
            , "https://lareviewofbooks.org/article/the-secret-history-of-dune/"
            , "https://latanyasweeney.org/cv.html#survey"
            , "https://latitude.io/blog/introducing-ai-dungeon-translate/"
            , "https://leaderboard.allenai.org/break_high_level/submissions/public"
            , "https://upworthyscience.com/a-star-surgeon-left-a-trail-of-dead-patients-and-his-whistleblowers-were-punished/"
            , "https://learn.adafruit.com/adafruit-feather-32u4-adalogger"
            , "https://learn.microsoft.com/en-us/archive/blogs/larryosterman/one-in-a-million-is-next-tuesday"
            , "https://leme.me/verah/mp3/?C93/Lost%20Garden%20%E2%80%94%20ENIGMATIC%20LINER%20%5BMP3-V0%5D%5BC93%5D#trk6"
            , "https://letterformarchive.org/news/the-complete-commercial-artist/"
            , "https://letters.temporarystate.net/entry/3/"
            , "https://library.bz/main/upload/"
            , "https://lichess.org/@/lichess/blog/exact-exacting-who-is-the-most-accurate-world-champion/YafSBxEA"
            , "https://link.springer.com/article/10.1007/BF02253535"
            , "https://link.springer.com/article/10.1007/s10645-019-09339-9"
            , "https://listserv.brown.edu/archives/cgi-bin/wa?A2=ind0001B&L=NAUSICAA&P=R748"
            , "https://lists.wikimedia.org/hyperkitty/list/wikimedia-l@lists.wikimedia.org/message/DC4YYUFMYS6CSOOPINPBR4FPS2L53BVE/"
            , "https://listudy.org/en"
            , "https://lizadaly.com/"
            , "https://lobste.rs/s/1d7whd/tales_from_trenches_ai_disaster_stories#c_le6tsr"
            , "https://longbets.org/363/"
            , "https://longnow.org/essays/richard-feynman-and-connection-machine/"
            , "https://longreads.com/2019/10/22/the-final-five-percent/"
            , "https://lostpinesyaupontea.com/products/light-roast-yaupon-tea"
            , "https://lukemuehlhauser.com/industrial-revolution/"
            , "https://lwn.net/Articles/286233/"
            , "https://machinelearning.apple.com/research/hey-siri"
            , "https://make.girls.moe/"
            , "https://marco.org/2011/04/09/facebooks-open-compute-project"
            , "https://martinottaway.com/rhemmen/really-big-picture/"
            , "https://mathoverflow.net/questions/35468/widely-accepted-mathematical-results-that-were-later-shown-to-be-wrong/35554#35554"
            , "https://mathoverflow.net/questions/879/most-interesting-mathematics-mistake"
            , "https://math.stackexchange.com/questions/349155/how-often-does-it-happen-that-the-oldest-person-alive-dies/388131#388131"
            , "https://math.stackexchange.com/questions/89030/expectation-of-the-maximum-of-gaussian-random-variables/89147#89147"
            , "https://mattsclancy.substack.com/p/remote-work-and-the-future-of-innovation"
            , "https://meaningness.com/geeks-mops-sociopaths"
            , "https://media.ccc.de/v/35c3-9778-open_source_firmware"
            , "https://media.githubusercontent.com/media/sarabander/sicp-pdf/master/sicp.pdf"
            , "https://media.nature.com/original/nature-assets/nature/journal/v533/n7604/extref/nature17671-s2.xlsx"
            , "https://media.springernature.com/full/springer-static/image/art%3A10.1186%2Fs12917-017-0987-6/MediaObjects/12917_2017_987_Fig7_HTML.gif"
            , "https://medicine.osu.edu/neuroscience/documents/nocturnal%20light%20exposure.pdf"
            , "https://medieval.bodleian.ox.ac.uk/catalog/manuscript_336"
            , "https://medium.com/better-humans/the-effects-of-caffeine-alcohol-and-exercise-on-sleep-analyzing-the-surprising-results-117330af2480g"
            , "https://medlineplus.gov/druginfo/meds/a602016.html#side-effects"
            , "https://meehl.umn.edu/sites/meehl.umn.edu/files/files/aumeehl2003sigtests-trimmed.mp3#.mp3"
            , "https://meltingasphalt.com/hallucinated-gods/"
            , "https://metacpan.org/release/LBROCARD/Net-VNC-0.36/view/bin/vnccapture"
            , "https://metrics.torproject.org/data.html"
            , "https://millercenter.org/the-presidency/presidential-speeches/march-23-1962-address-university-california-berkeley#dp-expandable-text"
            , "https://mnemosyne-proj.org/"
            , "https://models.aminer.cn/CogView/index.html"
            , "https://money.cnn.com/magazines/fortune/fortune_archive/2006/04/03/8373034/index.htm"
            , "https://www.bbc.com/future/article/20170531-my-dj-vu-is-so-bad-i-cant-tell-whats-real"
            , "https://moz.com/blog/google-alerts-vs-mention-vs-talkwalker"
            , "https://mpra.ub.uni-muenchen.de/74268/1/MPRA_paper_74268.pdf"
            , "https://mru.org/development-economics"
            , "https://mujoco.org/"
            , "https://myanimelist.net/mangalist/gwern"
            , "https://mymodafinil.net/armodafinil/"
            , "https://naldc.nal.usda.gov/download/CAT71326739/PDF"
            , "https://nansenundpiccard.de/de/Wir/Hanske"
            , "https://nap.nationalacademies.org/read/25259/chapter/2"
            , "https://nationalinterest.org/bookreview/the-fallacy-human-freedom-8652?nopaging=1"
            , "https://nces.ed.gov/naal/sample.asp"
            , "https://near.blog/this-anime-does-not-exist/"
            , "https://www.brondell.com/nebia-fixed-shower-arm/"
            , "https://cognitivefun.net/"
            , "https://newhumanist.org.uk/2365/lies-damn-lies-and-chinese-science"
            , "https://newrepublic.com/article/120178/problem-international-development-and-plan-fix-it"
            , "https://news.gallup.com/poll/222578/americans-weigh-shun-overweight-label.aspx"
            , "https://news.harvard.edu/gazette/story/2010/10/thinking-like-an-octopus/"
            , "https://news.microsoft.com/source/features/ai/openai-azure-supercomputer/"
            , "https://news.mit.edu/2014/algorithm-recovers-speech-from-vibrations-0804"
            , "https://newsroom.collegeboard.org/"
            , "https://news.samsung.com/global/sock-horror-mystery-of-missing-socks-is-solved-scientists-reveal-why-socks-go-missing-in-the-wash-and-how-likely-it-is-to-happen"
            , "https://news.slashdot.org/story/07/10/31/0328239/call-for-halt-to-wikipedia-webcomic-deletions"
            , "https://www.yahoo.com/news/shattered-inside-the-secret-battle-to-save-americas-undercover-spies-in-the-digital-age-100029026.html"
            , "https://news.ycombinator.com/item?id=17048329"
            , "https://nmteaco.com/Plum-Oolong_p_380.html"
            , "https://n.neurology.org/content/78/2/91.full"
            , "https://nori.com/"
            , "https://noscript.net/"
            , "https://nutritionj.biomedcentral.com/articles/10.1186/s12937-017-0269-y"
            , "https://nypost.com/2019/11/02/stanford-professor-who-changed-america-with-just-one-study-was-also-a-liar/"
            , "https://ods.od.nih.gov/factsheets/Magnesium-HealthProfessional/"
            , "https://old.gigaom.com/2013/03/13/chris-wetherll-google-reader/"
            , "https://oll.libertyfund.org/titles/detmold-the-historical-political-and-diplomatic-writings-vol-2"
            , "http://www.isuppli.com/Memory-and-Storage/News/Pages/Hard-Drive-Shipments-Rebound-to-Record-Level-in-2012.aspx"
            , "https://omega0.xyz/omega8008/ETJ-PS/cc5d.ps"
            , "https://omega0.xyz/omega8008/JaynesBookPdf.html"
            , "https://onlinelibrary.wiley.com/doi/full/10.1111/acel.12880"
            , "https://faseb.onlinelibrary.wiley.com/doi/abs/10.1096/fasebj.26.1_supplement.114.4"
            , "https://openai.com/index/dall-e-2/"
            , "https://openai.com/research/learning-to-summarize-with-human-feedback"
            , "https://openai.com/index/openai-five-defeats-dota-2-world-champions/"
            , "https://openai.fund/"
            , "https://openaipublic.blob.core.windows.net/webgpt-answer-viewer/index.html"
            , "https://openreview.net/forum?id=qVyeW-grC2k#google"
            , "https://opensnp.org/"
            , "https://opensource.org/license"
            , "https://orbis.stanford.edu/"
            , "https://backend.orbit.dtu.dk/ws/portalfiles/portal/101895512/Roomvent_2014_Paper_ID_148.pdf#page=2"
            , "https://osf.io/preprints/socarxiv/mbj9p/"
            , "https://osnadocs.ub.uni-osnabrueck.de/bitstream/urn:nbn:de:gbv:700-2008112111/2/E-Diss839_thesis.pdf"
            , "https://otago.ourarchive.ac.nz/handle/10523/2341"
            , "https://ourstarblazers.com/vault/78/"
            , "https://packages.debian.org/sid/x11/xprintidle"
            , "https://pages.jh.edu/jhumag/0697web/whiz.html"
            , "https://pain.wustl.edu/c/BasicResearch/documents/Chennature2001.pdf"
            , "https://papers.nips.cc/paper/2003/file/9fb7b048c96d44a0337f049e0a61ff06-Paper.pdf"
            , "https://paperswithcode.com/task/language-modelling"
            , "https://par.nsf.gov/servlets/purl/10013134"
            , "https://partner.steamgames.com/doc/steamdeck/faq"
            , "https://pastebin.com/GrV3uYh5"
            , "https://paste.laravel.io/f2419e15-ea7d-408a-8ff2-b8ee6d00ddd1/raw"
            , "https://patch.com/california/davis/davis-pair-arrested-after-cops-intercept-3-000-suspected-ecstasy-pills-mail-serve"
            , "https://patch-tag.com/"
            , "https://patents.google.com/patent/US20150124107"
            , "https://pay.reddit.com/r/DarkNetMarkets/comments/2i07pq/the_number_of_multisig_transactions_doubled_on_evo/"
            , "https://pcdb.santafe.edu/index.php"
            , "https://pcl.sitehost.iu.edu/rgoldsto/interrelated/interrelated.html"
            , "https://pcpartpicker.com/list/nwQnZ8"
            , "https://peerj.com/preprints/27137v1/"
            , "https://perma.cc/"
            , "https://phabricator.wikimedia.org/T270650"
            , "https://pharmacyreviewer.com/?q=modafinil&option=com_medicine&view=search"
            , "https://pharmrev.aspetjournals.org/content/57/1/79.long"
            , "https://physics.aps.org/articles/v7/47"
            , "https://physoc.onlinelibrary.wiley.com/doi/pdf/10.1113/jphysiol.2011.217919"
            , "https://pioneer.app/"
            , "https://pirate.london/real-fake-money-real-insecure-markets-updated-8760f5254645"
            , "https://pixelpoppers.com/2010/12/why-i-quit-wow-and-started-working-out/"
            , "https://pjreddie.com/darknet/yolo/"
            , "https://platform.openai.com/"
            , "https://play.aidungeon.com/main/home"
            , "https://player.vimeo.com/video/427943452"
            , "https://play.google.com/store/apps/details?id=com.ankerl.singlenback"
            , "https://plus.google.com/u/0/103530621949492999968/posts/AThvaCXCSp2"
            , "https://pni.princeton.edu/john-hopfield/john-j.-hopfield-now-what"
            , "https://poemanalysis.com/ee-cummings/r-p-o-p-h-e-s-s-a-g-r/"
            , "https://poets.org/poem/design"
            , "https://polisen.se/Aktuellt/Nyheter/2015/Mars/Polisen-stoppade-droghandel-pa-natet/"
            , "https://pol.is/home"
            , "https://politicalscience.osu.edu/faculty/jmueller/MID11TSM.PDF"
            , "https://pone.dev/"
            , "https://popcon.debian.org/"
            , "https://poststar.com/news/local/crime-courts/former-computer-shop-operator-pleads-guilty-to-drug-charges/article_b42b976e-8bf9-11e3-a353-001a4bcf887a.html"
            , "https://journals.sagepub.com/doi/full/10.1177/1745691612459519"
            , "https://practicaltypography.com/rebuilding-the-typographic-society.html"
            , "https://practicaltypography.com/web-and-email-addresses.html"
            , "https://predictionbook.com/predictions/3693"
            , "https://press.etc.cmu.edu/journals/well-played-vol-4-no-1"
            , "https://priceonomics.com/why-is-art-expensive/"
            , "https://prisons.org.uk/worker-at-brixton-jail-charged-with-trying-to-buy-gun-and-ammo/"
            , "https://proceedings.neurips.cc/paper/2016/hash/7ef605fc8dba5425d6965fbd4c8fbe1f-Abstract.html"
            , "https://programmablesearchengine.google.com/about//cse?cx=009114923999563836576%3A1eorkzz2gp4&q=Firefly+%22Cowboy+Bebop%22"
            , "https://projecteuclid.org/journals/bernoulli/volume-2/issue-4/Exponential-convergence-of-Langevin-distributions-and-their-discrete-approximations/bj/1178291835.full"
            , "https://project-rainbowcrack.com/buy.php"
            , "https://psmag.com/social-justice/diy-diagnosis-extreme-athlete-uncovered-genetic-flaw-88763/"
            , "https://pss.sagepub.com/content/24/4/562.full"
            , "https://osf.io/preprints/psyarxiv/kq4mn/"
            , "https://psychology.gatech.edu/renglelab/2010/shipsteadredickengle.pdf"
            , "https://psych.wustl.edu/memory/Roddy%20article%20PDF%27s/Lyle%20et%20al%20(2008)_PBR.pdf"
            , "https://psycnet.apa.org/index.cfm?fa=search.searchResults"
            , "https://psycnet.apa.org/record/1982-13030-001"
            , "https://publicdomainreview.org/essay/emma-willard-maps-of-time/"
            , "https://public.tableau.com/app/profile/jurijfedorov#!/vizhome/AnthropologysScienceWars/Field"
            , "https://pubmed.ncbi.nlm.nih.gov/8588288/"
            , "https://pubs.acs.org/doi/abs/10.1021/es0719071"
            , "https://pubs.aeaweb.org/doi/pdfplus/10.1257/aer.91.5.1539"
            , "https://pubs.aip.org/physicstoday/Online/4628/The-war-over-supercooled-water"
            , "https://pubsonline.informs.org/doi/suppl/10.1287/mnsc.2018.3032/suppl_file/mnsc.2018.3032-sm.pdf"
            , "https://pulitzercenter.org/stories/right-not-know-when-ignorance-bliss-deadly"
            , "https://pure.au.dk/portal/en/publications/low-risk-of-suicide-and-lithium-in-drinking-water-a-danish-indivi"
            , "https://pure.tue.nl/ws/portalfiles/portal/142614149/J.R.Ubbink_09_09_2019_thesis_final.pdf"
            , "https://pure.uva.nl/ws/files/3216102/15320_Thesis.pdf#page=103"
            , "https://pure.uvt.nl/ws/portalfiles/portal/29125573/MTO_Flore_influence_of_gender_stereotype_CRiSP_2019.pdf#page=3"
            , "https://purse.io/"
            , "https://qa.debian.org/popcon.php?package=mnemosyne"
            , "https://qntm.org/invisibility"
            , "https://quadrant.org.au/magazine/uncategorized/eugenics-ready/"
            , "https://qualitysafety.bmj.com/content/21/10/819.abstract"
            , "https://quoteinvestigator.com/2012/12/30/yogi-didnt-say/"
            , "https://qz.com/1311732/openai-built-gaming-bots-that-can-work-as-a-team-with-inhuman-precision"
            , "https://rachelbythebay.com/"
            , "https://podcasts.apple.com/gb/podcast/episode-311-jerry-saltz-art-critic-at-new-york/id551088534"
            , "https://raw.githubusercontent.com/Riashat/Active-Learning-Bayesian-Convolutional-Neural-Networks/master/Presentations/Thesis/Islam%20Riashat%20MPhil%20MLSALT%20Thesis.pdf"
            , "https://rbej.biomedcentral.com/articles/10.1186/s12958-015-0029-9"
            , "https://rd.springer.com/chapter/10.1007/978-3-030-42504-3_15"
            , "https://readonlymemory.vg/shop/book/arcade-game-typography/"
            , "https://reason.com/2017/11/28/in-search-of-the-elusive-bitco/"
            , "https://repository.si.edu/bitstream/handle/10088/18355/nzp_changing_world_mcshea.pdf"
            , "https://repository.uel.ac.uk/download/489cc10ec6c30da0e7bbdfb33898364c46ac9dcc727169bd1850016053e45278/347037/2013_Dawkins_e-cig_survey.pdf"
            , "https://research.facebook.com/blog/2016/03/do-jobs-run-in-families/"
            , "https://reset.me/story/benefits-of-microdosing-with-lsd-and-psilocybin-mushrooms/"
            , "https://risk-engineering.org/concept/Rasmussen-practical-drift"
            , "https://ro.ecu.edu.au/cgi/viewcontent.cgi?article=1025&context=spsyc_pres"
            , "https://royalsocietypublishing.org/doi/10.1098/rsos.170988"
            , "https://rpubs.com/EmilOWK/232493"
            , "https://rss.onlinelibrary.wiley.com/doi/full/10.1111/j.1740-9713.2006.00202.x"
            , "https://rstb.royalsocietypublishing.org/content/365/1537/73.full"
            , "https://runrepeat.com/height-evolution-in-the-nba"
            , "https://samsaffron.com/archive/2012/06/07/testing-3-million-hyperlinks-lessons-learned#comment-31366"
            , "https://scholar.google.com/scholar?q=cat%20earwax%20OR%20%22ear%20wax%22%20smell%20OR%20taste%20%2D%22CAT%20scan%22"
            , "https://scholar.harvard.edu/files/rpande/files/moving_isolation_aer_submission.pdf"
            , "https://scienceblogs.com/cognitivedaily/2009/04/16/a-quick-eye-exercise-can-impro"
            , "https://science.nasa.gov/science-news/science-at-nasa/2005/03jun_naps/"
            , "https://scp-wiki.wikidot.com/scp-988"
            , "https://searchengineland.com/google-alerts-arent-working-148642"
            , "https://flickr.com/photos/michellemaabelle/4630940195/"
            , "https://sembr.org/"
            , "https://sensebridge.net/projects/northpaw/"
            , "https://sethroberts.net/2011/01/29/the-buttermind-experiment/"
            , "https://ssgac.org/documents/CHIC_Summary_Benyamin2014.txt.gz"
            , "https://sgo.sagepub.com/content/5/2/2158244015579724"
            , "https://shs.hal.science/halshs-02180182/document"
            , "https://siepr.stanford.edu/system/files/shared/Final_Rosston_Savage_Waldman_02_04_10__1_.pdf"
            , "https://sites.google.com/view/mend-editing"
            , "https://sites.google.com/view/multi-agent-competition"
            , "https://sites.research.google/trc/"
            , "https://sites.suffolk.edu/legaltech/2014/03/11/serious-an-lpti-supported-project-to-improve-students-learning-and-bar-performance/"
            , "https://sive.rs/srs"
            , "https://skeb.jp/"
            , "https://skeptics.stackexchange.com/questions/1700/do-bigger-or-more-monitors-increase-productivity/1701#1701"
            , "https://skift.com/oral-history-of-booking-acquisition/"
            , "https://slashdot.org/story/07/11/18/1319201/do-tiny-url-services-weaken-net-architecture"
            , "https://slate.com/articles/life/seed/2001/04/the_rise_of_the_smart_sperm_shopper.single.html"
            , "https://sociologicalscience.com/download/vol-6/april/SocSci_v6_219to234.pdf"
            , "https://soundcloud.com/leggysalad/girls-afternoon-appointments"
            , "https://spectrum.ieee.org/lasers-and-lunar-arks-cryopreservation-heats-up"
            , "https://spectrum.library.concordia.ca/id/eprint/36253/1/2010_Mining_Writeprints_from_Anonymous_E-mails.pdf"
            , "https://spreadsheets.google.com/ccc?key=rOfijmsJ-hxPbzmbi4dmHVg"
            , "https://journals.sagepub.com/doi/full/10.1177/0306312714535679"
            , "https://stability.ai/news/stable-diffusion-public-release"
            , "https://stackoverflow.com/questions/504823/has-anyone-actually-implemented-a-fibonacci-heap-efficiently"
            , "https://static-content.springer.com/esm/art%3A10.1186%2Fs12917-017-0987-6/MediaObjects/12917_2017_987_MOESM2_ESM.xlsx"
            , "https://stats.stackexchange.com/questions/9001/approximate-order-statistics-for-normal-random-variables/9010#9010"
            , "https://stats.stackexchange.com/users/2392/probabilityislogic"
            , "https://steamcommunity.com/groups/steamworks/announcements/detail/1697229969000435735"
            , "https://stevecoast.com/2015/03/27/the-world-will-only-get-weirder/"
            , "https://store.steampowered.com/app/497780/Recursed/"
            , "https://stripe.com/blog/negative-emissions-commitment"
            , "https://stroke.ahajournals.org/content/39/10/2824.full"
            , "https://studenttheses.universiteitleiden.nl/access/item%3A2608213/view"
            , "https://subs2srs.sourceforge.net/"
            , "https://substack.com/"
            , "https://subterraneanpress.com/magazine/fall_2013/the_truth_of_fact_the_truth_of_feeling_by_ted_chiang"
            , "https://summerofcode.withgoogle.com/"
            , "https://sundhedsdatastyrelsen.dk/da/404/?item=%2fda%2ftal-og-analyser%2fanalyser-og-rapporter%2fandre-analyser-og-rapporter%2fassisteret-reproduktion&user=extranet%5cAnonymous&site=sds"
            , "https://super.gluebenchmark.com/leaderboard/"
            , "https://super-memory.com/articles/theory.htm"
            , "https://superuser.com/questions/1633073/why-are-tar-xz-files-15x-smaller-when-using-pythons-tar-library-compared-to-mac"
            , "https://support.google.com/websearch/answer/2466433"
            , "https://support.mozilla.org/en-US/kb/firefox-page-info-window"
            , "https://support.torproject.org/"
            , "https://community.torproject.org/relay/"
            , "https://tails.net/"
            , "https://tasvideos.org/6347S"
            , "https://taylorandfrancis.com/"
            , "https://teahabitat.com/"
            , "https://tealet.com/"
            , "https://www.rescuetime.com/from/unbounce/for/teams"
            , "https://techcrunch.com/2013/02/23/the-chinese-are-coming-the-chinese-are-coming/"
            , "https://www.kaggle.com/models/google/gtr?tfhub-redirect=true"
            , "https://thecatsite.com/threads/my-cat-likes-earwax.69070/"
            , "https://thechineseteashop.com/"
            , "https://thecleverest.com/judgefakepeople/main.php?sort=highest"
            , "https://theconversation.com/intelligence-inheritance-three-genes-that-add-to-your-iq-score-31397"
            , "https://thecorrespondent.com/100/the-new-dot-com-bubble-is-here-its-called-online-advertising/13228924500-22d5fd24"
            , "https://theeagle.com/news/local/cc-world-s-first-cloned-cat-turns-years-old/article_d2aeac6e-2471-11ea-a5f2-7b6c21b2b4b4.html"
            , "https://thegradient.pub/understanding-evaluation-metrics-for-language-models/"
            , "https://theintercept.com/2016/08/03/gop-lawyer-chinese-owned-company-us-presidential-politics/"
            , "https://themorningnews.org/article/the-heretic"
            , "https://thenextweb.com/news/google-alerts-regains-rss-delivery-option-it-lost-after-google-readers-demise"
            , "https://thepiratebay.org/description.php?id=18368760"
            , "https://thesession.org/"
            , "https://thesocietypages.org/socimages/2008/02/06/correlations-of-iq-with-income-and-wealth/"
            , "https://www.thetakeout.com/inside-black-market-vintage-kool-aid-packet-collectors-1835123510/"
            , "https://thewest.com.au/news/wa/drug-warning-for-teens-ng-ya-353278"
            , "https://thiscardoesnotexist.glitch.me/"
            , "https://thisponydoesnotexist.net/model/network-ponies-1024-151552.pkl"
            , "https://www.thomasbarker.com/bitcoin-a-little-slice-of-future-shock/"
            , "https://thoughtbot.com/blog/arduino-bathroom-occupancy-detector"
            , "https://timarit.is/page/131542"
            , "https://timesofindia.indiatimes.com/city/bengaluru/peddlers-procuring-narcotics-from-dark-world-of-internet/articleshow/48368502.cms"
            , "https://tineye.com/"
            , "https://tl.net/blogs/286351-worker-rush-part-5-live-to-win?view=all"
            , "https://t.me/alexeyguzey"
            , "https://tobaccocontrol.bmj.com/content/14/1/49.full"
            , "https://today.yougov.com/politics/articles/37052-why-wont-americans-get-vaccinated-poll-data"
            , "https://top500.org/news/fugaku-holds-top-spot-exascale-remains-elusive/"
            , "https://towardsdatascience.com/gpt-3-creative-potential-of-nlp-d5ccae16c1ab"
            , "https://training.cochrane.org/handbook/current"
            , "https://trends.google.com/trends/explore?q=Long%20Bets"
            , "https://trialsjournal.biomedcentral.com/articles/10.1186/s13063-015-1080-8"
            , "https://tribune.com.pk/story/1967033/3-amid-animal-cruelty-debate-80-south-koreas-sniffer-dogs-cloned"
            , "https://truewetsuits.jp/travel_guide/tokyo_books_music/manga/Mangano-mori+Ikebukuro/1995"
            , "https://tuts4you.com/download.php?view.2348"
            , "https://tvtropes.org/pmwiki/pmwiki.php/VisualNovel/UminekoWhenTheyCry"
            , "https://tweelingenregister.vu.nl/gpc"
            , "https://x.com/advadnoun/status/1458894698974638111"
            , "https://x.com/search?f=tweets&q=http%3A%2F%2Fwww.thiswaifudoesnotexist.net&src=typd"
            , "https://type-r.hatenablog.com/entries/2012/12/05"
            , "https://ubc-emotionlab.ca/wp-content/uploads/2012/09/Schimmack-2012-Effect-of-Significance-on-Article-Credibility.pdf"
            , "https://uitspraken.rechtspraak.nl/inziendocument?id=ECLI:NL:RBMNE:2014:4792"
            , "https://uk.pi-supply.com/products/pijuice-solar?v=7516fd43adaa"
            , "https://undark.org/2016/05/25/the-death-of-a-study-national-childrens-study/"
            , "https://understandinguncertainty.org/what-does-13-increased-risk-death-mean"
            , "https://unesdoc.unesco.org/ark:/48223/pf0000220391"
            , "https://us-east-1.console.aws.amazon.com/ec2/v2/home?region=us-east-1#LaunchInstanceWizard:ami=ami-b36981d8"
            , "https://usesthis.com/"
            , "https://uva.theopenscholar.com/vcap/publications"
            , "https://variety.com/2017/digital/news/netflix-thumbs-vs-stars-1202010492/"
            , "https://vault.si.com/vault/2009/03/23/how-and-why-athletes-go-broke"
            , "https://vgl.ucdavis.edu/tests?field_species_target_id=216"
            , "https://vgmdb.net/product/9"
            , "https://vimeo.com/groups/45234/videos/11912761"
            , "https://vinecon.ucdavis.edu/wp-content/uploads/2019/04/cwe1201.pdf"
            , "https://vision-explorer.allenai.org/text_to_image_generation"
            , "https://vividness.live/protestant-buddhism"
            , "https://vizhub.healthdata.org/gbd-compare/#settings=0766b73db1d02f22ea6e150ced632f13345caaee"
            , "https://vk.com/alexeyguzey"
            , "https://vndb.org/c582"
            , "https://www.waifu2x.net/"
            , "https://waifulabs.com/blog/ax"
            , "https://wandb.ai/wandb_fc/gradient-dissent/reports/What-could-make-AI-conscious-with-Wojciech-Zaremba-co-founder-of-OpenAI--Vmlldzo3NDk3MDI"
            , "https://warosu.org/g/thread/69872559"
            , "https://wcfcourier.com/news/local/crime-and-courts/waterloo-man-pleads-guilty-to-selling-ecstacy/article_a57aab93-b9c5-5e3e-8438-6e229c9bd036.html"
            , "https://sd.llnl.gov/fac/site300/cff/index.html"
            , "https://web-archive-org.translate.goog/web/20070301005837/homepage3.nifty.com/kyrie/story26.html?_x_tr_sch=http&_x_tr_sl=ja&_x_tr_tl=en&_x_tr_hl=en-US"
            , "https://web-japan.org/trends00/honbun/tj010207.html"
            , "https://web.maths.unsw.edu.au/~jim/wrongthoughts.html"
            , "https://web.mit.edu/remy/"
            , "https://websitedownloader.io/"
            , "https://wellcomecollection.org/"
            , "https://wiki.evageeks.org/Episode_26%27#.22Last_B.22"
            , "https://swombat.com/2012/2/27/modafinil-and-startups"
            , "https://wordpress.org/plugins/broken-link-checker/"
            , "https://works.bepress.com/laura_stambaugh/6/download/"
            , "https://worksinprogress.co/issue/better-eats/"
            , "https://ww2.arb.ca.gov/our-work/programs/cap-and-trade-program"
            , "https://www.1001fonts.com/goudy-initialen-font.html"
            , "https://www.1m.co/details/drugs/45641/waklert-150-mg"
            , "https://www2.bfi.org.uk/films-tv-people/4ce2b707390e5"
            , "https://www.ed.gov/sites/ed/files/rschstat/eval/tech/evidence-based-practices/finalreport.pdf"
            , "https://www2.guidestar.org/profile/13-1624016"
            , "https://www.psy.uq.edu.au/~uqbziets/Mosing%20et%20al%202015%20Did%20sexual%20selection%20shape%20human%20music.pdf"
            , "https://www3.ntu.edu.sg/czzhao/iq/test.htm"
            , "https://www.4nrx-uk.md/general-health/modalert-modafinil.html"
            , "https://www.aaai.org/ocs/index.php/WS/AAAIW17/paper/viewFile/15205/14661"
            , "https://www.abbiotec.com/proteins/human-ngf-beta"
            , "https://www.abc10.com/news/article/251775/2/Cross-county-drug-ring-using-dark-Internet-site-busted-by-feds"
            , "https://www.abc.net.au/news/2015-01-07/charlie-hebdo-satirical-newspaper-shooting-paris-12-killed/6005524"
            , "https://www.abebooks.com/"
            , "https://www.academia.edu/24382120"
            , "https://www.acpjournals.org/doi/10.7326/0003-4819-152-11-201006010-00232?articleid=745807"
            , "https://www.acpjournals.org/doi/10.7326/M19-1326"
            , "https://www.actionnewsnow.com/news/durham-couple-indicted-as-part-of-silk-road-2-0-crackdown/"
            , "https://www.adafruit.com/product/328"
            , "https://www.advrider.com/f/threads/seattle-to-argentina-on-a-klr650.136505/"
            , "https://www.aeaweb.org/conference/2016/retrieve.php?pdfid=14392&tk=y2EF5G29"
            , "https://www.aei.org/publication/abolish-the-sat-2/"
            , "https://www.aera.net/Research-Policy-Advocacy/AERA-Shaping-Research-Policy"
            , "https://www.afp.gov.au/media-centre/news/afp/2015/may/four-australians-charged-in-international-illegal-firearm-sting"
            , "https://www.afr.com/technology/ernst--young-16-million-bitcoin-auction-20160527-gp53i0"
            , "https://www.agriculture.gov.au/biosecurity-trade/cats-dogs/frequently-asked-questions"
            , "https://www.ahajournals.org/doi/abs/10.1161/circ.120.suppl_18.S461-a"
            , "https://www.ahajournals.org/doi/full/10.1161/01.cir.94.5.878"
            , "https://www.aiwriter.email/"
            , "https://www.ajmadison.com/cgi-bin/ajmadison/ACQ189XS.html"
            , "https://www.ajnr.org/content/33/1/49.full"
            , "https://www.alchemistowl.org/arrigo/Papers/Arrigo-Triulzi-PACSEC08-Project-Maux-II.pdf"
            , "https://www.alphagomovie.com/#deepmind"
            , "https://www.alternatehistory.com/forum/threads/victoria.10/"
            , "https://www.alzchem.com/de/"
            , "https://www.alzforum.org/news/research-news/preimplantation-genetic-diagnosis-its-no-walk-park"
            , "https://www.ama-assn.org/"
            , "https://www.amazon.co.jp/%E7%B4%85%E4%B8%80%E7%82%B9%E8%AB%96%E2%80%95%E3%82%A2%E3%83%8B%E3%83%A1%E3%83%BB%E7%89%B9%E6%92%AE%E3%83%BB%E4%BC%9D%E8%A8%98%E3%81%AE%E3%83%92%E3%83%AD%E3%82%A4%E3%83%B3%E5%83%8F-%E3%81%A1%E3%81%8F%E3%81%BE%E6%96%87%E5%BA%AB-%E6%96%8E%E8%97%A4-%E7%BE%8E%E5%A5%88%E5%AD%90/dp/4480036660"
            , "https://www.amazon.com/Watamote-Complete-Collection-Blu-ray/dp/B00JXBLM72/"
            , "https://www.ams.org/notices/200605/fea-lang.pdf#page=12"
            , "https://www.anandtech.com/show/12535/power-outage-at-samsungs-fab-destroys-3-percent-of-global-nand-flash-output"
            , "https://www.angelfire.com/anime4/mdwigs/livesequence.html"
            , "https://www.animenewsnetwork.com/encyclopedia/company.php?id=14634"
            , "https://www.anime-planet.com/anime/years/1992"
            , "https://www.annualreviews.org/doi/10.1146/annurev-psych-010416-044022"
            , "https://www.antonhowes.com/"
            , "https://www.apa.org/monitor/2011/09/achievement"
            , "https://www.arkansasonline.com/news/2019/nov/28/airport-beagles-sniff-out-illicit-foods/"
            , "https://www.arknights.global/"
            , "https://www.army.mil/article/56965/military_working_dogs_guardians_of_the_night"
            , "https://www.artbreeder.com/"
            , "https://www.artofmanliness.com/character/manly-lessons/the-churchill-school-of-adulthood-lesson-2-establish-a-daily-routine/"
            , "https://www.arxiv-vanity.com/"
            , "https://www.atlasobscura.com/articles/what-bread-did-ancient-egyptians-eat"
            , "https://www.atsjournals.org/doi/full/10.1164/ajrccm.162.3.9908040"
            , "https://www.avalonmagicplants.com/health/drug-test/en-cool-stuff-ez-drug-test-lsd"
            , "https://www.avclub.com/ducktales-invented-a-new-animated-wonderland-that-quick-1798236288"
            , "https://www.backblaze.com/blog/hard-drive-cost-per-gigabyte/"
            , "https://baltcoffee.com/catalog/loose-tea-ribbon-bags/"
            , "https://www.barnesandnoble.com/"
            , "https://www.barnstormjournal.org/poetry/the-river-bridge/"
            , "https://www.bbc.com/news/health-35262535"
            , "https://www.bbc.com/news/uk-england-35690394"
            , "https://www.beelinereader.com/"
            , "https://www.behance.net/gallery/35437979/Velocipedia"
            , "https://www.belfastlive.co.uk/news/belfast-news/northern-ireland-men-jailed-over-9147435"
            , "https://www.ben-evans.com/benedictevans/2016/4/28/winning-and-losing"
            , "https://www.berkshireeagle.com/ci_26681481/former-bard-college-at-simons-rock-student-avoids/"
            , "https://www.berkshirehathaway.com/letters/letters.html"
            , "https://www.berlin.de/polizei/polizeimeldungen/pressemitteilung.261025.php"
            , "https://www.betterworldbooks.com/"
            , "https://www.bfi.org/about-bucky/resources/books/grunch-giants/foreword"
            , "https://www.bfmtv.com/police-justice/info-bfmtv-loire-un-cyberdealer-interpelle-premiere-en-france_AN-201312260067.html"
            , "https://www.biorxiv.org/content/10.1101/274654.full"
            , "https://www.birminghammail.co.uk/news/midlands-news/man-who-bought-glock-pistol-11538095"
            , "https://www.bizjournals.com/albany/stories/2010/01/11/focus2.html?page=all"
            , "https://www.blender.org/user-stories/japanese-anime-studio-khara-moving-to-blender/"
            , "https://www.blockchain.com/explorer/addresses/btc/1AZvaBEJMiK8AJ5GvfvLWgHjWgL59TRPGy"
            , "https://www.blockchain.com/explorer/transactions/btc/4e4364800426f6d601afeb1d1f34f1b93c6e599e7cb6e496416958a3364630bf"
            , "https://www.bloomberg.com/businessweek/ap/financialnews/D9KQL7CG0.htm"
            , "https://www.bloomberg.com/opinion/articles/2017-05-03/why-i-lost-my-bet-with-warren-buffett"
            , "https://www.bls.gov/opub/mlr/2016/article/the-life-of-american-workers-in-1915.htm"
            , "https://www.bmj.com/content/361/bmj.K2270"
            , "https://www.bnlearn.com/"
            , "https://www.brandonsanderson.com/blogs/blog/sandersons-first-law"
            , "https://www.broadinstitute.org/news/broad-institute-sequences-its-100000th-whole-human-genome-national-dna-day"
            , "https://www.bulletproof.com/why-you-are-suffering-from-a-modafinil-deficiency/"
            , "https://www.businessinsider.com/deepfake-tech-create-fictitious-faces-cats-airbnb-listings-2019-2"
            , "https://www.businessinsider.jp/post-185786"
            , "https://www.businesswire.com/news/home/20171121005280/en/Amazon-Celebrates-10th-Holiday-Season-Frustration-Free-Packaging"
            , "https://www.buzzfeed.com/joshdean/are-we-warming-up-to-cryonics"
            , "https://www.buzzfeednews.com/article/justinesharrock/whats-wrong-with-google-alerts"
            , "https://www.bvp.com/anti-portfolio"
            , "https://www.cabinetmagazine.org/issues/42/wiles.php"
            , "https://www.cambridge.org/core/journals/journal-of-economic-history/article/two-centuries-of-productivity-growth-in-computing/856EC5947A5857296D3328FA154BA3A3"
            , "https://www.cambridge.org/core/journals/the-british-journal-of-psychiatry"
            , "https://www.campbellrivermirror.com/news/257558681.html"
            , "https://www.cancer.gov/about-cancer/causes-prevention/risk/tobacco/smokeless-fact-sheet#q2"
            , "https://www.cancerresearchuk.org/about-us"
            , "https://www.carolinacoastonline.com/news_times/article_87cc5f2c-3e8d-11e4-84f2-338083e94e20.html"
            , "https://www.cato.org/sites/cato.org/files/pubs/pdf/pa-298.pdf"
            , "https://www.cebm.ox.ac.uk/resources/ebm-tools/critical-appraisal-tools"
            , "https://www.cell.com/cell-genomics/fulltext/S2666-979X(22)00063-5"
            , "https://www.cell.com/iscience/fulltext/S2589-0042(21)00473-9"
            , "https://www.census.gov/newsroom/releases/archives/income_wealth/cb11-157.html"
            , "https://www.change.org/p/google-keep-google-reader-running"
            , "https://www.channel4.com/news/drugs-dark-web-atlantis-silk-road-police-fbi"
            , "https://www.chathamstartribune.com/news/article_92645de2-c7ed-11e4-8649-679fa666eaf8.html"
            , "https://www.chemistryworld.com/features/step-by-step-synthesis-of-dna/3008753.article"
            , "https://www.chessclub.com/ucc"
            , "https://www.chess.com/article/view/how-rybka-and-i-tried-to-beat-the-strongest-chess-computer-in-the-world"
            , "https://www.chicagobooth.edu/review/what-success-rock-climbing-tells-us-about-economic-growth"
            , "https://www.chinafile.com/library/nyrb-china-archive/chinese-shadows-bureaucracy-happiness-history"
            , "https://www.chronicle.com/article/google-begins-to-scale-back-its-scanning-of-books-from-university-libraries/"
            , "https://www.churchofjesuschrist.org/study/scriptures/dc-testament/dc/121?lang=eng&id=45"
            , "https://www.cisco.com/c/en/us/obsolete/routers/cisco-7505-router.html"
            , "https://www.citizenaudit.org/"
            , "https://www.city-journal.org/article/it-hurts-therefore-i-am"
            , "https://www.clippershipteaco.com/"
            , "https://www.americanspa.com/fitness-studies/ihrsa-reports-57-million-health-club-members-27-6-billion-industry-revenue-2016"
            , "https://www.cmajopen.ca/content/2/2/E69.full"
            , "https://www.cnbc.com/2018/03/23/elon-musk-spacex-and-tesla-were-two-of-the-dumbest-business-ideas.html"
            , "https://wwwcn.cs.uni-duesseldorf.de/publications/publications/library/Jerschow2010a.pdf"
            , "https://www.cnet.com/13506_3-20040008-17.html"
            , "https://www.cochranelibrary.com/doi/10.1002/14651858.CD008661/full"
            , "https://www.codespaces.com/power-searching-with-google.html"
            , "https://www.comicconnect.com/item/916042"
            , "https://www.computerworld.com/article/1369965/is-history-repeating-itself-with-antitrust-battle.html"
            , "https://www.consumerlab.com/reviews/melatonin-supplements/melatonin/"
            , "https://copenhagenconsensus.com/publication/second-copenhagen-consensus-micronutrient-supplements-child-survival-best-practice"
            , "https://www.copyright.gov/comp3/chap300/ch300-copyrightable-authorship.pdf#Compendium%20300.indd%3A.122046%3A96431"
            , "https://www.counterpunch.org/2009/03/24/the-most-dangerous-person-in-the-world/"
            , "https://www.coursera.org/learn/probabilistic-graphical-models"
            , "https://www.courtlistener.com/docket/4353251/united-states-v-ulbricht/"
            , "https://www.courtlistener.com/docket/4367922/apotex-inc-v-cephalon-inc/"
            , "https://www.courts.mo.gov/cnet/welcome.do"
            , "https://www.courts.sa.gov.au/SentencingRemarks/Pages/lightbox.aspx?IsDlg=1&Filter=4029"
            , "https://www.cracked.com/article_19497_6-terrifying-things-nobody-tells-you-about-donating-sperm.html"
            , "https://www.cram.com/"
            , "https://www.crd.york.ac.uk/prospero/display_record.php?RecordID=85216"
            , "https://www.csail.mit.edu/news/programmers-solve-mits-20-year-old-cryptographic-puzzle"
            , "https://www.cs.purdue.edu/homes/pfonseca/papers/eurosys2017-dsbugs.pdf"
            , "https://www.csub.edu/~mdulcich/documents/diffusion_of_responsibility.pdf"
            , "https://www.cs.utexas.edu/~EWD/transcriptions/EWD05xx/EWD594.html"
            , "https://www.cs.york.ac.uk/research//ART/download.html"
            , "https://www.dailystar.co.uk/news/weird-news/billionaires-cloned-dog-saves-lives-20895267"
            , "https://www.dantelabs.com/products/whole-genome-sequencing"
            , "https://www.darkowl.com/blog-content/darknet-whackamole/"
            , "https://www.dea.gov/druginfo/ftp3.shtml"
            , "https://deepmind.google/discover/blog/agents-that-imagine-and-plan/"
            , "https://www.delawareonline.com/story/news/local/2015/01/13/doctor-sentenced-months-silk-road-drug-case/21716135/"
            , "https://www.derekau.net/this-vessel-does-not-exist"
            , "https://www.designboom.com/technology/evolution-desk-harvard-innovation-lab-09-30-2014/"
            , "https://www.detectiveconanworld.com/wiki/The_Last_Wizard_of_the_Century#Situation"
            , "https://www.devever.net/~hl/growupdown"
            , "https://www.deviantart.com/tootootaloo/art/Celestia-Vector-212081002"
            , "https://www.dharmaoverground.org/dharma-wiki/-/wiki/Main/MCTB/en"
            , "https://www.dichtbij.nl/woerden/regionaal-nieuws/artikel/3731781/woerdenaar-47-voor-5-jaar-de-cel-in-voor-drugshandel-en-opdracht-tot-moord.aspx"
            , "https://www.discovermagazine.com/planet-earth/brain-training-games-get-a-d-at-brain-training-tests"
            , "https://www.dr.dk/nyheder/indland/fbi-aktion-lukker-danske-narkohandlere-paa-nettet"
            , "https://www.dropbox.com/s/m748tqn9ypwiz0z/%E6%9D%B1%E6%96%B9%E7%88%86%E9%9F%B3%E3%82%B8%E3%83%A3%E3%82%BA4-%E4%BB%A4%E7%9E%91%E3%82%B3%E3%83%89%E9%9B%B6.ogg"
            , "https://www.drugs.com/dosage/metformin.html"
            , "https://www.drugsdata.org/faq.php"
            , "https://www.dummy-system.com/2013/04/23/intervista-a-maaya-sakamoto-su-evangelion-3-0/"
            , "https://www.duolingo.com/"
            , "https://www.ebay.com/itm/251266500210"
            , "https://www.ebay.co.uk/itm/48-LED-illuminator-light-CCTV-IR-Infrared-Night-Vision-/180410200537"
            , "https://genscot.ed.ac.uk/"
            , "https://www.edge.org/conversation/robert_plomin-why-were-different"
            , "https://www.eetimes.com/darpa-unveils-100m-eda-project/"
            , "https://www.ejlt.org/index.php/ejlt/article/view/320/424"
            , "https://www.elastic.co/blog/why-license-change-aws"
            , "https://www.emacswiki.org/emacs/MarkdownMode"
            , "https://www.euda.europa.eu/publications/posters/2018/darknet-markets-ecosystem_en"
            , "https://www.energy.gov/node/2518899"
            , "https://www.engadget.com/2010-09-18-intel-wants-to-charge-50-to-unlock-stuff-your-cpu-can-already-d.html"
            , "https://www.english.upenn.edu/people/paul-korshin"
            , "https://www.enworld.org/threads/dungeons-ponies-at-last.664106/"
            , "https://www.equilibretechnologies.com/"
            , "https://www.eric.ed.gov/ERICWebPortal/custom/portlets/recordDetails/detailmini.jsp?_nfpb=true&_&ERICExtSearch_SearchValue_0=EJ724232&ERICExtSearch_SearchType_0=no&accno=EJ724232"
            , "https://www.erowid.org/"
            , "https://pure.manchester.ac.uk/ws/portalfiles/portal/54552919/FULL_TEXT.PDF#page=137"
            , "https://www.esquire.com/news-politics/a20903/hugh-hefner-interview-0413/"
            , "https://www.eurekalert.org/news-releases/636717"
            , "https://www.eurojust.europa.eu/press/PressReleases/Pages/2014/2014-11-07.aspx"
            , "https://www.expressandstar.com/news/local-news/2016/05/30/gun-importer-told-to-reveal-why-he-ordered-weapon-online/"
            , "https://www.express.co.uk/news/uk/44940/Caribbean-island-where-red-haired-locals-speak-with-Scottish-accent"
            , "https://www.facebook.com/permalink.php?story_fbid=224735391342335&id=100014176268390"
            , "https://www.fanfiction.net/s/5588986/1/"
            , "https://www.fastcompany.com/90659827/the-bootleg-fire-is-burning-through-trees-that-are-being-used-as-carbon-offsets"
            , "https://www.fda.gov/news-events/press-announcements/fda-approves-first-oral-glp-1-treatment-type-2-diabetes"
            , "https://www.fightaging.org/archives/2011/05/more-on-body-temperature-and-calorie-restriction/"
            , "https://www.fightaging.org/archives/2018/09/thoughts-on-attending-raadfest-2018-in-san-diego/"
            , "https://www.fimfiction.net/story/62074/Friendship-is-Optimal"
            , "https://www.fincen.gov/news/news-releases/fincen-awards-recognize-partnership-between-law-enforcement-and-financial"
            , "https://www.findagrave.com/memorial/7333144/john-von_neumann"
            , "https://www.firstthings.com/article/2019/12/notes-on-summer-camp"
            , "https://www.flashback.org/sp50195930"
            , "https://www.flashgamehistory.com/"
            , "https://www.flickr.com/groups/wiredsky/pool/"
            , "https://www.foliosociety.com/usa/the-book-of-the-new-sun.html"
            , "https://www.fool.com/investing/general/2014/12/12/122-things-everyone-should-know-about-investing-an.aspx"
            , "https://www.forbes.com/sites/andygreenberg/2013/11/07/sting-operation-nabs-alleged-online-arms-dealer-via-silk-road-competitor-site/"
            , "https://www.fordfoundation.org/wp-content/uploads/2016/07/roads-and-bridges-the-unseen-labor-behind-our-digital-infrastructure.pdf"
            , "https://www.foreignaffairs.com/middle-east/business-habits-highly-effective-terrorists?page=show"
            , "https://www.fox6now.com/news/brookfield-man-faces-multiple-charges-related-to-drugs-trafficking"
            , "https://www.foxcarolina.com/story/28631102/teen-arrested-after-allegedly-buying-lsd-online/"
            , "https://www.foxnews.com/world/germany-3-charged-for-illegally-making-selling-firearms"
            , "https://www.frbsf.org/economic-research/wp-content/uploads/sites/4/wp2017-25.pdf"
            , "https://www.freehaven.net/anonbib/topic.html"
            , "https://www.frontiersin.org/journals/endocrinology/articles/10.3389/fendo.2019.00845/full"
            , "https://www.fs.fed.us/rm/pubs_journals/2000/rmrs_2000_mcdaniel_g001.pdf"
            , "https://www.fsigenetics.com/article/S1872-4973(18)30248-5/fulltext"
            , "https://www.ftc.gov/reports/new-drug-development-estimating-entry-human-clinical-trials"
            , "https://www.garda.ie/en/about-us/our-departments/office-of-corporate-communications/press-releases/2014/november/-darknet-drug-seizure-dublin-5th-nov-2014.html"
            , "https://www.genome.gov/about-genomics/fact-sheets/DNA-Sequencing-Costs-Data"
            , "https://www.genwaybio.com/recombinant-human-beta-ngf"
            , "https://www.girlschase.com/content/how-have-sex-asian-girls"
            , "https://www.girlscouts.org/en/cookies/how-to-buy-cookies/cookies-frequently-asked-questions.html#bestselling"
            , "https://www.gitcoin.co/blog/gitcoin-grants-clr-matching"
            , "https://www.globaltimes.cn/content/1161960.shtml"
            , "https://www.global.toshiba/ww/news/corporate/2010/07/pr1401.html"
            , "https://www.gnu.org/software/emacs/manual/html_node/emacs/Keyboard-Macro-Counter.html"
            , "https://www.goodreads.com/interviews/show/21.Malcolm_Gladwell"
            , "https://www.goodtherapy.org/blog/natural-lighting-increases-productivity-0104112/"
            , "https://www.google.com/reviews/w"
            , "https://www.goproblems.com/"
            , "https://www.gov.uk/government/news/phe-publishes-independent-expert-e-cigarettes-evidence-review"
            , "https://www.greenexercise.org/"
            , "https://www.gsb.stanford.edu/insights/itamar-simonson-what-makes-people-collect-things"
            , "https://www.guilford.com/books/Handbook-of-Psychopathy/Christopher-Patrick/9781462541232"
            , "https://www.hakalalabs.com/testing.html"
            , "https://www.hanselman.com/blog/everythings-broken-and-nobodys-upset"
            , "https://www.harney.com/products/organic-green-with-citrus-ginkgo"
            , "https://www.harvardmagazine.com/2012/02/twilight-of-the-lecture"
            , "https://www.haskell.org/cabal/"
            , "https://www.heraldnews.com/story/news/crime/2015/06/03/fall-river-police-intercept-package/34419316007/"
            , "https://www.highflightfoundation.org/"
            , "https://onlinelibrary.wiley.com/doi/10.1155/2018/5121540"
            , "https://www.hindustantimes.com/punjab/financial-fraud-punjab-cops-brush-with-darknet-bitcoins/story-w4YDmUJFDgkV12scPzWWxO.html"
            , "https://www.history.com/news/how-portraiture-shaped-royal-marriages"
            , "https://www.historytoday.com/archive/feature/heads-will-roll"
            , "https://www.hoover.org/publications/policy-review"
            , "https://www.hrw.org/news/2017/10/22/china-voice-biometric-collection-threatens-privacy"
            , "https://www.htrnews.com/story/news/local/2015/03/10/man-arrested-marijuana-shipments-two-rivers/24694327/"
            , "https://www.huffpost.com/entry/photographs-redheads-of-color_n_55db9929e4b0a40aa3abf017"
            , "https://www.ibtimes.co.uk/dark-web-brixton-prison-worker-charged-trying-buy-glock-19-handgun-online-1546621"
            , "https://www.ice.gov/doclib/news/releases/2013/131107baltimore1.pdf"
            , "https://www.idnes.cz/brno/zpravy/bitcoiny-jihomoravska-policie-rozhovor.A160816_2266665_brno-zpravy_krut"
            , "https://www.ietf.org/rfc/rfc5005.txt"
            , "https://www.iflscience.com/man-creates-traffic-jams-by-wheeling-around-99-cell-phones-in-a-trailer-54902"
            , "https://www.iherb.com/pr/now-foods-kelp-150-mcg-200-tablets/685"
            , "https://www.illumina.com/content/dam/illumina-marketing/documents/products/brochures/datasheet_omni_whole-genome_arrays.pdf"
            , "https://www.imagesco.com/catalog/DigitalCompass/DigitalCompass.html"
            , "https://www.imdb.com/name/nm0663050/bio/"
            , "https://www.imf.org/~/media/Files/Publications/WP/2018/wp18268.ashx#pdf"
            , "https://www.impactcybertrust.org/dataset_view?idDataset=812"
            , "https://www.inc.com/minda-zetlin/netflix-blockbuster-meeting-marc-randolph-reed-hastings-john-antioco.html"
            , "https://www.independent.co.uk/news/uk/home-news/smile-a-perfect-smile-but-don-t-laugh-we-have-officially-lost-our-dentures-1336158.html"
            , "https://www.industrydocuments.ucsf.edu/tobacco/docs/#id=ssnl0112"
            , "https://www.infoplease.com/us/government/elections/presidential-election-of-2008-electoral-and-popular-vote-summary"
            , "https://www.informit.com/articles/article.aspx?p=2213858"
            , "https://www.insidehighered.com/news/2010/05/25/science"
            , "https://www.instagram.com/nathanwpylestrangeplanet/"
            , "https://www.instructables.com/Low-power-doorwindow-sensor/"
            , "https://www.intel.com/pressroom/archive/releases/2007/20071025corp.htm"
            , "https://www.inverse.com/input/culture/secretly-vibrant-world-of-audio-porn-mp3s"
            , "https://www.ioccc.org/2000/bellard.hint"
            , "https://www.irishcentral.com/news/the-secret-irishman-likely-behind-bitcoin-the-internet-currency-code-131039168-237415801"
            , "https://www.irishexaminer.com/news/arid-30650036.html"
            , "https://www.irishtimes.com/news/let-s-be-clear-i-didn-t-invent-bitcoin-1.614532"
            , "https://www.irrodl.org/index.php/irrodl/article/view/1928/3131"
            , "https://www.ivfbabble.com/on-the-40th-anniversary-of-the-first-ivf-in-the-usa-the-first-baby-elizabeth-jordan-carr-looks-at-how-science-today-has-produced-a-new-world-first-baby-aurea/"
            , "https://www.jacc.org/doi/10.1016/j.jcin.2015.01.039"
            , "https://www.jackkinsella.ie/articles/autodidactism"
            , "https://www.jameslindlibrary.org/articles/inventing-the-randomized-double-blind-trial-the-nurnberg-salt-test-of-1835/"
            , "https://www.janelia.org/project-team/flyem/hemibrain"
            , "https://www.japantimes.co.jp/news/2017/09/12/national/social-issues/1-20-infants-born-vitro-fertilization-japan-survey/"
            , "https://www.jetbrains.com/lp/mono/"
            , "https://www.jneurosci.org/content/jneuro/22/9/3656.full.pdf"
            , "https://www.jstage.jst.go.jp/article/nikkashi1948/90/6/90_6_507/_pdf"
            , "https://www.jstatsoft.org/index.php/jss/article/download/v048i09/601"
            , "https://www.jstatsoft.org/index.php/jss/article/download/v048i10/602"
            , "https://www.jstor.org/stable/10.1086/468061"
            , "https://www.justice.gov/usao-edca/press-release/file/918811/dl"
            , "https://www.jwz.org/blog/2004/03/when-the-database-worms-eat-into-your-brain/"
            , "https://www.kadokawa.co.jp/product/201012000009/"
            , "https://www.kaggle.com/datasets/ultrajack/modern-renaissance-poetry"
            , "https://www.kctv5.com/story/28250778/kansas-city-man-accused-of-possessing-35000-prescription-pills/"
            , "https://www.kgw.com/news/Wash-county-tactical-police-conducting-3-dawn-raids-236190011.html"
            , "https://www.khara.co.jp/hideakianno/personal-biography/"
            , "https://www.kickstarter.com/projects/upperstory/spintronics-build-mechanical-circuits"
            , "https://www.kokos.cz/bradkoun/movies/8mm.txt"
            , "https://www.kptv.com/story/15084456/battle-ground-schools-let-students-sleep-in/"
            , "https://www.labone.tech/anime-generative-model-part-3"
            , "https://www.lanl.gov/bdit/html/projects/AHF.htm"
            , "https://www.laphamsquarterly.org/future/trust-issues"
            , "https://www.latimes.com/archives/blogs/the-big-picture/story/2010-05-03/why-do-korean-moviegoers-get-to-see-iron-man-2-way-ahead-of-japan"
            , "https://www.latimes.com/archives/la-xpm-2001-aug-15-fo-34311-story.html"
            , "https://www.law.cornell.edu/uscode/text/10/520"
            , "https://www.lef.org/Vitamins-Supplements/Item01602/Neuro-Mag-Magnesium-L-Threonate-with-Calcium-and-Vitamin-D3.html"
            , "https://www.lemonde.fr/pixels/visuel/2015/03/06/google-memorial-le-petit-musee-des-projets-google-abandonnes_4588392_4408996.html"
            , "https://www.leontiadis.info/NLeontiadisEPP2014.pdf"
            , "https://www.liebertpub.com/doi/10.1089/hs.2021.0083"
            , "https://www.liebertpub.com/doi/abs/10.1089/neu.2016.4846"
            , "https://www.lightspeedmagazine.com/fiction/exhalation/"
            , "https://www.limeadery.com/"
            , "https://www.linode.com/"
            , "https://www.l-iz.de/leben/faelle-unfaelle/2015/03/leipziger-ermittler-nehmen-drogenversand-shiny-flakes-hoch-78227"
            , "https://www.loc.gov/collections/edison-company-motion-pictures-and-sound-recordings/about-this-collection/#vocal"
            , "https://www.longecity.org/forum/topic/54856-modafinil-use-prosecution-convictions/"
            , "https://www.loudountimes.com/news/drug-charges-dropped-against-prominent-leesburg-businessman/article_4fd16e3f-53f7-547e-94fd-8183cc465f75.html"
            , "https://www.lrb.co.uk/the-paper/v27/n17/steven-shapin/what-did-you-expect"
            , "https://www.lshtm.ac.uk/ncdeu/currentresearch/researchprojects/bwhhs/"
            , "https://www.lyrn.ai/2018/12/26/a-style-based-generator-architecture-for-generative-adversarial-networks/"
            , "https://maa.org/sites/default/files/images/images/upload_library/22/Polya/07468342.di020715.02p0066x.pdf"
            , "https://www.macrumors.com/2011/09/08/apple-institutes-new-charitable-matching-program-for-employees/"
            , "https://www.madboa.com/geek/gpg-quickstart/"
            , "https://www.manchestereveningnews.co.uk/news/greater-manchester-news/montgomery-byrne-jailed-dark-web-10743557"
            , "https://www.mangaupdates.com/series.html?id=2701"
            , "https://www.mansfieldnewsjournal.com/story/news/local/2015/03/11/court-hole-wall-suspects-tough-luck/70152120/"
            , "https://www.marxists.org/reference/archive/hegel/works/nl/ch03.htm"
            , "https://www.mathematica.org/-/media/publications/pdfs/nonexperimentalreps.pdf"
            , "https://www.mayoclinic.org/drugs-supplements/metformin-oral-route/proper-use/drg-20067074"
            , "https://www.mayoclinicproceedings.org/article/S0025-6196%2813%2900405-9/fulltext"
            , "https://www.mcsweeneys.net/articles/back-from-yet-another-globetrotting-adventure-indiana-jones-checks-his-mail-and-discovers-that-his-bid-for-tenure-has-been-denied"
            , "https://www.mdpi.com/2073-4425/11/6/648"
            , "https://www.mdpi.com/2076-2615/13/9/1528"
            , "https://www.mdpi.com/2073-4409/10/7/1740/htm"
            , "https://www.medicaldaily.com/psychologists-discover-how-people-subconsciously-become-their-favorite-fictional-characters-240435"
            , "https://www.medicines.org.uk/emc/medicine/23244/SPC"
            , "https://www.megaverse.info/"
            , "https://www.mercatus.org/emergent-ventures"
            , "https://www.mesacc.edu/~thoqh49081/handouts/talmudpage.html"
            , "https://www.metaculus.com/questions/"
            , "https://www.mha.gov.sg/"
            , "https://www.mhlw.go.jp/english/database/db-hw/report/5.html"
            , "https://www.microsoft.com/en-us/research/blog/zero-2-deepspeed-shattering-barriers-of-deep-learning-speed-scale/"
            , "https://millionshort.com/"
            , "https://www.mining.com/fifty-killed-in-a-knife-attack-at-a-chinese-colliery/"
            , "https://www.mirror.co.uk/news/uk-news/man-jailed-trying-smuggle-550000-3592428"
            , "https://www.mja.com.au/journal/1999/171/9/iodine-deficiency-ambulatory-participants-sydney-teaching-hospital-australia"
            , "https://www.mobihealthnews.com/20772/exclusive-sleep-coach-company-zeo-is-shutting-down/"
            , "https://www.moma.org/interactives/exhibitions/2012/inventingabstraction/?work=42"
            , "https://www.morinaga.co.jp/in/jelly/"
            , "https://www.slmath.org/workshops/220"
            , "https://www.muckrock.com/news/archives/2014/feb/03/dea-parallel-construction-guides/"
            , "https://www.t26.com/fonts/22320-Hangulatin-EN"
            , "https://www.nationaldefensemagazine.org/articles/2006/3/31/2006april--soldiers-marines-team-up-in-trailblazer-patrols"
            , "https://www.nato.int/docu/review/articles/2008/04/08/is-counterterrorism-good-value-for-money/index.html"
            , "https://www.nature.com/articles/s41366-021-00894-3"
            , "https://www.nba.com/news/takeaways-2018-19-nba-roster-survey"
            , "https://www.nber.org/papers/w13711"
            , "https://www.nbr.co.nz/article/chch-man-sentenced-after-buying-amazon-illegal-drugs-website-ck-135659"
            , "https://www.ncbi.nlm.nih.gov/pmc/articles/PMC4959137/"
            , "https://www.ncbi.nlm.nih.gov/pmc/articles/PMC6167335/"
            , "https://www.ndss-symposium.org/wp-content/uploads/2019/02/ndss2019_02B-5_Wampler_paper.pdf"
            , "https://www.nearlyfreespeech.net/"
            , "https://www.nejm.org/doi/full/10.1056/NEJMoa1511939"
            , "https://neuroscience.cam.ac.uk/publications/download.php?id=11205"
            , "https://www.newadvent.org/fathers/03061.htm"
            , "https://www.newegg.com/acer-america-aspire-v15-nitro-black-edition-15-6-nvidia-geforce-gtx-960m-intel-core-i7-4720hq-8gb-memory-1tb-hdd/p/N82E16834314849"
            , "https://www.newscientist.com/article/2133095-boom-in-human-gene-editing-as-20-crispr-trials-gear-up/"
            , "https://www.newstatesman.com/politics/uk-politics/2017/06/many-terrorists-first-victims-are-their-wives-were-not-allowed-talk-about"
            , "https://www.newsweek.com/i-cloned-my-dog-puppies-have-different-personalities-1674290"
            , "https://www.newyorker.com/magazine/2017/10/16/russias-house-of-shadows"
            , "https://www.newyorkfed.org/medialibrary/media/research/staff_reports/sr166.pdf"
            , "https://3quarksdaily.com/3quarksdaily/2013/04/researchers-finally-replicated-reinhart-rogoff-and-there-are-serious-problems.html"
            , "https://www.nicvape.com/store/p/48-1-liter-of-100-mg-ml.aspx"
            , "https://www.nimh.nih.gov/about/directors/thomas-insel/blog/2011/the-economics-of-health-care-reform"
            , "https://www.nitrd.gov/pubs/bluebooks/2001/asci.html"
            , "https://www.nlsinfo.org/content/cohorts/nlsy79-children"
            , "https://www.nngroup.com/articles/computer-skill-levels/"
            , "https://www.nobelprize.org/prizes/chemistry/2020/press-release/"
            , "https://www.nola.com/news/crime_police/article_bd297d74-f2e1-5c15-9db3-c96545f38688.html"
            , "https://www.northwestgeorgianews.com/road-check-leads-to-meth-charges-for-rome-woman/article_367ea18e-1532-11eb-92a7-cf0f8ab22367.html"
            , "https://krandi.notion.site/GPT3-Dataset-Task-Model-b97a267d6f5f44e688ba4f7ec85c00cc"
            , "https://www.nrdc.org/stories/nuclear-power-101"
            , "https://www.nsa.gov/news-features/press-room/Article/1630570/national-cryptologic-museum-opens-new-exhibit-on-dr-john-nash/"
            , "https://www.ntticc.or.jp/pub/ic_mag/ic018/intercity/higashi_E.html"
            , "https://www.nybooks.com/articles/2011/03/10/how-we-know/"
            , "https://www.nytimes.com/2014/07/30/world/africa/ransoming-citizens-europe-becomes-al-qaedas-patron.html"
            , "https://www.nzherald.co.nz/nz/officers-link-to-net-drug-market/3MQUK5H6PDVBIZHTDZUG3TITMA/?c_id=1&objectid=10819029"
            , "https://www.odt.co.nz/news/dunedin/student-drug-dealer-jailed"
            , "https://www.oglaf.com/glindr/"
            , "https://www.ohri.ca/programs/clinical_epidemiology/nos_manual.pdf"
            , "https://www.olin.edu/"
            , "https://www.om.nl/actueel/nieuwsberichten/@88570/aanhoudingen/"
            , "https://www.openphilanthropy.org/research/what-should-we-learn-from-past-ai-forecasts/"
            , "https://www.optimizely.com/insights/blog/how-does-page-load-time-impact-engagement/"
            , "https://www.optimox.com/iodine-study-1"
            , "https://www.oreilly.com/library/view/cjkv-information-processing/9780596156114/"
            , "https://www.osti.gov/biblio/10172219"
            , "https://www.outsideonline.com/culture/books-media/how-athletes-get-great/"
            , "https://www.outsideonline.com/outdoor-adventure/exploration-survival/snakebite-antivenom-tim-friede/"
            , "https://www.overcomingbias.com/p/why-not-egg-futureshtml"
            , "https://www.overthinkingit.com/2012/11/08/my-little-pony-plato/"
            , "https://www.packtpub.com/en-us/product/exploring-gpt-3-9781800563193"
            , "https://www.patreon.com/gwern"
            , "https://www.pbs.org/wgbh/nova/article/crispr-grapes/"
            , "https://www.pcworld.com/article/422832/italian-police-shutter-dark-web-marketplace.html"
            , "https://www.petcarerx.com/pcrx/ProductPages/Product.aspx?pid=10983"
            , "https://www.petco.com/shop/en/petcostore/product/friskies-salmon-canned-cat-food"
            , "https://www.peterbloem.nl/blog/transformers"
            , "https://www.petforums.co.uk/threads/strange-things-that-you-cats-do.475528/page-3#post-1065130574"
            , "https://www.phillymag.com/news/2007/06/18/medicine-this-will-keep-you-awake/"
            , "https://www.pixiv.net/users/38983753"
            , "https://www.pluralsight.com/search?q=R"
            , "https://www.pnas.org/doi/full/10.1073/pnas.1320040111"
            , "https://www.poetrynook.com/poem/birdless-country"
            , "https://www.politie.nl/nieuws/2015/maart/9/01-onderzoek-naar-verzilveren-440.000-euro-aan-bitcoins.html"
            , "https://www.polizei.bayern.de/news/presse/aktuell/index.html/222614"
            , "https://www.polygon.com/2020/1/14/21064608/microsoft-kinect-history-rise-and-fall"
            , "https://www.popularmechanics.com/cars/a17477/why-the-hell-do-they-still-make-car-alarms/"
            , "https://www.postandcourier.com/article/20130709/pc16/130709464/1177/lawyer-charleston-man-denies-connection-to-dea-bitcoin-seizure-and-illicit-silk-road-drug-marketplace/"
            , "https://www.preclinicaltrials.eu/"
            , "https://www.pressandjournal.co.uk/fp/news/aberdeen-aberdeenshire/865699/top-banker-cleared-of-defrauding-pensioners-but-fined-for-selling-details-on-dark-web/"
            , "https://www.prnewswire.com/news-releases/400-million-investment-programme-positions-ireland-for-global-leadership-in-genomic-research-and-advanced-life-sciences-300755716.html"
            , "https://www.projectrho.com/public_html/rocket/spacegunexotic.php#propulsion"
            , "https://www.proofofexistence.com/"
            , "https://www.propublica.org/article/when-evidence-says-no-but-doctors-say-yes"
            , "https://www.prospecbio.com/beta_ngf_human"
            , "https://www.psychologicalscience.org/observer/in-appreciation-julian-stanley"
            , "https://www.psychologytoday.com/us/blog/pristine-inner-experience/201110/not-everyone-conducts-inner-speech"
            , "https://www.quantamagazine.org/how-the-slowest-computer-programs-illuminate-maths-fundamental-limits-20201210/"
            , "https://www.quora.com/Do-you-have-any-plans-for-optimizing-Duolingos-vocabulary-learning-using-spaced-repetition"
            , "https://www.rand.org/commentary/2011/05/29/ND.html"
            , "https://www.rbmojournal.com/article/S1472-6483(19)30381-5/fulltext"
            , "https://www.rechem.ca/index.php?_a=viewDoc&docId=8"
            , "https://www.reddit.com/comments/1x0p1b"
            , "https://www.reddit.com/r/haskell/comments/fid5w/haskell_summers_of_code_retrospective_updated_for/c1gutlo/"
            , "https://www.redliongrantchester.co.uk/"
            , "https://www.researchandmarkets.com/reportinfo.asp?report_id=305358"
            , "https://www.research.va.gov/mvp/"
            , "https://www.rightstufanime.com/Utena-Revolutionary-Girl-DVD-Set-3-Apocalypse-Saga-Hyb-Limited-Edition"
            , "https://www.r-inla.org/"
            , "https://www.roangelo.net/logwitt/logwitt5.html"
            , "https://www.rollingstone.com/culture/culture-features/smiley-face-murder-serial-killer-drowning-death-882042/"
            , "https://www.rrauction.com/auctions/lot-detail/31909050347196/"
            , "https://www.rsm.nl/fileadmin/Images_NEW/Departments/TOM/Calis_Thijmen_Thesis.pdf"
            , "https://www.rte.ie/archives/2018/0325/949314-donegal-victorian-romantics/"
            , "https://www.rug.nl/ggdc/productivity/pwt/pwt-releases/pwt-6.1"
            , "https://www.salesforce.com/products/einstein/ai-research/tl-dr-reinforced-model-abstractive-summarization/"
            , "https://www.samharris.org/blog/the-fireplace-delusion"
            , "https://www.sandia.gov/research/facilities/technology_deployment_centers/explosive_component.html"
            , "https://www.sciencedaily.com/releases/2008/05/080505075642.htm"
            , "https://www.sciencedirect.com/science/article/pii/S0191886921003536"
            , "https://www.science.org/content/article/plan-replicate-50-high-impact-cancer-papers-shrinks-just-18"
            , "https://www.science.org/content/article/potential-fabrication-research-images-threatens-key-theory-alzheimers-disease"
            , "https://www.science.org/content/article/these-lab-grown-human-eggs-could-combat-infertility-if-they-prove-healthy"
            , "https://www.scientificamerican.com/article/the-mind-of-an-octopus/"
            , "https://www.scmp.com/news/china/science/article/3002346/chinas-first-cloned-police-dog-reports-duty"
            , "https://www.scotthyoung.com/blog/"
            , "https://www.screendaily.com/awards/hideaki-anno-evangelion/5081255.article?blocktitle=INTERVIEWS&contentID=41866"
            , "https://www.sdfertility.com/fertility-treatments/genetic-testing/pgd"
            , "https://www.seacoastonline.com/story/news/local/hampton-union/2014/05/07/hampton-man-to-plead-guilty/37408765007/"
            , "https://www.sec.gov/Archives/edgar/data/1766502/000119312519124430/d665122ds1.htm"
            , "https://www.semanticscholar.org/paper/Donor-Sibling-Networks-as-a-Vehicle-for-Expanding-Hertz-Nelson/6e736c71cd499fa03af6dabad3009335a8259745?pdf#page=14"
            , "https://www.sendspace.com/file/ozr19p"
            , "https://www.shine.cn/news/metro/1909101776/"
            , "https://www.shroomery.org/forums/showflat.php/Number/18993960"
            , "https://www.si.edu/"
            , "https://www.simonsfoundation.org/2009/07/20/mathematicians-solve-45-year-old-kervaire-invariant-puzzle/"
            , "https://www.slideshare.net/codeblue_jp/igor-skochinsky-enpub"
            , "https://www.smbc-comics.com/?id=3169#comic"
            , "https://www.smh.com.au/technology/teens-visit-hidden-website-for-drugs-20130319-2gddg.html"
            , "https://www.smithsonianmag.com/history/crockfords-club-how-a-fishmonger-built-a-gambling-hall-and-bankrupted-the-british-aristocracy-148268691/"
            , "https://www.snopes.com/fact-check/school-lemonade-laxatives/"
            , "https://www.soci.org/Chemistry-and-Industry/CnI-Data/2010/24/Brussels-a-bittersweet-story"
            , "https://www.sophos.com/fr-fr/medialibrary/PDFs/technical%20papers/samosseikovb2009paper.pdf"
            , "https://www.spacedrepetition.com/"
            , "https://www.sparkfun.com/tutorials"
            , "https://www.spectator.co.uk/article/voters-agree-with-lee-anderson-about-cracking-down-on-crime/"
            , "https://www.speedtest.net/"
            , "https://www.spermbankcalifornia.com/sperm-bank-cost.html#Cryopreservation"
            , "https://www.spiceandtea.com/coconut-oolong-p-587.html?zenid=ot0nli0t5cfvbitsmhi3f2pv16"
            , "https://www.ssa.gov/oact/STATS/table4c6.html"
            , "https://www.ssi.shimadzu.com/products/particle-size-analysis/index.html"
            , "https://www.startupschool.org/"
            , "https://mhooten.github.io/papers/pdf/Hooten_Hobbs_EcolMono_2015.pdf"
            , "https://www.stats.govt.nz/information-releases/births-and-deaths-year-ended-december-2018"
            , "https://www.stevepetersen.net/wittgenstein-fog.html"
            , "https://www.stroudnewsandjournal.co.uk/news/14491113.Bussage_cannabis_dealer_Chance_Gough_avoids_jail_after_ordering_cocaine_delivery_from_Holland/"
            , "https://www.sudowrite.com/"
            , "https://www.supermemo.com/en/blog/application-of-a-computer-to-improve-the-results-obtained-in-working-with-the-supermemo-method"
            , "https://www-sydsvenskan-se.translate.goog/2016-07-15/atal-for-storskalig-narkotikahandel?_x_tr_sl=auto&_x_tr_tl=en&_x_tr_hl=en-US"
            , "https://www.tabletmag.com/sections/news/articles/orthodox-jews-attacked-brooklyn-hate-crime"
            , "https://www.takimag.com/article/the_second_least_glamorous_job_in_showbiz/"
            , "https://www.tandfonline.com/doi/full/10.1080/03949370.2021.1893826"
            , "https://www.taylorusa.com/kitchen/thermometers/5-commercial-anti-microbial-instant-read-thermometer.html"
            , "https://www.teamten.com/lawrence/writings/coding-machines/"
            , "https://www.teasetc.com/"
            , "https://www.teavana.com/us/en/tea/green-tea/gyokuro-genmaicha-green-tea-31440.html"
            , "https://www.technologyreview.com/2020/02/17/844721/ai-openai-moonshot-elon-musk-sam-altman-greg-brockman-messy-secretive-reality/"
            , "https://www.ted.com/talks/christopher_ryan_are_we_designed_to_be_sexual_omnivores"
            , "https://www.teds.ac.uk/about-teds"
            , "https://www.telegraph.co.uk/news/2016/09/16/french-intelligence-cracks-telegram-account-of-most-notorious-is/"
            , "https://www.tennessean.com/story/news/crime/2014/06/01/xanax-pills-seized-hermitage/9847299/"
            , "https://www.tensorflow.org/tensorboard/get_started"
            , "https://www.tga.gov.au/products/unapproved-therapeutic-goods/personal-importation-scheme"
            , "https://www.theadvertiser.com/story/news/crime/2016/08/30/lafayette-man-sentenced-18-months-prison-shipping-drugs-via-silk-road/89604606/"
            , "https://www.theage.com.au/politics/queensland/strawberry-growers-shut-the-farm-gate-after-tampering-crisis-20190402-p519zk.html"
            , "https://www.theatlantic.com/technology/archive/2012/05/the-perfect-milk-machine-how-big-data-transformed-the-dairy-industry/256423/"
            , "https://www.thedailybeast.com/vegan-youtube-is-imploding-as-stars-like-rawvana-bonny-rebecca-and-stella-rae-change-diets"
            , "https://www.thediff.co/archive/how-bubbles-and-megaprojects-parallelize/"
            , "https://www.theguardian.com/technology/2014/may/30/life-after-silk-road-how-the-darknet-drugs-market-is-booming"
            , "https://www.thehomesecuritysuperstore.com/collections/driveway-alarms"
            , "https://www.theladders.com/research-2/3556/"
            , "https://www.thelancet.com/journals/ebiom/article/PIIS2352-3964(19)30591-2/fulltext"
            , "https://www.thelocal.de/20160729/german-darknet-weapons-dealer-sentenced-to-5-years-jail"
            , "https://www.themarshallproject.org/2018/04/19/framed-for-murder-by-his-own-dna"
            , "https://www.thenewatlantis.com/publications/shop-class-as-soulcraft"
            , "https://theonion.com/study-wolf-attacks-still-leading-cause-of-death-in-u-s-1819574862/"
            , "https://www.theringer.com/features/2021/6/21/22542839/disc-golf-niche-sports-million-dollar-endorsement-deals"
            , "https://www.theroot.com/exactly-how-black-is-black-america-1790895185"
            , "https://www.the-scientist.com/features/can-destroying-senescent-cells-treat-age-related-disease--67136"
            , "https://www.thessgac.org/data"
            , "https://www.thestar.com/vancouver/2018/07/05/bc-lays-claim-to-14-million-us-in-bitcoin-from-drug-dealer-over-alleged-links-to-silk-road.html"
            , "https://www.the-tls.co.uk/literature/reference/alternative-to-peer-review-essay-timothy-gowers"
            , "https://www.theverge.com/2021/10/28/22750337/shadow-planet-ai-robin-sloan-jesse-solomon-clark"
            , "https://www.thisamericanlife.org/668/transcript"
            , "https://www.thisstorydoesnotexist.com/"
            , "https://www.thoughtco.com/is-distance-learning-right-for-you-1098087"
            , "https://www.thv11.com/article/news/crime/more-details-man-accused-of-receiving-pot-through-mail/91-100936404"
            , "https://www.ti.com/product/MSP430F2003"
            , "https://www.timeanddate.com/date/durationresult.html?m1=9&d1=16&y1=2012&m2=3&d2=9&y2=2013&ti=on"
            , "https://www.timesofisrael.com/police-investigating-toddler-death-from-nicotine-overdose/"
            , "https://www.tinyletter.com/"
            , "https://www.tn.gov/education/early-learning/voluntary-pre-k.html"
            , "https://www.tomshardware.com/news/google-removing-minix-management-engine-intel,35876.html"
            , "https://topic.com/the-62-year-old-child-genius"
            , "https://www.toplessrobot.com/2010/09/the_12_most_anti-american_anime.php"
            , "https://www.torproject.org/download/"
            , "https://www.torservers.net/donate.html"
            , "https://www.townandcountrymag.com/society/a12108750/personal-protection-dogs/"
            , "https://www.tryhaskell.org/"
            , "https://www.tuftandneedle.com/"
            , "https://www.tweaktown.com/news/32703/industry-analyst-still-unsure-of-the-significance-of-hynix-fire/index.html"
            , "https://www.twitch.tv/videos/416276005#openai"
            , "https://www.typografie.info/3/Schriften/fonts.html/deutsche-zierschrift-r250/"
            , "https://www.typography.com/blog/text-for-proofing-fonts"
            , "https://www.uber.com/us/en/beacon/"
            , "https://www.ukbiobank.ac.uk/frontiers-meeting-london-2014"
            , "https://www.unitedpharmacies-uk.md/Modavigil-Modafinil-100mg-30-Tablets-p-759.html"
            , "https://www.upi.com/Health_News/2011/04/27/Omega-3-may-up-aggressive-prostate-cancer/31131303903320/?u3L=1"
            , "https://www.upjohn.org/data-tools/employment-research-data-center/continuous-longitudinal-manpower-surveys"
            , "https://www.uptontea.com/shopcart/item.asp?itemID=ZH80"
            , "https://www.uscourts.gov/services-forms/federal-court-reporting-program"
            , "https://www.usenix.org/legacy/events/sec99/full_papers/whitten/whitten.ps"
            , "https://www.usenix.org/system/files/1403_02-08_mickens.pdf"
            , "https://www.usgs.gov/special-topics/water-science-school/science/total-water-use-united-states"
            , "https://www.uso.org/about"
            , "https://www.uv.es/sestio/TechRep/tr14-03.pdf"
            , "https://www.verywellhealth.com/thyroid-disease-diagnosis-4013578"
            , "https://www.vg.no/nyheter/i/Ovnm1/fire-paagrepet-for-produksjon-og-nettsalg-av-narkotika"
            , "https://www.vice.com/en/article/gv5x4q/court-docs-show-a-university-helped-fbi-bust-silk-road-2-child-porn-suspects"
            , "https://www.vice.com/en/article/this-researcher-is-tallying-arrests-from-dark-web-markets/"
            , "https://www.vitacost.com/natures-answer-valerian-root-alcohol-free-1-fl-oz"
            , "https://www.vox.com/xpress/2014/10/2/6875031/chickens-breeding-farming-boilers-giant"
            , "https://www.wahpetondailynews.com/oregon-man-accused-of-selling-fentanyl-that-led-to-nd/article_de0df64e-cf41-11e4-af1c-1b8df43f199d.html"
            , "https://www.walesonline.co.uk/news/wales-news/silk-road-20-drug-dealer-9507820"
            , "https://www.walmart.com/ip/Great-Value-Fudge-Mint-Cookies-10-oz/11997740"
            , "https://www.washingtonexaminer.com/magazine/2087681/dagger-and-swagger/"
            , "https://www.washingtonpost.com/news/worldviews/wp/2014/12/17/denmark-stakes-its-claim-in-the-war-for-the-north-pole/"
            , "https://www.watercoolertrivia.com/blog/gpt-3-vs-water-cooler-trivia-participants-a-human-vs-robot-showdown"
            , "https://programs.wcs.org/portals/42/media/file/WSB_Ocelot.pdf"
            , "https://www.wdrb.com/news/louisville-man-accused-of-obtaining-potential-date-rape-drug-online/article_c0f1b63f-c52e-50b5-8233-7403082ac0af.html"
            , "https://www.webcitation.org/6Qj7v6mqd"
            , "https://www.welt.de/regionales/muenchen/article117869257/Fahnder-zerschlagen-Bitcoin-Drogenring-DarkNet.html"
            , "https://www.whio.com/news/news/crime-law/police-4-pound-of-pot-mailed-to-oxford/nkgqT/"
            , "https://www.who.int/classifications/classification-of-diseases"
            , "https://www.wickedlocal.com/story/weymouth-news/2015/03/27/police-weymouth-man-got-mdma/34892786007/"
            , "https://www.williamsondailynews.com/news/4846/two-pill-dealers-sentenced-to-federal-prison-for-drug-crimes/"
            , "https://www.wine-searcher.com/find/jackson+triggs+vidal+ice+rsrv+niagara+peninsula+ontario+canada/1"
            , "https://www.winonadailynews.com/news/local/crime-and-courts/winona-postal-inspector-sniffs-out-dope/article_1b24cfe9-75ef-5407-9d02-a916907f7259.html"
            , "https://www.wireheading.com/"
            , "https://www.wolframalpha.com/input/?i=male+height+distribution"
            , "https://www.worldcat.org/title/42465636"
            , "https://www.wunderground.com/history/airport/KNHK/2012/7/11/CustomHistory.html?dayend=22&monthend=3&yearend=2013&req_city=NA&req_state=NA&req_statename=NA&format=1"
            , "https://www.wzzm13.com/mb/news/crime/meth-laden-express-mail-parcel-brings-charges-for-holland-man/287645651"
            , "https://www.xilinx.com/prs_rls/silicon_spart/0333spartan3.htm"
            , "https://www.xn--4dbcyzi5a.com/%d7%9e%d7%94%d7%95%d7%9c%d7%a0%d7%93-%d7%91%d7%90%d7%94%d7%91%d7%94-%d7%a0%d7%aa%d7%a4%d7%a1-%d7%a6%d7%a2%d7%99%d7%a8-%d7%a9%d7%94%d7%96%d7%9e%d7%99%d7%9f-%d7%97%d7%91%d7%99%d7%9c%d7%95%d7%aa-%d7%a7/"
            , "https://www.ycombinator.com/documents/"
            , "https://www.youtube.com/channel/UCeNwyKuv5SMnN6ovlpbz1SQ"
            , "https://www.youtube.com/watch?v=dQw4w9WgXcQ"
            , "https://www.youtube.com/watch?v=hB6eY73sLV0"
            , "https://wyclif.substack.com/p/the-natural-selection-paper-part-908"
            , "https://yippy.ai/skymind"
            , "https://yourmorals.org/"
            , "https://yp.flutterguy.org/"
            , "https://yunnansourcing.com/collections/flower-and-herbal-teas/products/yunnan-sun-dried-wild-rose-buds-from-wenshan"
            , "https://yunnansourcing.us/"
            , "https://zerocoin.org/"
            , "https://z-lib.is/fulltext"
            , "http://thecodelesscode.com/case/96"
            , "https://thesecatsdonotexist.com/"
            , "http://thismarketingblogdoesnotexist.com/"
            , "http://tom7.org/mario/"
            , "http://torch.ch/"
            , "https://uberty.org/wp-content/uploads/2015/07/Norbert_Wiener_Cybernetics.pdf"
            , "https://umichrl.pbworks.com/w/page/7597597/Successes%20of%20Reinforcement%20Learning"
            , "https://vanishingpoint.air-nifty.com/blog/2008/08/post_7c10.html"
            , "https://whatis.suburbansenshi.com/index.php?title=Gemini_Sunrise"
            , "https://williamsburgmarketplace.com/webapp/wcs/stores/servlet/ProductView?categoryId=14332&catalogId=12122"
            , "https://worrydream.com/LearnableProgramming/"
            , "https://worrydream.com/refs/Hamming_1997_-_The_Art_of_Doing_Science_and_Engineering.pdf#page=16"
            , "https://wiki.evageeks.org/FGC:Episode_01_Scene_03"
            , "https://www2003.org/cdrom/papers/refereed/p097/P97%20sources/p97-fetterly.html"
            , "http://www.aaronsw.com/weblog/000404"
            , "https://www.abetterpage.com/wt/euro/BraunT3.html"
            , "https://www.alljapaneseallthetime.com/blog/you-dont-have-a-foreign-language-problem-you-have-an-adult-literacy-problem/"
            , "https://www.bartokdesign.com/japan/0-blog_news/spherical_drain_plug_1.php"
            , "http://www-biba.inrialpes.fr/Jaynes/cc18i.pdf"
            , "http://www.bronxbanterblog.com/2013/10/01/the-power-and-the-gory/"
            , "https://www.buttercupfestival.com/poetry.htm"
            , "http://www.byrnehobart.com/blog/why-are-middlebrow-dismissals-so-tempting/"
            , "http://www.cap-lore.com/Hardware/Wheel.html"
            , "http://www.catb.org/jargon/html/R/religious-issues.html"
            , "https://www.cehd.umn.edu/CAREI/Reports/summary.html#SchoolStart"
            , "http://www.collisiondetection.net/mt/archives/2013/07/wired_love_a_ta.php"
            , "https://www.comicbox.co.jp/e-nau/toren.html"
            , "https://www.cs.cornell.edu/~caruana/compression.kdd06.pdf"
            , "http://www.dailyfinance.com/2010/02/06/girl-scout-cookies-by-the-numbers-just-where-do-all-those-dolla/"
            , "https://www.dcscience.net/2015/12/11/placebo-effects-are-weak-regression-to-the-mean-is-the-main-reason-ineffective-treatments-appear-to-work/"
            , "https://www.ditext.com/moore/common-sense.html"
            , "http://www.dobuusagi.com/"
            , "https://www.ecns.cn/news/cns-wire/2019-03-19/detail-ifzfmzhu2193677.shtml"
            , "https://www.elon.edu/docs/e-web/academics/business/economics/faculty/rouse/2011-02-14%20The%20Impact%20of%20year%20round%20schooling.pdf"
            , "https://www.eoht.info/page/Feynman%27s%20IQ"
            , "http://www.epjournal.net/blog/2011/08/glucose-is-not-willpower-fuel/"
            , "http://www.evalegend.com/interview_anno97.php"
            , "http://www.faqs.org/faqs/compression-faq/"
            , "http://www.ff7citadel.com/press/int_edge.shtml"
            , "http://www.gainax.co.jp/wp/"
            , "http://www.getlamp.com/"
            , "http://www.highbeam.com/doc/1P2-869220.html"
            , "http://www.holidaymead.com/#!product-page/cba4/f8f43032-665c-5a4c-6756-1ac355b32549"
            , "https://www.longecity.org/forum/page/index.html"
            , "http://www.infinitychess.com/Page/Public/Article/DefaultArticle.aspx?id=118"
            , "https://www.infinityplus.co.uk/stories/colderwar.htm"
            , "https://www.iqout.com/"
            , "https://www.iqtest.dk/main.swf"
            , "https://www.jackkinsella.ie/articles/janki-method"
            , "http://www.jacurutu.com/viewtopic.php?f=21&t=1112#p34878"
            , "http://www.jacurutu.com/viewtopic.php?t=2690"
            , "https://www.locusmag.com/2002/Issue09/GaimanWolfe.html"
            , "https://www.longevityhistory.com/read-the-book-online/"
            , "http://www.mangauk.com/?p=annos-dominus"
            , "https://www.mediafire.com/error.php?errno=320&origin=download"
            , "https://www.mindsparke.com/"
            , "https://www.mit.edu/people/rei/manga-inoue.html"
            , "http://www.nausicaa.net/miyazaki/interviews/aboutanime.html"
            , "https://www.nicovideo.jp/watch/sm22678844"
            , "https://www.nicovideo.jp/watch/sm23047550"
            , "https://github.com/robert7/nixnote2"
            , "https://www.northjersey.com/news/222120551_High_schools__early_starts_deprive_students_of_crucial_sleep.html/?page=all"
            , "https://nyaa.si/?page=view&tid=438733"
            , "https://www.oliverwinery.com/index.cfm?method=storeproducts.showdrilldown&productid=565D8BC6-1CC4-FBB6-23C6-013703DB5D6A"
            , "http://www.polizei.sachsen.de/de/MI_2015_34938.htm"
            , "http://www.progressive.org/images/pdf/1179.pdf"
            , "http://www.protoculture.ca/PA/edito42.htm"
            , "http://www.ratbehavior.org/DumboRatMutation.htm"
            , "http://www.rean-wings.net/chara01.html"
            , "http://www.replicatedtypo.com/chocolate-consumption-traffic-accidents-and-serial-killers/5718.html"
            , "http://www.rocketpunk-manifesto.com/2009/06/space-warfare-i-gravity-well.html"
            , "http://www.scholarpedia.org/article/N-body_choreographies"
            , "http://www.scifiscripts.com/scripts/2001.txt"
            , "http://www.sebastianmarshall.com/a-slightly-more-cautious-take-on-modafinil"
            , "http://www.seistronix.com/"
            , "http://www.sequentialtart.com/archive/mar04/cv_0304_2.shtml"
            , "http://www.sfawardswatch.com/?page_id=106"
            , "http://www.smarternootropics.com/2012/01/cephalon-europe-discontinues-olmifon-adrafinil/"
            , "https://www.smartpowders.com/p-5327-l-theanine-powder-20-grams.aspx"
            , "https://www.snpp.com/"
            , "http://www.southwales-eveningpost.co.uk/Gorseinon-man/story-28084851-detail/story.html"
            , "http://www.stuartcheshire.org/rants/latency.html"
            , "http://www.theannals.com/content/45/4/476"
            , "http://www.trixietracker.com/pricing/"
            , "http://www.usagi.org/doi/seiyuu/radio/boogie/19970118.html"
            , "http://www.wangafu.net/~nickm/"
            , "http://www.wdaz.com/news/3691219-number-defendants-charged-fentanyl-overdoses-5"
            , "http://www.weidai.com/bmoney.txt"
            , "https://www.whirlpool.com/-%5BACQ189XS%5D-1004030/ACQ189XS/"
            , "https://wikiwix.com/"
            , "https://www.willatworklearning.com/2005/11/research_review.html"
            , "https://www.xinhuanet.com/english/2019-08/23/c_138332084.htm"
            , "https://academic.oup.com/ageing/article/37/1/25/24810"
            , "https://academic.oup.com/endo/article/160/5/1057/5381910"
            , "https://academic.oup.com/ije/article/50/5/1615/6274255"
            , "https://journals.biologists.com/jeb/article/218/1/123/13627/The-developmental-origins-of-chronic-physical"
            , "https://github.blog/news-insights/product-news/new-year-new-github/"
            , "https://diabetesjournals.org/care/article/37/9/2557/29366/The-Lifetime-Cost-of-Diabetes-and-Its-Implications"
            , "https://boards.fireden.net/ic/thread/3820909/"
            , "https://archive.is/VY8e2"
            , "https://nyaa.si/view/395795"
            , "https://github.com/mnater/Hyphenopoly/blob/master/LICENSE"
            , "https://www.biology.ualberta.ca/locke.hp/dougandbill.htm"
            , "http://incompleteideas.net/sutton/book/the-book.html"
            , "http://www.incompleteideas.net/book/the-book-2nd.html"
            , "https://www.harvey.ai/"
            , "https://www.reuters.com/article/2011/11/26/us-vitamind-heartdisease-idUSTRE7AO1UM20111126"
            , "https://cvm.missouri.edu/research/feline-genetics-and-comparative-medicine-laboratory/feline-genome-project-research-resources/cat-genomic-resources-strs-snps/"
            , "https://data.bls.gov/cgi-bin/cpicalc.pl?cost1=1&year1=199201&year2=201101"
            , "https://jov.arvojournals.org/article.aspx?articleid=2140824"
            , "https://discoverbooks.com/"
            , "https://www.fathomevents.com/series/the-met-live-in-hd/"
            , "https://www.iarpa.gov/index.php/research-programs/ace"
            , "https://www.rosebud.ai/"
            , "https://karger.com/nps/article-abstract/32/3/161/230614/Effects-of-Cigarette-Smoking-on-Performance-in-a"
            , "https://www.davidsongifted.org/Search-Database/entry/A10489"
            , "https://project-imas.wiki/Miki_Hoshii"
            , "https://vitalik.eth.limo/general/2019/11/22/progress.html"
            , "https://github.com/fyu/lsun"
            , "http://garote.bdmonkeys.net/commandline/"
            , "https://diff.wikimedia.org/2012/03/27/analysis-of-the-quality-of-newcomers-in-wikipedia-over-time/"
            , "https://animate-your-word.github.io/demo/"
            , "http://iodineresearch.com/files/cann_2006_iodine_in_cardiovascular_disease.pdf"
            , "http://members.madasafish.com/~cj_whitehound/Fanfic/fanonvscanon.htm"
            , "https://3quarksdaily.com/3quarksdaily/2011/06/a-crab-canon-for-douglas-hofstadter.html"
            , "https://ai.meta.com/blog/code-llama-large-language-model-coding/"
            , "https://blog.daviskedrosky.com/p/did-profits-from-slavery-finance"
            , "https://research.google/blog/using-deep-learning-to-create-professional-level-photographs/"
            , "https://civitai.com/"
            , "https://classic.clinicaltrials.gov/ct2/show/NCT00352170"
            , "https://cwe.mitre.org/data/definitions/330.html"
            , "https://deepmind.google/"
            , "https://figshare.com/articles/media/Egyptian_Vulture_parental_cooperation/12111621"
            , "https://fonts.google.com/specimen/Cinzel+Decorative?category=Display&preview.text=ABCDEFGHIJKLMNOPQRSUVWXYZ&preview.text_type=custom"
            , "https://nap.nationalacademies.org/catalog/11927/distributed-remote-sensing-for-naval-undersea-warfare-abbreviated-version"
            , "https://news.microsoft.com/2019/07/22/openai-forms-exclusive-computing-partnership-with-microsoft-to-build-new-azure-ai-supercomputing-technologies/"
            , "https://psychology.wvu.edu/about/history/expansion-of-the-psychology-faculty-at-wvu-in-the-1950s"
            , "https://pubs.aip.org/ajp/article-supplement/2911822/zip/819_1_5.0150209.suppl_material/"
            , "https://shs.hal.science/halshs-00118626/document"
            , "https://solar.lowtechmagazine.com/"
            , "https://supp.apa.org/psycarticles/supplemental/abn0000867/ABN-2023-0045_Suppl.docx"
            , "https://tim.blog/2018/01/01/the-tim-ferriss-show-transcripts-assessing-risk-and-living-without-a-rope-lessons-from-alex-honnold/"
            , "https://www.anthropic.com/"
            , "https://www.clinicaltrialsregister.eu/"
            , "https://www.crunchbase.com/organization/predictious"
            , "https://www.daviddarling.info/encyclopedia/D/DysonF.html"
            , "https://www.genecards.org/cgi-bin/carddisp.pl?gene=MFSD2B"
            , "https://www.henrikkarlsson.xyz/p/apprenticeship-online"
            , "https://www.inverse.com/article/53442-this-person-does-not-exist-has-spawned-a-host-of-a-i-powered-copycats"
            , "https://www.journals.uchicago.edu/doi/suppl/10.1086/721270/suppl_file/10286Data.zip"
            , "https://www.linkedin.com/in/jon-levy-b98986b3"
            , "https://www.noahpinion.blog/p/bangladesh-is-the-new-asian-tiger"
            , "https://www.robots.ox.ac.uk/~vgg/data/fgvc-aircraft/"
            , "https://www.theinformation.com/articles/at-booming-toptal-no-stock-for-employees-or-investors"
            , "https://www.theintrinsicperspective.com/p/how-geniuses-used-to-be-raised"
            , "https://www.tiktok.com/@dale_ebert/video/7301073510267407658"
            , "https://www.whitehouse.gov/briefing-room/speeches-remarks/2022/09/16/remarks-by-national-security-advisor-jake-sullivan-at-the-special-competitive-studies-project-global-emerging-technologies-summit/"
            , "https://www.yahoo.com/lifestyle/kanye-west-says-misdiagnosed-bipolar-disorder-sleep-deprivation-000405518.html"
            , "https://zenodo.org/records/10035659"
            , "https://apnews.com/article/a6a67fb761304e3cae7497faa32dcdc9"
            , "https://apnews.com/article/kansas-city-chiefs-philadelphia-eagles-technology-science-82bc20f207e3e4cf81abc6a5d9e6b23a"
            , "https://research.com/u/gudmar-thorleifsson-1"
            , "https://allenai.org/"
            , "https://dnstats.net/market/Nucleus+Market"
            , "https://en.bitcoin.it/wiki/Proof_of_Stake"
            , "https://humanvarieties.org/2013/01/15/100-years-of-testing-negro-intelligence/"
            , "https://kill-the-newsletter.com/"
            , "https://marginalrevolution.com/marginalrevolution/2013/04/trade-vs-technology-in-terms-of-their-labor-market-effects.html"
            , "https://philpapers.org/archive/SOTAOA.pdf#miri"
            , "https://philpapers.org/browse/the-reflection-principle"
            , "https://readwrite.com/armed_with_social_signals_google_moves_back_toward/"
            , "https://statmodeling.stat.columbia.edu/2010/11/03/some_thoughts_o_8/"
            , "https://statmodeling.stat.columbia.edu/2014/08/28/publication-bias-social-sciences-unlocking-file-drawer2/"
            , "https://www.otakustudy.com/books/2020/08/skeb-artwork-commissioning-website-review/"
            , "https://www.politico.com/magazine/story/2018/11/11/republican-party-anti-pornography-politics-222096/"
            , "https://www.theparisreview.org/interviews/4155/the-art-of-the-essay-no-1-e-b-white"
            , "https://www.axios.com/2023/09/08/walter-isaacson-elon-musk-book-excerpt"
            , "https://blog.novelai.net/data-efficient-language-transfer-with-gpt-j-45daedaaf35a"
            , "https://medicalxpress.com/news/2011-08-vitamin-pills-undermine.html"
            , "https://phys.org/news/2019-12-mouse-pups-born-eggs-derived.html"
            , "https://www.bartleby.com/lit-hub/poetry-of-byron/greece-iv/"
            , "https://ki.se/en/people/anders-hamsten"
            , "https://pmc.ncbi.nlm.nih.gov/articles/PMC10587091/"
            , "https://www.manifold1.com/"
            , "https://www.dwarkesh.com/p/gwern-branwen"
            , "https://jamanetwork.com/journals/jama/fullarticle/183580"
            , "https://jamanetwork.com/journals/jamainternalmedicine/fullarticle/1108810"
            , "https://jamanetwork.com/journals/jamainternalmedicine/fullarticle/414784"
            , "https://jamanetwork.com/journals/jamapsychiatry/fullarticle/2569454"
            , "https://www.midjourney.com/home/"
            , "https://www.mrc-epid.cam.ac.uk/cds2024/faculty/ines-barroso/"
            , "https://wiki.c2.com/?LazinessImpatienceHubris"
            , "https://www.wsj.com/articles/SB10001424053111903480904576512250915629460"
            , "https://scholarship.law.upenn.edu/cgi/viewcontent.cgi?article=1022&context=penn_law_review"
            , "https://old.reddit.com/r/mlscaling/comments/1ik3401/mistral_offers_deepseek_r1_llama70b_at_1500/mbjb9t4/"
            , "https://www.reddit.com/r/mlscaling/comments/1ik3401/mistral_offers_deepseek_r1_llama70b_at_1500/mbjb9t4/"
            , "https://www.medium.com/@monicah428/the-early-days-of-valve-from-a-woman-inside-bf80c6b47961"
            , "https://neojaponisme.com/"
            , "https://www.larryniven.net/?q=yet-another-modest-proposal-the-roentgen-standard"
            , "https://www.cs.ox.ac.uk/people/yarin.gal/website/blog_3d801aa532c1ce.html"
            , "https://www.librarything.com/work/13068"
            , "https://www.cia.gov/readingroom/collection/doctor-zhivago"
            , "https://www.lifeview.com/ehs"
            , "https://www.statnews.com/2020/09/24/crows-possess-higher-intelligence-long-thought-primarily-human/"
            , "https://www.dhammawiki.com/index.php/Buddha%27s_Lists"
            , "https://docs.midjourney.com/hc/en-us/articles/32099348346765-Chaos-Variety"
            , "https://reactormag.com/day-of-the-kraken/"
            , "https://drive.google.com/file/d/0B4wY8oEgAUnjX3NzSUJCNVZHbmc/view" -- NOTE: deliberately dead link used, as it will never need to be search-and-replaced
            , "https://www.w3.org/International/wiki/Case_folding"
            , "https://en.wikifur.com/wiki/History"
            , "https://ew.com/tv/2017/10/12/frankie-muniz-memory-loss/"
            , "https://fibery.io/blog/gems/hypertext-tools-from-the-80s/"
            , "https://freakonomics.com/2011/05/mining-for-correlations-it-works/#comment-244672"
            , "https://antifandom.com/mlp/wiki/Explore_Equestria:_Greatest_Hits"
            ]

