├── .about.com.txt ├── .allthingsd.com.txt ├── .blog.163.com.txt ├── .blog.hu.txt ├── .blogs.nytimes.com.txt ├── .blogspot.com.txt ├── .businessinsider.com.txt ├── .cnet.com.txt ├── .craigslist.org.txt ├── .ctv.ca.txt ├── .dreamwidth.org.txt ├── .dxy.cn.txt ├── .editorconfig ├── .elpais.com.txt ├── .etc.se.txt ├── .ew.com.txt ├── .fivefilters.org.txt ├── .fok.nl.txt ├── .globo.com.txt ├── .hardware.info.txt ├── .ietf.org.txt ├── .ifeng.com.txt ├── .ihned.cz.txt ├── .lingolia.com.txt ├── .livejournal.com.txt ├── .m.wikihow.com.txt ├── .medium.com.txt ├── .metafilter.com.txt ├── .mitpress.mit.edu.txt ├── .mozilla.org.txt ├── .nasa.gov.txt ├── .nytimes.com.txt ├── .onliner.by.txt ├── .orf.at.txt ├── .philhist.unibas.ch.txt ├── .playblackdesert.com.txt ├── .quora.com.txt ├── .readthedocs.io.txt ├── .redbullmusicacademy.com.txt ├── .repubblica.it.txt ├── .reuters.com.txt ├── .rmt.yml ├── .robweychert.com.txt ├── .schwab.com.txt ├── .signal-arnaques.com.txt ├── .simonwillison.net.txt ├── .slashdot.org.txt ├── .smashingmagazine.com.txt ├── .sodexo.com.txt ├── .sputniknews.com.txt ├── .stackexchange.com.txt ├── .stanford.edu.txt ├── .statista.com.txt ├── .substack.com.txt ├── .theinventory.com.txt ├── .theonion.com.txt ├── .theplayerstribune.com.txt ├── .time.com.txt ├── .tvbs.com.tw.txt ├── .tweakblogs.net.txt ├── .usinenouvelle.com.txt ├── .vanityfair.com.txt ├── .visualcapitalist.com.txt ├── .watson.de.txt ├── .wikihow.com.txt ├── .wikimedia.org.txt ├── .wikipedia.org.txt ├── .wired.com.txt ├── .wordpress.com.txt ├── .wp.pl.txt ├── .wyborcza.biz.txt ├── .wyborcza.pl.txt ├── .yahoo.com.txt ├── 01net.com.txt ├── 16personalities.com.txt ├── 20min.ch.txt ├── 20minutes.fr.txt ├── 24.ae.txt ├── 24a11y.com.txt ├── 24auto.de.txt ├── 24garten.de.txt ├── 24hamburg.de.txt ├── 24joursdeweb.fr.txt ├── 24rhein.de.txt ├── 24vita.de.txt ├── 24ways.org.txt ├── 36kr.com.txt ├── 37signals.com.txt ├── 3quarksdaily.com.txt ├── 3voor12.vpro.nl.txt ├── 404media.co.txt ├── 43folders.com.txt 
├── 500px.com.txt ├── 512pixels.net.txt ├── 5by5.tv.txt ├── 7newsbelize.com.txt ├── 8e-etage.fr.txt ├── 9gag.com.txt ├── 9to5google.com.txt ├── 9to5mac.com.txt ├── LICENSE.txt ├── Makefile ├── RMT ├── a.tldrnewsletter.com.txt ├── a11ywithlindsey.com.txt ├── aachener-nachrichten.de.txt ├── aarp.org.txt ├── abc-luxe.com.txt ├── abc.es.txt ├── abc.net.au.txt ├── abcnews.go.com.txt ├── abendblatt.de.txt ├── abendzeitung-muenchen.de.txt ├── abplive.com.txt ├── academic.oup.com.txt ├── academiedugout.fr.txt ├── accaglobal.com.txt ├── access.redhat.com.txt ├── accesstoinsight.org.txt ├── achgut.com.txt ├── acidcow.com.txt ├── aclu.org.txt ├── acroswing.fr.txt ├── actualitte.com.txt ├── ad.nl.txt ├── addendum.org.txt ├── adfc-nrw.de.txt ├── adme.ru.txt ├── admin-magazin.de.txt ├── adslzone.net.txt ├── aei.org.txt ├── aeon.co.txt ├── aerobuzz.fr.txt ├── afr.com.txt ├── africaintelligence.fr.txt ├── aftenposten.no.txt ├── aftonbladet.se.txt ├── agirpourlatransition.ademe.fr.txt ├── aht.seriouseats.com.txt ├── aif.ru.txt ├── aitnews.com.txt ├── akweb.de.txt ├── al-monitor.com.txt ├── albayan.ae.txt ├── alberta.ca.txt ├── alex.mullr.net.txt ├── alexduner.com.txt ├── alexmurrell.co.uk.txt ├── alicewalkersgarden.com.txt ├── alimentation-generale.fr.txt ├── alistapart.com.txt ├── aljazeera.com.txt ├── allafrica.com.txt ├── allgemeine-zeitung.de.txt ├── allphly.com.txt ├── allrecipes.com.txt ├── allthingsd.com.txt ├── allyou.com.txt ├── alphabeta.argaam.com.txt ├── alriyadh.com.txt ├── alsacreations.com.txt ├── alseraj.net.txt ├── altaonline.com.txt ├── alternatives-economiques.fr.txt ├── alternator.science.txt ├── alternet.org.txt ├── altfoto.com.txt ├── alumni.stanford.edu.txt ├── amandala.com.bz.txt ├── amazon.com.txt ├── americandrink.net.txt ├── americanprogress.org.txt ├── americanthinker.com.txt ├── americastestkitchenfeed.com.txt ├── amp.themercury.com.au.txt ├── amptoons.com.txt ├── anandtech.com.txt ├── androidandme.com.txt ├── androidcentral.com.txt ├── 
androidpolice.com.txt ├── andy-bell.design.txt ├── angrymetalguy.com.txt ├── annatravelling.wordpress.com.txt ├── annouchka.fr.txt ├── ansible.com.txt ├── answersresearchjournal.org.txt ├── antigone21.com.txt ├── antirez.com.txt ├── aoc.media.txt ├── apache.be.txt ├── apnews.com.txt ├── apotheke-adhoc.de.txt ├── apple.com.txt ├── apple.news.txt ├── appleinsider.com.txt ├── appleweblog.com.txt ├── aps.dz.txt ├── araraneon.com.br.txt ├── archdaily.com.txt ├── archiloque.net.txt ├── architecturaldigest.com.txt ├── archive.pressthink.org.txt ├── archiveofourown.org.txt ├── archlinux.de.txt ├── arduino-tutorial.de.txt ├── arretsurimages.net.txt ├── arstechnica.com.txt ├── artforum.com.txt ├── articles.courant.com.txt ├── articles.washingtonpost.com.txt ├── artofmanliness.com.txt ├── artresilia.com.txt ├── artsixmic.fr.txt ├── arxiv-vanity.com.txt ├── arxiv.org.txt ├── ascarter.net.txt ├── askingbox.de.txt ├── astronews.com.txt ├── astronomy.com.txt ├── asymco.com.txt ├── atlantico.fr.txt ├── atlasobscura.com.txt ├── au.lifehacker.com.txt ├── au.news.yahoo.com.txt ├── auto-motor-und-sport.de.txt ├── autoactu.com.txt ├── autoblog.com.txt ├── autocar.co.uk.txt ├── autocrypt.org.txt ├── automobil-produktion.de.txt ├── autoplus.fr.txt ├── avantivictoirerao.com.txt ├── avclub.com.txt ├── aws.amazon.com.txt ├── axesslab.com.txt ├── axiocap.com.txt ├── axios.com.txt ├── az-online.de.txt ├── backlinko.com.txt ├── bahnblogstelle.com.txt ├── baltimoresun.com.txt ├── barrons.com.txt ├── baseballprospectus.com.txt ├── basicthinking.de.txt ├── basketeurope.com.txt ├── bastamag.net.txt ├── bastibe.de.txt ├── batenka.ru.txt ├── baylon-industries.com.txt ├── bbc.co.uk.txt ├── bbc.com.txt ├── bbcgoodfood.com.txt ├── bbva.es.txt ├── bdaily.co.uk.txt ├── bearmetal.eu.txt ├── becomingminimalist.com.txt ├── begeek.fr.txt ├── ben-evans.com.txt ├── benoitmaison.org.txt ├── berlingske.dk.txt ├── bernama.com.txt ├── bernardinai.lt.txt ├── besabine.com.txt ├── betabeat.com.txt ├── 
betanews.com.txt ├── bez.es.txt ├── bgland24.de.txt ├── bild.de.txt ├── biography.com.txt ├── birthdayshoes.com.txt ├── bit-tech.net.txt ├── bitelia.com.txt ├── bizjournals.com.txt ├── bjango.com.txt ├── blast-info.fr.txt ├── bleacherreport.com.txt ├── blog.angular.io.txt ├── blog.asmartbear.com.txt ├── blog.chriszacharias.com.txt ├── blog.cloudflare.com.txt ├── blog.dropbox.com.txt ├── blog.eleven-labs.com.txt ├── blog.eng.xogrp.com.txt ├── blog.engineering.publicissapient.fr.txt ├── blog.fefe.de.txt ├── blog.imirhil.fr.txt ├── blog.instagram.com.txt ├── blog.instapaper.com.txt ├── blog.kaelig.fr.txt ├── blog.landr.com.txt ├── blog.lepine.pro.txt ├── blog.lumen.com.txt ├── blog.mochi.is.txt ├── blog.mondediplo.net.txt ├── blog.mozilla.org.txt ├── blog.native-instruments.com.txt ├── blog.naver.com.txt ├── blog.netinfluence.ch.txt ├── blog.nightly.mozilla.org.txt ├── blog.octo.com.txt ├── blog.pchome.net.txt ├── blog.pinboard.in.txt ├── blog.professeurjoachim.com.txt ├── blog.rchapman.org.txt ├── blog.renren.com.txt ├── blog.robertelder.org.txt ├── blog.rust-lang.org.txt ├── blog.sentry.io.txt ├── blog.serverlessadvocate.com.txt ├── blog.shaunfinglas.co.uk.txt ├── blog.sina.com.cn.txt ├── blog.spu.edu.txt ├── blog.squad.fr.txt ├── blog.terkel.io.txt ├── blog.trello.com.txt ├── blog.twitter.com.txt ├── blog.wells.ee.txt ├── blog.xebia.fr.txt ├── blog.youb.fr.txt ├── blogs.faz.net.txt ├── blogs.forbes.com.txt ├── blogs.gnome.org.txt ├── blogs.hbr.org.txt ├── blogs.lse.ac.uk.txt ├── blogs.oracle.com.txt ├── blogs.reuters.com.txt ├── blogs.sciencemag.org.txt ├── blogs.smithsonianmag.com.txt ├── blogs.technet.com.txt ├── bloomberg.com.txt ├── boagworld.com.txt ├── boards.greenhouse.io.txt ├── bobbyromeo.com.txt ├── bohaishibei.com.txt ├── boingboing.net.txt ├── bonpote.com.txt ├── book.douban.com.txt ├── bookforum.com.txt ├── borderhouseblog.com.txt ├── bosch-presse.de.txt ├── bostonglobe.com.txt ├── bostonreview.net.txt ├── boundlessline.org.txt ├── 
boxingnewsonline.net.txt ├── bpb.de.txt ├── br.de.txt ├── brainfacts.org.txt ├── brainpickings.org.txt ├── brandeins.de.txt ├── brandingstrategyinsider.com.txt ├── brasil.elpais.com.txt ├── braunschweiger-zeitung.de.txt ├── breitengrad-nord.de.txt ├── brentozar.com.txt ├── brettterpstra.com.txt ├── briefly.co.za.txt ├── brightside.me.txt ├── brit.co.txt ├── brookings.edu.txt ├── brooksreview.net.txt ├── brucelawson.co.uk.txt ├── bt.no.txt ├── buerstaedter-zeitung.de.txt ├── buffed.de.txt ├── buildvirtual.net.txt ├── buquad.com.txt ├── business-standard.com.txt ├── business.time.com.txt ├── business2community.com.txt ├── businessinsider.com.au.txt ├── businessinsider.com.txt ├── businessnews.com.tn.txt ├── businessweek.com.txt ├── buzzfeed.com.txt ├── buzzfeed.de.txt ├── bw24.de.txt ├── bzg.fr.txt ├── c.newsnow.co.uk.txt ├── c.newsnow.com.txt ├── cabinetmagazine.org.txt ├── cable.co.uk.txt ├── cafebabel.com.txt ├── caffereggio.net.txt ├── cairn.info.txt ├── callistaenterprise.se.txt ├── canardpc.com.txt ├── canonrumors.com.txt ├── captaineconomics.fr.txt ├── car-it.com.txt ├── caravanmagazine.in.txt ├── cardboardconnection.com.txt ├── carlchenet.com.txt ├── carnegie.ru.txt ├── carnegieeurope.eu.txt ├── cars.com.txt ├── caseinterview.com.txt ├── cashless.pl.txt ├── catapult.co.txt ├── catb.org.txt ├── cbsnews.com.txt ├── cell.com.txt ├── cert-bund.de.txt ├── certaintynews.com.txt ├── cfclrk.com.txt ├── cgtrader.com.txt ├── champeau.info.txt ├── chaperonsetvous.fr.txt ├── chareidi.org.txt ├── charlotteobserver.com.txt ├── chat.openai.com.txt ├── chefkoch.de.txt ├── chicagotribune.com.txt ├── chiemgau24.de.txt ├── china-gadgets.de.txt ├── chip.de.txt ├── choice.com.au.txt ├── chomsky.info.txt ├── chrisltd.com.txt ├── christianitytoday.com.txt ├── christies.com.txt ├── chrome.google.com.txt ├── chronicle.com.txt ├── ciaosamin.com.txt ├── cicero.de.txt ├── cio.com.txt ├── ciperchile.cl.txt ├── cityam.com.txt ├── citylab.com.txt ├── cjr.org.txt ├── clarin.com.txt ├── 
classcentral.com.txt ├── cleafy.com.txt ├── cleantechnica.com.txt ├── clientk.com.txt ├── cloud.google.com.txt ├── cloudacademy.com.txt ├── clubic.com.txt ├── cmace.de.txt ├── cmns.umd.edu.txt ├── cmswire.com.txt ├── cn.engadget.com.txt ├── cn.nytimes.com.txt ├── cn.reuters.com.txt ├── cnbc.com.txt ├── cnet.com.txt ├── cnetfrance.fr.txt ├── cnews.ru.txt ├── cnn.com.txt ├── cnrs.fr.txt ├── cntraveller.com.txt ├── coalicionporelevangelio.org.txt ├── code.activestate.com.txt ├── code.google.com.txt ├── codebase64.org.txt ├── codeproject.com.txt ├── codinghorror.com.txt ├── codyhosterman.com.txt ├── coffeecircle.com.txt ├── cohost.org.txt ├── cointelegraph.com.txt ├── collective-evolution.com.txt ├── collegehumor.com.txt ├── columbiaspectator.com.txt ├── come-on.de.txt ├── commentarymagazine.com.txt ├── commitstrip.com.txt ├── commondreams.org.txt ├── commonwealmagazine.org.txt ├── communities-dominate.blogs.com.txt ├── community.element14.com.txt ├── community.openstreetmap.org.txt ├── community.readeck.org.txt ├── composer.json ├── composer.spitfireaudio.com.txt ├── computerbase.de.txt ├── computerworld.com.txt ├── computerworld.dk.txt ├── consortiumnews.com.txt ├── consumerreports.org.txt ├── contexte.com.txt ├── contrepoints.org.txt ├── cookies.frankwatching.com.txt ├── cooking.nytimes.com.txt ├── cooper.com.txt ├── core77.com.txt ├── correctiv.org.txt ├── costanachrichten.com.txt ├── counterpunch.org.txt ├── countrylife.co.uk.txt ├── courrierdesbalkans.fr.txt ├── courrierdeuropecentrale.fr.txt ├── courrierinternational.com.txt ├── crikey.com.au.txt ├── crimemagazine.com.txt ├── crimereads.com.txt ├── crimethinc.com.txt ├── criterion.com.txt ├── crn.de.txt ├── crunchyroll.com.txt ├── csmonitor.com.txt ├── csnphilly.com.txt ├── csoonline.com.txt ├── css-tricks.com.txt ├── csswizardry.com.txt ├── ctxt.es.txt ├── cucharasonica.com.txt ├── cultofmac.com.txt ├── culturebd.com.txt ├── custom └── nerdy.dev.txt ├── cw.com.tw.txt ├── cwnp.com.txt ├── cyrille-borne.com.txt 
├── da.feedsportal.com.txt ├── dadall.info.txt ├── dafoster.net.txt ├── dagogtid.no.txt ├── daily-osm-tips.getsendstack.com.txt ├── dailydot.com.txt ├── dailykos.com.txt ├── dailymail.co.uk.txt ├── dailymaverick.co.za.txt ├── dailymotion.com.txt ├── dailynord.fr.txt ├── dailysabah.com.txt ├── dailystar.com.lb.txt ├── dallasnews.com.txt ├── danbooru.donmai.us.txt ├── danluu.com.txt ├── dansdata.com.txt ├── dantri.com.vn.txt ├── daringfireball.net.txt ├── daserste.ndr.de.txt ├── dasgelbeblatt.de.txt ├── davidwalsh.name.txt ├── dazeddigital.com.txt ├── dbazi.com.txt ├── dcurt.is.txt ├── deadline.com.txt ├── deadspin.com.txt ├── declassifieduk.org.txt ├── defenseone.com.txt ├── deia.com.txt ├── deichstube.de.txt ├── deliverydoubled.com.txt ├── delong.typepad.com.txt ├── democracynow.org.txt ├── demorgen.be.txt ├── denikn.cz.txt ├── der-postillon.com.txt ├── derbund.ch.txt ├── derekseaman.com.txt ├── derstandard.at.txt ├── derstandard.de.txt ├── des-livres-pour-changer-de-vie.fr.txt ├── designsponge.com.txt ├── designtagebuch.de.txt ├── deutsche-apotheker-zeitung.de.txt ├── dev.to.txt ├── devblogs.microsoft.com.txt ├── developer.mozilla.org.txt ├── developers.facebook.com.txt ├── devlinsangle.blogspot.co.at.txt ├── dezeen.com.txt ├── diagonalperiodico.net.txt ├── dice.com.txt ├── dictionary.reference.com.txt ├── diepresse.com.txt ├── digg.com.txt ├── digiphoto.techbang.com.txt ├── digital-photography-school.com.txt ├── digitalcourage.de.txt ├── digitalfernsehen.de.txt ├── digitalforensics.com.txt ├── digitalkamera.de.txt ├── digitalspy.co.uk.txt ├── dilbert.com.txt ├── dinamalar.com.txt ├── disclose.ngo.txt ├── discuss.logseq.com.txt ├── dispatchesjournal.org.txt ├── dissentmagazine.org.txt ├── distributistreview.com.txt ├── dn.pt.txt ├── dn.se.txt ├── dobreprogramy.pl.txt ├── doc.rust-lang.org.txt ├── doc.rust-lang.ru.txt ├── doc.wallabag.org.txt ├── docs.opnsense.org.txt ├── dodgersway.com.txt ├── domo-blog.fr.txt ├── domusweb.it.txt ├── donnahay.com.au.txt ├── 
dorkly.com.txt ├── dou.ua.txt ├── douban.com.txt ├── doughellmann.com.txt ├── dpreview.com.txt ├── dr-b.io.txt ├── dr.dk.txt ├── drdobbs.com.txt ├── drgoulu.com.txt ├── drive2.ru.txt ├── dropbox.com.txt ├── drupal.org.txt ├── dummies.com.txt ├── dushumashang.com.txt ├── dw.com.txt ├── dzone.com.txt ├── earther.com.txt ├── eastoftheweb.com.txt ├── eatsmarter.de.txt ├── ebay.com.txt ├── ecetia.com.txt ├── echo-online.de.txt ├── echo24.de.txt ├── eckerd.edu.txt ├── econlog.econlib.org.txt ├── economichardship.org.txt ├── economie.gouv.fr.txt ├── economist.com.txt ├── ecranlarge.com.txt ├── edge-online.com.txt ├── edge.org.txt ├── edition.channel5belize.com.txt ├── edition.cnn.com.txt ├── edn.com.txt ├── eetimes.com.txt ├── eff.org.txt ├── einfach-tasty.de.txt ├── ekantipur.com.txt ├── ekultura.hu.txt ├── elance.com.txt ├── elblogsalmon.com.txt ├── elconfidencial.com.txt ├── elderscrollsonline.com.txt ├── eleconomista.es.txt ├── electrek.co.txt ├── electromaker.io.txt ├── elektroautomobil.com.txt ├── elektroniknet.de.txt ├── elementor.contentlabs.ca.txt ├── elespanol.com.txt ├── elfster.com.txt ├── elmalpensante.com.txt ├── elmundo.es.txt ├── elpais.com.txt ├── eltonjohn.com.txt ├── emaratalyoum.com.txt ├── en.espnf1.com.txt ├── engadget.com.txt ├── engineering.tumblr.com.txt ├── english.aljazeera.net.txt ├── enikos.gr.txt ├── enterprisersproject.com.txt ├── entertainment.timesonline.co.uk.txt ├── entheogenesis.org.txt ├── entrepreneurshandbook.co.txt ├── entwickler.de.txt ├── enviscope.com.txt ├── ericsuh.com.txt ├── ernestmag.fr.txt ├── escapistmagazine.com.txt ├── esglobal.org.txt ├── espacepolitique.revues.org.txt ├── espn.go.com.txt ├── esquire.com.txt ├── esslinger-zeitung.de.txt ├── essonneinfo.fr.txt ├── estadao.com.br.txt ├── eternabuenosaires.com.txt ├── euractiv.com.txt ├── euractiv.fr.txt ├── eurogamer.net.txt ├── everydayfeminism.com.txt ├── evo.co.uk.txt ├── eweek.com.txt ├── exoplanets.nasa.gov.txt ├── explainthatstuff.com.txt ├── explosm.net.txt ├── 
expresso.sapo.pt.txt ├── extracine.com.txt ├── extratipp.com.txt ├── f-droid.org.txt ├── facebook.com.txt ├── facta.co.jp.txt ├── factuel.info.txt ├── fair.org.txt ├── fairphone.com.txt ├── fakirpresse.info.txt ├── falter.at.txt ├── fanfiction.net.txt ├── fastcompany.com.txt ├── faz.net.txt ├── feeds.feedblitz.com.txt ├── fehmarn24.de.txt ├── fernbahntunnel-frankfurt.de.txt ├── fertigung.de.txt ├── fictionpress.com.txt ├── ficwad.com.txt ├── fiftytwo.in.txt ├── filamentgroup.com.txt ├── filmstarts.de.txt ├── findtheswagger.tumblr.com.txt ├── finexpert.e15.cz.txt ├── fingerprint.ippen.media.txt ├── firstmonday.org.txt ├── firstthings.com.txt ├── fivebooks.com.txt ├── fivefilters.org.txt ├── fivethirtyeight.com.txt ├── flyingmachinestudios.com.txt ├── fm4.orf.at.txt ├── fmhy.net.txt ├── fnal.gov.txt ├── fnp.de.txt ├── focus-numerique.com.txt ├── focus.de.txt ├── fok.nl.txt ├── fokus.se.txt ├── foley.com.txt ├── folklore.org.txt ├── food.com.txt ├── fool.com.txt ├── forbes.com.txt ├── forbiddenstories.org.txt ├── foreignaffairs.com.txt ├── foreignpolicy.com.txt ├── formula1.com.txt ├── forsvaret.no.txt ├── fortelabs.co.txt ├── forward.com.txt ├── fossbytes.com.txt ├── foxnews.com.txt ├── fr.de.txt ├── framablog.org.txt ├── france24.com.txt ├── franceculture.fr.txt ├── frandroid.com.txt ├── frankenpost.de.txt ├── freecodecamp.org.txt ├── freelancer.com.txt ├── freemovement.org.uk.txt ├── fria.nu.txt ├── friatidningen.se.txt ├── frmplus.de.txt ├── fromreformationtoreformation.com.txt ├── frontburner.dmagazine.com.txt ├── frontpagelinux.com.txt ├── fs.blog.txt ├── ft.com.txt ├── ftchinese.com.txt ├── fularsizentellik.com.txt ├── fuldaerzeitung.de.txt ├── funnyjunk.com.txt ├── futura-sciences.com.txt ├── futurezone.at.txt ├── futurism.com.txt ├── fzone.cz.txt ├── gamasutra.com.txt ├── gameblog.fr.txt ├── gamedev.net.txt ├── gamekult.com.txt ├── gamer.no.txt ├── gamereactor.no.txt ├── gamesradar.com.txt ├── gameswirtschaft.de.txt ├── ganglia.info.txt ├── gatesnotes.com.txt 
├── gatopardo.com.txt ├── gauchiste.fr.txt ├── gawker.com.txt ├── geeksofdoom.com.txt ├── geenstijl.nl.txt ├── generation-nt.com.txt ├── germangirlinamerica.com.txt ├── geschichtedergegenwart.ch.txt ├── getnews.jp.txt ├── getpocket.com.txt ├── ghanaweb.com.txt ├── giantbomb.com.txt ├── giessener-allgemeine.de.txt ├── giga.de.txt ├── gigaom.com.txt ├── gihyo.jp.txt ├── gist.github.com.txt ├── git-scm.com.txt ├── github.blog.txt ├── github.com.txt ├── gizmodo.com.au.txt ├── gizmodo.com.txt ├── gizmodo.uol.com.br.txt ├── gizmologia.com.txt ├── gizmovil.com.txt ├── glasnaya.media.txt ├── glazman.org.txt ├── global.txt ├── globalgrind.com.txt ├── globalissues.org.txt ├── globalresearch.ca.txt ├── gloswielkopolski.pl.txt ├── gnppn.fr.txt ├── gnz.de.txt ├── goal.com.txt ├── gocomics.com.txt ├── gofugyourself.com.txt ├── gokulkrishh.github.io.txt ├── gold.ac.uk.txt ├── goldseiten.de.txt ├── golem.de.txt ├── good.is.txt ├── goodfil.ms.txt ├── goodreads.com.txt ├── gorky.media.txt ├── gossip-tv.gr.txt ├── goteborgsfria.se.txt ├── gothamist.com.txt ├── gov.uk.txt ├── gp.se.txt ├── gq-magazine.co.uk.txt ├── gq.com.txt ├── grafikart.fr.txt ├── granta.com.txt ├── grantland.com.txt ├── greatergreaterwashington.org.txt ├── greaterwrong.com.txt ├── greensavers.sapo.pt.txt ├── groene.nl.txt ├── groups.drupal.org.txt ├── grubstreet.com.txt ├── grumpygamer.com.txt ├── gsmarena.com.txt ├── gulfnews.com.txt ├── guokr.com.txt ├── gurumed.org.txt ├── gurusblog.com.txt ├── guyaweb.com.txt ├── haaretz.co.il.txt ├── haaretz.com.txt ├── haberler.com.txt ├── habr.com.txt ├── habrahabr.ru.txt ├── hackersrepublic.org.txt ├── hackertarget.com.txt ├── hackmake.org.txt ├── hackneycitizen.co.uk.txt ├── hacks.mozilla.org.txt ├── hallo-muenchen.de.txt ├── halo.bungie.org.txt ├── hanau-wuerzburg-fulda.de.txt ├── hanauer.de.txt ├── handelsblatt.com.txt ├── hanselman.com.txt ├── happyassassin.net.txt ├── hardware.fr.txt ├── hardware.no.txt ├── hardwareluxx.de.txt ├── harpers.org.txt ├── harzkurier.de.txt 
├── hazlitt.net.txt ├── hbr.org.txt ├── headrush.typepad.com.txt ├── health.com.txt ├── health.gov.au.txt ├── healthland.time.com.txt ├── healthletter.mayoclinic.com.txt ├── healthline.com.txt ├── heatmap.news.txt ├── heidelberg24.de.txt ├── heise.de.txt ├── hellofresh.de.txt ├── help.fivefilters.org.txt ├── hemmings.com.txt ├── hersfelder-zeitung.de.txt ├── hespress.com.txt ├── hessen.de.txt ├── hessenschau.de.txt ├── higcapital.com.txt ├── highscalability.com.txt ├── hiiraan.com.txt ├── hillstreetgrocer.com.txt ├── hindustantimes.com.txt ├── hiperpop.com.txt ├── hipertextual.com.txt ├── hiphopleeft.nl.txt ├── histoire-filante.fr.txt ├── histoire.presse.fr.txt ├── historic-uk.com.txt ├── historytoday.com.txt ├── hln.be.txt ├── hmercer.com.txt ├── hna.de.txt ├── hochheimer-zeitung.de.txt ├── hodinkee.com.txt ├── hollywoodlife.com.txt ├── hometheaterreview.com.txt ├── hosted.ap.org.txt ├── hosted2.ap.org.txt ├── houstonchronicle.com.txt ├── howtogeek.com.txt ├── hpd.de.txt ├── hs.fi.txt ├── ht.ly.txt ├── huffingtonpost.co.uk.txt ├── huffingtonpost.fr.txt ├── huffpost.com.txt ├── humanite.fr.txt ├── humantransit.org.txt ├── hurriyet.com.tr.txt ├── hvg.hu.txt ├── hypebeast.com.txt ├── ianlewis.org.txt ├── iansommerville.com.txt ├── icannabis.tumblr.com.txt ├── ichkoche.at.txt ├── ici.radio-canada.ca.txt ├── idealog.co.nz.txt ├── idlewords.com.txt ├── ieeexplore.ieee.org.txt ├── ietf.org.txt ├── igen.fr.txt ├── igeneration.fr.txt ├── ikz-online.de.txt ├── ilounge.com.txt ├── ilyabirman.ru.txt ├── immub.org.txt ├── imore.com.txt ├── in-muenchen.de.txt ├── inc.com.txt ├── indehekken.net.txt ├── independent.co.uk.txt ├── indiatimes.com.txt ├── indiehackers.com.txt ├── indiewire.com.txt ├── inessential.com.txt ├── infolibre.es.txt ├── infoq.com.txt ├── informador.com.mx.txt ├── information.dk.txt ├── informationarchitects.net.txt ├── informationclearinghouse.info.txt ├── informit.com.txt ├── infovaticana.com.txt ├── infoworld.com.txt ├── infzm.com.txt ├── ingame.de.txt ├── 
inhabitat.com.txt ├── innsalzach24.de.txt ├── inquirer.com.txt ├── inquirer.net.txt ├── instagr.am.txt ├── instructables.com.txt ├── insuedthueringen.de.txt ├── intelligenceonline.fr.txt ├── interconnected.org.txt ├── interestingengineering.com.txt ├── intern-mag.com.txt ├── interviewmagazine.com.txt ├── investigation.rollingstone.com.txt ├── investopedia.com.txt ├── inwestomat.eu.txt ├── ipadclub.nl.txt ├── ipadplanet.nl.txt ├── iphon.fr.txt ├── iphoneaddict.fr.txt ├── iphoneclub.nl.txt ├── iphonehacks.com.txt ├── iphonetweak.fr.txt ├── iplaysoft.com.txt ├── ishadeed.com.txt ├── iso.500px.com.txt ├── isource.com.txt ├── ispatguru.com.txt ├── it-connect.fr.txt ├── itavisen.no.txt ├── itmedia.co.jp.txt ├── itnews.com.au.txt ├── itsfoss.com.txt ├── itstactical.com.txt ├── itunes.apple.com.txt ├── itwire.com.txt ├── itworld.com.txt ├── izismile.com.txt ├── jacobin.com.txt ├── jalopnik.com.txt ├── jamesclear.com.txt ├── jameslandrith.com.txt ├── jamieoliver.com.txt ├── jandan.net.txt ├── japoninfos.com.txt ├── javascript.plainenglish.io.txt ├── javaworld.com.txt ├── jdubuzz.com.txt ├── je-suis-papa.com.txt ├── jesuisundev.com.txt ├── jetzt.de.txt ├── jetzt.sueddeutsche.de.txt ├── jeuxvideo.com.txt ├── jezebel.com.txt ├── jjahnke.net.txt ├── jneurosci.org.txt ├── jobbank.gc.ca.txt ├── joelonsoftware.com.txt ├── johannesbader.ch.txt ├── johnnysgamelogs.fr.txt ├── jollinger.com.txt ├── journal.markusthoma.com.txt ├── journaldugamer.com.txt ├── journaldugeek.com.txt ├── journals.plos.org.txt ├── journals.sagepub.com.txt ├── joystiq.com.txt ├── jpmens.net.txt ├── jsforcats.com.txt ├── juedische-allgemeine.de.txt ├── juejin.cn.txt ├── juliareda.eu.txt ├── julieandrieu.com.txt ├── jungle-world.com.txt ├── juppy.org.txt ├── jvns.ca.txt ├── jvt.me.txt ├── kachestvo.ru.txt ├── kathimerini.gr.txt ├── kattascha.de.txt ├── kb.mailbox.org.txt ├── kenfm.de.txt ├── kenrockwell.com.txt ├── keyboardmag.com.txt ├── keycloak.org.txt ├── kicker.de.txt ├── kickstarter.com.txt ├── 
kinder-verstehen.de.txt ├── kingarthurflour.com.txt ├── kingstonist.com.txt ├── kingz.fr.txt ├── klimareporter.de.txt ├── knoten-stadion.de.txt ├── knowablemagazine.org.txt ├── ko-fi.com.txt ├── kochbar.de.txt ├── kommersant.ru.txt ├── kont.me.txt ├── korben.info.txt ├── kotaku.com.txt ├── kottke.org.txt ├── kqed.org.txt ├── krautreporter.de.txt ├── krebsonsecurity.com.txt ├── kreis-anzeiger.de.txt ├── kreisbote.de.txt ├── kreiszeitung.de.txt ├── kresus.org.txt ├── kriswrites.com.txt ├── krone.at.txt ├── krzbb.de.txt ├── kuemmerle.name.txt ├── kulturegeek.fr.txt ├── kumailplus.com.txt ├── kumb.com.txt ├── kurier.de.txt ├── kurierverlag.de.txt ├── kwerfeldein.de.txt ├── labs.bishopfox.com.txt ├── labs.mwrinfosecurity.com.txt ├── labs.ripe.net.txt ├── lado.mx.txt ├── lalettrea.fr.txt ├── lalibre.be.txt ├── lampertheimer-zeitung.de.txt ├── landetsfria.se.txt ├── laphamsquarterly.org.txt ├── lapin-blanc.blogs.docteo.net.txt ├── lapresse.ca.txt ├── laquadrature.net.txt ├── lareviewofbooks.org.txt ├── larevuedesmedias.ina.fr.txt ├── latimes.com.txt ├── laughingsquid.com.txt ├── lauterbacher-anzeiger.de.txt ├── lawfareblog.com.txt ├── leancrew.com.txt ├── leb.fbi.gov.txt ├── leblogduhacker.fr.txt ├── lececil.org.txt ├── lecker.de.txt ├── ledauphine.com.txt ├── ledoc-info.com.txt ├── leereamsnyder.com.txt ├── lefigaro.fr.txt ├── lefilrouge.media.txt ├── legrandcontinent.eu.txt ├── lehollandaisvolant.net.txt ├── leinetal24.de.txt ├── lejournal.cnrs.fr.txt ├── lemmy.ml.txt ├── lemonde.fr.txt ├── lenta.ru.txt ├── lepoint.fr.txt ├── lequatreheures.com.txt ├── lequipe.fr.txt ├── lesecolohumanistes.fr.txt ├── lesjours.fr.txt ├── lesnumeriques.com.txt ├── lesoir.be.txt ├── lesprosdelapetiteenfance.fr.txt ├── lesswrong.com.txt ├── letraslibres.com.txt ├── lexpress.fr.txt ├── lezephyrmag.com.txt ├── libcom.org.txt ├── liberation.fr.txt ├── lifeclub.org.txt ├── lifehack.org.txt ├── lifehacker.com.txt ├── lifestyle.inquirer.net.txt ├── lifeweek.com.cn.txt ├── lightreading.com.txt ├── 
limprevu.fr.txt ├── link.springer.com.txt ├── linkedin.com.txt ├── linux-community.de.txt ├── linux-magazin.de.txt ├── linux.com.txt ├── linuxconfig.org.txt ├── linuxjournal.com.txt ├── linuxnix.com.txt ├── literaryreview.co.uk.txt ├── lithub.com.txt ├── livescience.com.txt ├── longform.org.txt ├── longreads.com.txt ├── longreads.tni.org.txt ├── loopinsight.com.txt ├── lostgarden.com.txt ├── lotro.com.txt ├── lowtechmagazine.com.txt ├── lrb.co.uk.txt ├── ludwigshafen24.de.txt ├── lukew.com.txt ├── luminous-landscape.com.txt ├── lupa.cz.txt ├── lux-magazine.com.txt ├── luxuo.com.txt ├── lvsl.fr.txt ├── lwlies.com.txt ├── lwn.net.txt ├── lynalden.com.txt ├── m.bbc.co.uk.txt ├── m.douban.com.txt ├── m.dw.com.txt ├── m.facebook.com.txt ├── m.theregister.co.uk.txt ├── m.wikihow.com.txt ├── m.xkcd.com.txt ├── m00natic.github.io.txt ├── mac4ever.com.txt ├── macdrifter.com.txt ├── macg.co.txt ├── macmagazine.com.br.txt ├── macrumors.com.txt ├── macstories.net.txt ├── mactalk.com.au.txt ├── mactechnews.de.txt ├── macworld.com.txt ├── mailchi.mp.txt ├── main-spitze.de.txt ├── mainpost.de.txt ├── maitre-eolas.fr.txt ├── make.wordpress.org.txt ├── makramayache.com.txt ├── malekal.com.txt ├── manager-magazin.de.txt ├── manager.co.th.txt ├── manga-news.com.txt ├── mangfall24.de.txt ├── mannheim24.de.txt ├── marciniwuc.com.txt ├── marco.org.txt ├── marcobehler.com.txt ├── marcvidal.net.txt ├── marginalrevolution.com.txt ├── marigold.cz.txt ├── maritimedanmark.dk.txt ├── marketresearchdirect.com.txt ├── markmanson.net.txt ├── marksdailyapple.com.txt ├── marktechpost.com.txt ├── marmiton.org.txt ├── marriedtothesea.com.txt ├── marsactu.fr.txt ├── martinfowler.com.txt ├── mashable.com.txt ├── matija.suklje.name.txt ├── matt.might.net.txt ├── mattcutts.com.txt ├── matthewball.co.txt ├── maxim.com.txt ├── mbari.org.txt ├── mbk-news.appspot.com.txt ├── mbl.is.txt ├── mcconnellsmedchem.com.txt ├── mcorbin.fr.txt ├── mdpi.com.txt ├── mdr.de.txt ├── mebedo.de.txt ├── mediacites.fr.txt ├── 
medialens.org.txt ├── mediapart.fr.txt ├── medium.com.txt ├── medscape.com.txt ├── meduza.io.txt ├── megamp3.eu.txt ├── mein-hbf-ffm.de.txt ├── mein-mmo.de.txt ├── meine-anzeigenzeitung.de.txt ├── mentalfloss.com.txt ├── meowni.ca.txt ├── mercatornet.com.txt ├── mercurynews.com.txt ├── merkur.de.txt ├── merkurist.de.txt ├── mesec.cz.txt ├── metafilter.com.txt ├── metro.co.uk.txt ├── metrocop.net.txt ├── mforum.cari.com.my.txt ├── miamiherald.com.txt ├── microsiervos.com.txt ├── middleeasteye.net.txt ├── mikeash.com.txt ├── mikeindustries.com.txt ├── minnesota.publicradio.org.txt ├── minnpost.com.txt ├── mintpressnews.com.txt ├── miops.com.txt ├── mirrorfootball.co.uk.txt ├── mises.org.txt ├── missnumerique.com.txt ├── mithatkonar.com.txt ├── mitie.com.txt ├── mittelhessen.de.txt ├── mlb.sbnation.com.txt ├── mlssoccer.com.txt ├── mmo-champion.com.txt ├── mnn.com.txt ├── mno.hu.txt ├── mobile.lemondeinformatique.fr.txt ├── mobile.nytimes.com.txt ├── mobile.twitter.com.txt ├── mobilegeeks.de.txt ├── mobilenet.cz.txt ├── mobileopportunity.blogspot.com.txt ├── mobilmania.cz.txt ├── modernghana.com.txt ├── momentumsaga.com.txt ├── monde-diplomatique.fr.txt ├── money.cnn.com.txt ├── moneysavingexpert.com.txt ├── monkeyuser.com.txt ├── monkeyzen.com.txt ├── montelimar-news.fr.txt ├── moo.nac.uci.edu.txt ├── moonsault.de.txt ├── morgenpost.de.txt ├── mothering.com.txt ├── motherjones.com.txt ├── moto-net.com.txt ├── motorcyclistonline.com.txt ├── motorfull.com.txt ├── motorsport-magazin.com.txt ├── movie.douban.com.txt ├── mp.weixin.qq.com.txt ├── msdn.microsoft.com.txt ├── msdvetmanual.com.txt ├── msn.com.txt ├── msnbc.msn.com.txt ├── mtlblog.com.txt ├── muenster.de.txt ├── multinationales.org.txt ├── muse.jhu.edu.txt ├── muycomputerpro.com.txt ├── muyinteresante.com.txt ├── muyinteresante.es.txt ├── muylinux.com.txt ├── mymodernmet.com.txt ├── myrecipes.com.txt ├── mysqlblog.fivefarmers.com.txt ├── mytotalretail.com.txt ├── n-tv.de.txt ├── n.survol.fr.txt ├── 
nachdenkseiten.de.txt ├── nachrichten.at.txt ├── naiz.eus.txt ├── najlepsze-ksiazki.pl.txt ├── nakedsecurity.sophos.com.txt ├── narratively.com.txt ├── nasa.gov.txt ├── nationalgeographic.de.txt ├── nationalpost.com.txt ├── nationalreview.com.txt ├── natura-sciences.com.txt ├── nature.com.txt ├── nbnnews.com.au.txt ├── ncbi.nlm.nih.gov.txt ├── nejm.org.txt ├── net-security.org.txt ├── netflixtechblog.com.txt ├── netmagazine.com.txt ├── networkworld.com.txt ├── netzoekonom.de.txt ├── netzpolitik.org.txt ├── neues-deutschland.de.txt ├── neunetz.com.txt ├── newcriterion.com.txt ├── newmedia.calcalist.co.il.txt ├── newrepublic.com.txt ├── news.bayern.txt ├── news.cnet.com.txt ├── news.com.au.txt ├── news.detik.com.txt ├── news.google.com.txt ├── news.mynavi.jp.txt ├── news.pixelistes.com.txt ├── news.rambler.ru.txt ├── news.rub.de.txt ├── news.techmeme.com.txt ├── news.ycombinator.com.txt ├── news247.gr.txt ├── newsbomb.gr.txt ├── newsinfo.inquirer.net.txt ├── newsletter.pragmaticengineer.com.txt ├── newstatesman.com.txt ├── newsunspun.org.txt ├── newsweek.com.txt ├── newswise.com.txt ├── newtimesslo.com.txt ├── newyorker.com.txt ├── next.ink.txt ├── nextcloud.com.txt ├── nextdraft.com.txt ├── nf-farn.de.txt ├── nfl.com.txt ├── nicj.net.txt ├── nifi.apache.org.txt ├── nintendoworldreport.com.txt ├── nitter.net.txt ├── nj.com.txt ├── noidea.dog.txt ├── nojesguiden.se.txt ├── nordmainische-s-bahn.de.txt ├── northumberlandview.ca.txt ├── nos.nl.txt ├── nosalty.hu.txt ├── nota-bene.org.txt ├── notebookcheck.net.txt ├── notimx.mx.txt ├── nouvelobs.com.txt ├── novastan.org.txt ├── novinky.cz.txt ├── np-coburg.de.txt ├── nplusonemag.com.txt ├── npr.org.txt ├── nrc.nl.txt ├── nrz.de.txt ├── ntoskrnl.org.txt ├── numerama.com.txt ├── nybooks.com.txt ├── nymag.com.txt ├── nytimes.com.txt ├── nzz.ch.txt ├── o6asan.com.txt ├── oberhessische-zeitung.de.txt ├── observers.france24.com.txt ├── ocu.org.txt ├── off.net.mk.txt ├── oko.press.txt ├── oktoberfest.bayern.txt ├── 
oltnertagblatt.ch.txt ├── omgubuntu.co.uk.txt ├── omiliya.org.txt ├── onb.ac.at.txt ├── oncletom.io.txt ├── onlinewelten.com.txt ├── ontologicalgeek.com.txt ├── op-online.de.txt ├── open.online.txt ├── openai.com.txt ├── opendemocracy.net.txt ├── opensource.com.txt ├── opensource.org.txt ├── openstreetmap.org.txt ├── openthemagazine.com.txt ├── optimizesmart.com.txt ├── orf.at.txt ├── orientxxi.info.txt ├── origo.hu.txt ├── oschina.net.txt ├── osmand.net.txt ├── osmc.tv.txt ├── ostechnix.com.txt ├── ostprog.de.txt ├── otz.de.txt ├── ourworldindata.org.txt ├── outsideonline.com.txt ├── ovb-online.de.txt ├── oxfordamerican.org.txt ├── paddle.com.txt ├── pagenotfound.cz.txt ├── palmbeachpost.com.txt ├── pandemicequityinitiative.com.txt ├── pandodaily.com.txt ├── panic.com.txt ├── paperpaper.ru.txt ├── papertohtml.org.txt ├── papodehomem.com.br.txt ├── paquier.xyz.txt ├── parislemon.com.txt ├── parliament.uk.txt ├── parool.nl.txt ├── pastebin.com.txt ├── pastepad.fivefilters.org.txt ├── pathawks.com.txt ├── patreon.com.txt ├── pcgamer.com.txt ├── pcmag.com.txt ├── pcworld.com.txt ├── penny-arcade.com.txt ├── pentaxforums.com.txt ├── peoplesdispatch.org.txt ├── perell.com.txt ├── perspective-daily.de.txt ├── pestemag.com.txt ├── pfefferminzia.de.txt ├── pflegen-online.de.txt ├── pharmazeutische-zeitung.de.txt ├── phastidio.net.txt ├── philosophyforlife.org.txt ├── philosophynow.org.txt ├── philstar.com.txt ├── phoronix.com.txt ├── photo.tutsplus.com.txt ├── photografix-magazin.de.txt ├── photopills.com.txt ├── phototrend.fr.txt ├── php.net.txt ├── phys.org.txt ├── pinterest.com.txt ├── piped.video.txt ├── pitchfork.com.txt ├── pittsburghmagazine.com.txt ├── pixellibre.net.txt ├── pjmedia.com.txt ├── placegrenet.fr.txt ├── planet3dnow.de.txt ├── planetvita.de.txt ├── playboy.com.txt ├── playgroupnsw.org.au.txt ├── ploum.net.txt ├── pluralistic.net.txt ├── plus.google.com.txt ├── plus.lesoir.be.txt ├── plzkthxbai.com.txt ├── pmf.silvrback.com.txt ├── 
poetryfoundation.org.txt ├── pogue.blogs.nytimes.com.txt ├── politico.com.txt ├── politifact.com.txt ├── politiken.dk.txt ├── politis.fr.txt ├── polka.academy.txt ├── polygon.com.txt ├── popehat.com.txt ├── popsci.com.txt ├── popularmechanics.com.txt ├── portertech.ca.txt ├── positioningmag.com.txt ├── posta.com.tr.txt ├── posteo.de.txt ├── postnauka.ru.txt ├── preparedfoods.com.txt ├── presse-citron.net.txt ├── presseportal.de.txt ├── privacyinternational.org.txt ├── pro-linux.de.txt ├── prog21.dadgum.com.txt ├── prolost.com.txt ├── propakistani.pk.txt ├── propublica.org.txt ├── proskauer.com.txt ├── prospectmagazine.co.uk.txt ├── protocol.com.txt ├── protonmail.com.txt ├── protothema.gr.txt ├── psu.edu.txt ├── psyche.co.txt ├── psychologytoday.com.txt ├── psypost.org.txt ├── publications.aap.org.txt ├── publications.parliament.uk.txt ├── publicdomainreview.org.txt ├── publico.pt.txt ├── puri.sm.txt ├── putaindecode.io.txt ├── putsch.media.txt ├── pxlnv.com.txt ├── pymotw.com.txt ├── python.org.txt ├── qctimes.com.txt ├── qntm.org.txt ├── quantamagazine.org.txt ├── quantumdiaries.org.txt ├── quechoisir.org.txt ├── queerty.com.txt ├── questionablecontent.net.txt ├── queue.acm.org.txt ├── quickanddirtytips.com.txt ├── quora.com.txt ├── qz.com.txt ├── rachelandrew.co.uk.txt ├── racjonalista.pl.txt ├── radar.oreilly.com.txt ├── radionz.co.nz.txt ├── radishzz.cc.txt ├── rancher.com.txt ├── randsinrepose.com.txt ├── rasgolatente.es.txt ├── rbb24.de.txt ├── reactjs.org.txt ├── readingthechinadream.com.txt ├── real.gr.txt ├── rebelionenlagranja.com.txt ├── rebooti.com.txt ├── recode.net.txt ├── redalemeden.com.txt ├── redbull.com.txt ├── reddit.com.txt ├── redeszone.net.txt ├── redmas.com.co.txt ├── redmondpie.com.txt ├── redtimmy.com.txt ├── refinery29.com.txt ├── reflets.info.txt ├── regionaltangente-west.de.txt ├── reitschuster.de.txt ├── renenekuda.cz.txt ├── renverse.co.txt ├── report-k.de.txt ├── reportermagazin.cz.txt ├── reporterre.net.txt ├── 
researchandmarkets.com.txt ├── researchgate.net.txt ├── resilience.org.txt ├── retractionwatch.com.txt ├── retro-games.fr.txt ├── reuters.com.txt ├── revdennismccarty.com.txt ├── revue-farouest.fr.txt ├── rework.withgoogle.com.txt ├── rezeptwelt.de.txt ├── rfi.fr.txt ├── rhein-kreis-neuss.de.txt ├── richardkmorgan.com.txt ├── riedbahn.de.txt ├── riffreporter.de.txt ├── ritimo.org.txt ├── rnd.de.txt ├── robertsspaceindustries.com.txt ├── robots.thoughtbot.com.txt ├── rockpapershotgun.com.txt ├── rockylinux.org.txt ├── rodrigo.sharpcube.com.txt ├── rogerebert.com.txt ├── rollingstone.com.txt ├── rom-game.fr.txt ├── romchip.org.txt ├── roomescapeartist.com.txt ├── root.cz.txt ├── rosenheim24.de.txt ├── rottentomatoes.com.txt ├── roughtype.com.txt ├── roy.gbiv.com.txt ├── royalsocietypublishing.org.txt ├── rpgsite.net.txt ├── rtbf.be.txt ├── rtings.com.txt ├── rubysfera.pl.txt ├── rugbyrama.fr.txt ├── ruhlman.com.txt ├── ruhr24.de.txt ├── rums.ms.txt ├── rust-lang-nursery.github.io.txt ├── s6-frankfurt-friedberg.de.txt ├── saadaalnews.net.txt ├── sacbee.com.txt ├── salon.com.txt ├── saltyworld.net.txt ├── salzburg.com.txt ├── san.com.txt ├── sanpedrosun.com.txt ├── sapiens.org.txt ├── sargasso.nl.txt ├── sauerlandkurier.de.txt ├── saveyourself.ca.txt ├── sayidaty.net.txt ├── sbnation.com.txt ├── scheuch.de.txt ├── schneier.com.txt ├── schwarzwaelder-bote.de.txt ├── science.org.txt ├── scienceblogs.de.txt ├── sciencedirect.com.txt ├── scienceticker.info.txt ├── scientificamerican.com.txt ├── scilogs.de.txt ├── scinfolex.com.txt ├── scnsrc.me.txt ├── scotthelme.co.uk.txt ├── scottohara.me.txt ├── scotusblog.com.txt ├── scripting.com.txt ├── scroll.in.txt ├── sdxcentral.com.txt ├── searchenginejournal.com.txt ├── searchengineland.com.txt ├── seattletimes.com.txt ├── seattletransitblog.com.txt ├── sebsauvage.net.txt ├── secouchermoinsbete.fr.txt ├── secretmag.ru.txt ├── securelist.com.txt ├── securityaffairs.co.txt ├── securitylab.ru.txt ├── secushare.org.txt ├── 
segment.com.txt ├── select.yeeyan.org.txt ├── semiaccurate.com.txt ├── seriouseats.com.txt ├── serpentinegalleries.org.txt ├── servethehome.com.txt ├── seznamzpravy.cz.txt ├── sf.eater.com.txt ├── sfgate.com.txt ├── sfweekly.com.txt ├── shabayek.com.txt ├── shahinkalantari.com.txt ├── share.ez.no.txt ├── shawnblanc.net.txt ├── shepherd.com.txt ├── shifteleven.com.txt ├── shipilev.net.txt ├── shz.de.txt ├── siecledigital.fr.txt ├── signal.org.txt ├── singaporeanstocksinvestor.blogspot.com.txt ├── singularityhub.com.txt ├── sivers.org.txt ├── slashdot.org.txt ├── slashfilm.com.txt ├── slate.com.txt ├── slate.fr.txt ├── slice.seriouseats.com.txt ├── slog.thestranger.com.txt ├── slrlounge.com.txt ├── smarthomebeginner.com.txt ├── smashingmagazine.com.txt ├── smbc-comics.com.txt ├── sme.sk.txt ├── smh.com.au.txt ├── smithsonianmag.com.txt ├── snip.ly.txt ├── snob.ru.txt ├── soester-anzeiger.de.txt ├── somethingawful.com.txt ├── songshuhui.net.txt ├── soundcity.tv.txt ├── soundonsound.com.txt ├── sourcebooks.com.txt ├── sowetanlive.co.za.txt ├── spectator.co.uk.txt ├── spectrejournal.com.txt ├── spectrum.ieee.org.txt ├── spektrum.de.txt ├── spiderum.com.txt ├── spiegel.de.txt ├── spiked-online.com.txt ├── spin.com.txt ├── splinternews.com.txt ├── sport.detik.com.txt ├── sport365.fr.txt ├── sports.ru.txt ├── sprengsatz.de.txt ├── sputniknews.com.txt ├── sqlite.org.txt ├── squashed.tumblr.com.txt ├── src └── Files.php ├── srf.ch.txt ├── stackoverflow.blog.txt ├── stackoverflow.com.txt ├── stadt-bremerhaven.de.txt ├── stadt-muenster.de.txt ├── stadtpost.de.txt ├── staltz.com.txt ├── standard.co.uk.txt ├── star-telegram.com.txt ├── statista.com.txt ├── steamcommunity.com.txt ├── stefanjudis.com.txt ├── stephenfry.com.txt ├── stjv.fr.txt ├── stockholmsfria.se.txt ├── stopgame.ru.txt ├── straightdope.com.txt ├── straitstimes.com.txt ├── stratfor.com.txt ├── streetsblog.net.txt ├── stuff.co.nz.txt ├── stumbleupon.com.txt ├── stuttgarter-nachrichten.de.txt ├── 
stuttgarter-zeitung.de.txt ├── substack.com.txt ├── subtraction.com.txt ├── sueddeutsche.de.txt ├── sulek.fr.txt ├── summitroute.com.txt ├── sun-connect.org.txt ├── sunshinecoastdaily.com.au.txt ├── supchina.com.txt ├── superuser.openinfra.dev.txt ├── svd.se.txt ├── svt.se.txt ├── swcarpentry.github.io.txt ├── swissinfo.ch.txt ├── switchonpaper.com.txt ├── sydsvenskan.se.txt ├── symmetrymagazine.org.txt ├── symphozik.info.txt ├── synbioz.com.txt ├── sz-magazin.sueddeutsche.de.txt ├── t-online.de.txt ├── t3n.de.txt ├── t3terminal.com.txt ├── tabletmag.com.txt ├── tagblatt.de.txt ├── tagesanzeiger.ch.txt ├── tagesschau.de.txt ├── tagesspiegel.de.txt ├── takt-magazin.de.txt ├── taste.com.au.txt ├── tasteofhome.com.txt ├── taz.de.txt ├── tbray.org.txt ├── teamliquid.net.txt ├── tech.sina.com.cn.txt ├── techcommunity.microsoft.com.txt ├── techcrunch.com.txt ├── techdirt.com.txt ├── techhive.com.txt ├── techmeme.com.txt ├── techno-science.net.txt ├── technologizer.com.txt ├── technologyreview.com.txt ├── techpinions.com.txt ├── techradar.com.txt ├── techstage.de.txt ├── ted.com.txt ├── telegraph.co.uk.txt ├── telepolis.de.txt ├── telerama.fr.txt ├── tennis.com.txt ├── terrestres.org.txt ├── texasmonthly.com.txt ├── the-magazine.org.txt ├── the-scientist.com.txt ├── the-tls.co.uk.txt ├── theage.com.au.txt ├── theamericanscholar.org.txt ├── theathletic.com.txt ├── theatlantic.com.txt ├── theatlanticcities.com.txt ├── thebaffler.com.txt ├── theblueprint.ru.txt ├── thebulletin.org.txt ├── thecitypaperbogota.com.txt ├── thecounter.org.txt ├── thecreativeindependent.com.txt ├── thecut.com.txt ├── thedailybeast.com.txt ├── thedailymash.co.uk.txt ├── thedisneyblog.com.txt ├── thedrive.com.txt ├── thefader.com.txt ├── thefilmexperience.net.txt ├── theflaw.org.txt ├── thegamedesignforum.com.txt ├── thegap.at.txt ├── theglobalmail.org.txt ├── thegreatdiscontent.com.txt ├── theguardian.com.txt ├── thehansindia.com.txt ├── thehindu.com.txt ├── theins.ru.txt ├── theintercept.com.txt 
├── theinventory.com.txt ├── thekitchn.com.txt ├── them.us.txt ├── themarker.com.txt ├── themillions.com.txt ├── thenation.com.txt ├── thenetworkgarden.blogs.com.txt ├── thenewatlantis.com.txt ├── thenewdaily.com.au.txt ├── thenews.coop.txt ├── thenewstribune.com.txt ├── thenextgeneration.org.txt ├── thenextweb.com.txt ├── theoaklandpress.com.txt ├── theodinproject.com.txt ├── theonion.com.txt ├── theoutline.com.txt ├── theplayerstribune.com.txt ├── thepointmag.com.txt ├── theregister.co.uk.txt ├── theregister.com.txt ├── theringer.com.txt ├── theroot.com.txt ├── therumpus.net.txt ├── thesaturdaypaper.com.au.txt ├── theses.enc.sorbonne.fr.txt ├── thesimpledollar.com.txt ├── theskepticalcardiologist.com.txt ├── thesocialitefamily.com.txt ├── thespoof.com.txt ├── thestranger.com.txt ├── thesun.co.uk.txt ├── thetakeout.com.txt ├── theteaspot.com.txt ├── thethaovanhoa.vn.txt ├── thetimes.co.uk.txt ├── thetorah.com.txt ├── theverge.com.txt ├── theweek.com.txt ├── thewirecutter.com.txt ├── thingiverse.com.txt ├── thinkspot.com.txt ├── thinkwithgoogle.com.txt ├── thisamericanlife.org.txt ├── thisiscolossal.com.txt ├── thoughtco.com.txt ├── threadreaderapp.com.txt ├── threatpost.com.txt ├── thrillist.com.txt ├── thueringer-allgemeine.de.txt ├── ticket.interpark.com.txt ├── tidbits.com.txt ├── tijd.be.txt ├── time.com.txt ├── timeshighereducation.co.uk.txt ├── timeshighereducation.com.txt ├── tipb.com.txt ├── titanic-magazin.de.txt ├── tldp.org.txt ├── tlz.de.txt ├── tnr.com.txt ├── tobias-hartmann.net.txt ├── tofugu.com.txt ├── tomdispatch.com.txt ├── tomsguide.com.txt ├── tomshardware.com.txt ├── tomshardware.de.txt ├── toolinux.com.txt ├── toolsandtoys.net.txt ├── torn.com.txt ├── torontolife.com.txt ├── touilleur-express.fr.txt ├── tourmag.com.txt ├── touteduc.fr.txt ├── towardsdatascience.com.txt ├── towerofthehand.com.txt ├── tracks.ranea.org.txt ├── tradingforaliving.pl.txt ├── trailer.web-view.net.txt ├── trailers.apple.com.txt ├── trailerzone.de.txt ├── 
traningslara.se.txt ├── trendmicro.com.txt ├── triblive.com.txt ├── triple-c.at.txt ├── triplebyte.com.txt ├── trouw.nl.txt ├── troyhunt.com.txt ├── trustedreviews.com.txt ├── truthdig.com.txt ├── truthout.org.txt ├── tthfanfic.org.txt ├── tuaw.com.txt ├── tuhdo.github.io.txt ├── turnoff.us.txt ├── tvline.com.txt ├── tvtropes.org.txt ├── tweakers.net.txt ├── twitter.com.txt ├── twog.fr.txt ├── typo3.com.txt ├── typo3.org.txt ├── tz.de.txt ├── ubuntugeek.com.txt ├── udn.com.txt ├── uefa.com.txt ├── uk.xbox360.ign.com.txt ├── uncannymagazine.com.txt ├── unherd.com.txt ├── uni-watch.com.txt ├── universe.shelfd.com.txt ├── unsertirol24.com.txt ├── unwinnable.com.txt ├── uol.com.br.txt ├── urbandictionary.com.txt ├── us-cert.gov.txt ├── usatoday.com.txt ├── usbeketrica.com.txt ├── useit.com.txt ├── usenix.org.txt ├── utcc.utoronto.ca.txt ├── utdailybeacon.com.txt ├── utiliser-lightroom.com.txt ├── utux.fr.txt ├── ux.artu.tv.txt ├── uxdesign.cc.txt ├── vakarm.net.txt ├── valdaiclub.com.txt ├── vanityfair.com.txt ├── variety.com.txt ├── varsity.co.uk.txt ├── vc.ru.txt ├── vedonlyonti.com.txt ├── velomotion.de.txt ├── venturebeat.com.txt ├── verlagshaus-jaumann.de.txt ├── version2.dk.txt ├── verybestbaking.com.txt ├── vg.no.txt ├── viaoccitanie.tv.txt ├── vice.com.txt ├── videogum.com.txt ├── vienna.at.txt ├── viget.com.txt ├── villagevoice.com.txt ├── vimeo.com.txt ├── vincent.jousse.org.txt ├── viply.de.txt ├── virten.net.txt ├── visir.is.txt ├── visual-planning.com.txt ├── visualcapitalist.com.txt ├── vitispr.com.txt ├── vivirmexico.com.txt ├── vk.com.txt ├── vogue.co.uk.txt ├── vogue.com.txt ├── voices.washingtonpost.com.txt ├── voidstern.net.txt ├── volksfest-freising.de.txt ├── volkskrant.nl.txt ├── voltairenet.org.txt ├── vot-tak.tv.txt ├── vox.com.txt ├── voxeurop.eu.txt ├── vozpopuli.com.txt ├── vr-zone.com.txt ├── vrt.be.txt ├── vulture.com.txt ├── w3.org.txt ├── wa.de.txt ├── wallabag.org.txt ├── warnerbros.fr.txt ├── warriordudimanche.net.txt ├── 
washingtoninstitute.org.txt ├── washingtonmonthly.com.txt ├── washingtonpost.com.txt ├── wasserburg24.de.txt ├── watchlist-internet.at.txt ├── watoday.com.au.txt ├── watson.ch.txt ├── watson.de.txt ├── waz.de.txt ├── web-libre.org.txt ├── web.dev.txt ├── weblogs.asp.net.txt ├── webupd8.org.txt ├── wellcome.org.txt ├── wellcomecollection.org.txt ├── welt.de.txt ├── wenow.com.txt ├── werra-rundschau.de.txt ├── westernadvocate.com.au.txt ├── wetterauer-zeitung.de.txt ├── what-if.xkcd.com.txt ├── whatever.scalzi.com.txt ├── wienerzeitung.at.txt ├── wiesbadener-kurier.de.txt ├── wiesn.bayern.txt ├── wiki.guildwars.com.txt ├── wiki.guildwars2.com.txt ├── wikihow.com.txt ├── wikitravel.org.txt ├── wikiwand.com.txt ├── will-self.com.txt ├── winfuture.de.txt ├── wired.co.uk.txt ├── wired.com.txt ├── wired.jp.txt ├── wiwo.de.txt ├── wlz-online.de.txt ├── wmpoweruser.com.txt ├── wn.de.txt ├── wochenanzeiger.de.txt ├── woman.tvbs.com.tw.txt ├── woolworths.com.au.txt ├── wordpress.org.txt ├── wordswithoutborders.org.txt ├── wordyard.com.txt ├── world.hey.com.txt ├── worldcrunch.com.txt ├── worldpoultry.net.txt ├── worldwidewords.org.txt ├── wormser-zeitung.de.txt ├── wornandwound.com.txt ├── woshub.com.txt ├── wow.joystiq.com.txt ├── wp.de.txt ├── wpbeginner.com.txt ├── wphive.com.txt ├── wpmayor.com.txt ├── wr.de.txt ├── writerunboxed.com.txt ├── wsj.com.txt ├── wsws.org.txt ├── www.blueapron.com.txt ├── www.seriouseats.com.txt ├── www1.folha.uol.com.br.txt ├── www2.cnrs.fr.txt ├── wyborcza.biz.txt ├── wyborcza.pl.txt ├── wysokieobcasy.pl.txt ├── wz-newsline.de.txt ├── xataka.com.txt ├── xatakaciencia.com.txt ├── xatakamovil.com.txt ├── xda-developers.com.txt ├── xlsemanal.com.txt ├── xm.com.txt ├── xn--protin-bva.com.txt ├── yahoo.com.txt ├── ycombinator.com.txt ├── ynet.co.il.txt ├── yosoy.red.txt ├── yostivanich.com.txt ├── yourerie.com.txt ├── youtube.com.txt ├── zaknrw.de.txt ├── zataz.com.txt ├── zdf.de.txt ├── zdnet.com.txt ├── zdopravy.cz.txt ├── ze.tt.txt ├── 
zeit.de.txt ├── zerohedge.com.txt ├── zerokspot.com.txt ├── zetland.dk.txt ├── zhihu.com.txt ├── zhuanlan.zhihu.com.txt ├── zinio.com.txt ├── zive.cz.txt ├── zoomit.ir.txt └── zwiftinsider.com.txt /.about.com.txt: -------------------------------------------------------------------------------- 1 | title: //*[@id='title']//h1 2 | body: //*[(@id = "articlebody")] 3 | test_url: http://nutrition.about.com/od/changeyourdiet/qt/healthysnacks.htm -------------------------------------------------------------------------------- /.allthingsd.com.txt: -------------------------------------------------------------------------------- 1 | body: //div[@id='content-left']/div[@class='post'] 2 | strip_id_or_class: social 3 | strip_id_or_class: atd-disqus-disclaimer 4 | tidy: no 5 | 6 | test_url: http://mediamemo.allthingsd.com/20110516/bit-ly-gets-a-new-boss/ -------------------------------------------------------------------------------- /.craigslist.org.txt: -------------------------------------------------------------------------------- 1 | title: //h2[@class='postingtitle'] 2 | date: //p[@class='postinginfo']/date 3 | 4 | body: //figure[@class='iw'] | //section[@class='cltags' or @id='postingbody'] 5 | prune: no 6 | tidy: no 7 | 8 | test_url: http://sfbay.craigslist.org/hhh/index.rss -------------------------------------------------------------------------------- /.dxy.cn.txt: -------------------------------------------------------------------------------- 1 | body: //div[@id='content'] 2 | prune: no 3 | 4 | test_url: http://neurosurg.dxy.cn/article/87224 -------------------------------------------------------------------------------- /.fivefilters.org.txt: -------------------------------------------------------------------------------- 1 | # Pastepad specific 2 | title: //div[@id='ff-pastepad-content']//h1 3 | body: //div[@id='ff-pastepad-content'] 4 | prune: no 5 | # todo: add test file 6 | test_url: http://pastepad.fivefilters.org/test.html 7 | 
-------------------------------------------------------------------------------- /.ietf.org.txt: -------------------------------------------------------------------------------- 1 | body: //div[@id='content'] 2 | date: //time/@datetime 3 | 4 | insert_detected_image: no 5 | 6 | strip_id_or_class: pilcrow 7 | 8 | prune: no 9 | 10 | test_url: https://datatracker.ietf.org/doc/html/draft-ietf-oauth-sd-jwt-vc-01 11 | -------------------------------------------------------------------------------- /.livejournal.com.txt: -------------------------------------------------------------------------------- 1 | title: //title 2 | strip_image_src: 'l-stat.livejournal.com' 3 | strip_image_src: 'www.livejournal.com' 4 | strip_image_src: 'l-userpic.livejournal.com' 5 | test_url: http://news.livejournal.com/136664.html 6 | test_url: http://stelazin.livejournal.com/91363.html -------------------------------------------------------------------------------- /.mitpress.mit.edu.txt: -------------------------------------------------------------------------------- 1 | strip_id_or_class: wp-block-pullquote 2 | 3 | test_url: https://thereader.mitpress.mit.edu/a-master-perfumers-reflections-on-patchouli-and-vetiver/ 4 | -------------------------------------------------------------------------------- /.mozilla.org.txt: -------------------------------------------------------------------------------- 1 | strip_id_or_class: comments 2 | prune: no 3 | date: //p[@class="entry-posted"]//abbr[@class="published"]/@title 4 | 5 | test_url: https://hacks.mozilla.org/2013/05/how-to-spread-the-word-about-your-code/ -------------------------------------------------------------------------------- /.philhist.unibas.ch.txt: -------------------------------------------------------------------------------- 1 | body: (//div[contains(concat(" ",normalize-space(@class)," ")," content-unibas ")])[1] 2 | 3 | prune: no 4 | 5 | test_url: 
https://dg.philhist.unibas.ch/de/studium/werkzeugkasten-geschichte/wissenschaftliches-arbeiten/quellenanalyse/ 6 | -------------------------------------------------------------------------------- /.readthedocs.io.txt: -------------------------------------------------------------------------------- 1 | title: //h1 2 | body: //div[@role='main'] 3 | test_url: http://docs.readthedocs.io/en/latest/getting_started.html 4 | -------------------------------------------------------------------------------- /.redbullmusicacademy.com.txt: -------------------------------------------------------------------------------- 1 | body: //div[contains(concat(' ',normalize-space(@class),' '),' body ')] 2 | title: //h1[contains(concat(' ',normalize-space(@class),' '),' headline-main ')] 3 | 4 | test_url: https://daily.redbullmusicacademy.com/2014/11/pizzicato-five-feature 5 | 6 | -------------------------------------------------------------------------------- /.repubblica.it.txt: -------------------------------------------------------------------------------- 1 | body: //div[@itemprop="articleBody"] 2 | 3 | prune: no 4 | 5 | test_url: https://rep.repubblica.it/pwa/longform/2020/05/27/news/rsa_morti_coronavirus_trivulzio-257664697/?ref=RHPPTP-BH-I257793309-C12-P7-S1.12-T1 6 | -------------------------------------------------------------------------------- /.rmt.yml: -------------------------------------------------------------------------------- 1 | vcs: 2 | name: git 3 | sign-tag: false 4 | sign-commit: false 5 | version-generator: semantic 6 | version-persister: vcs-tag 7 | post-release-actions: [vcs-publish] 8 | -------------------------------------------------------------------------------- /.robweychert.com.txt: -------------------------------------------------------------------------------- 1 | body: //article[@id='post'] 2 | title: //h1[@class='title'] 3 | prune: no 4 | strip_id_or_class: metadata 5 | strip: //footer 6 | 7 | test_url: 
https://v6.robweychert.com/blog/2023/02/field-day-nyc/ 8 | 9 | -------------------------------------------------------------------------------- /.sodexo.com.txt: -------------------------------------------------------------------------------- 1 | body: //main[@id='main'] 2 | 3 | strip: //button 4 | 5 | test_url: https://uk.sodexo.com/home/media/news-room/newsList-area/uk-press-releases/SSAFA-Friendly-to-Forces.html 6 | -------------------------------------------------------------------------------- /.stanford.edu.txt: -------------------------------------------------------------------------------- 1 | title: //div[@id='aueditable']/h1 2 | body: //div[@id='content'] 3 | strip: //div[@id='message' or @id='linklist'] 4 | prune: no 5 | test_url: http://plato.stanford.edu/entries/supervenience/ -------------------------------------------------------------------------------- /.tweakblogs.net.txt: -------------------------------------------------------------------------------- 1 | body: //div[@class="article"] 2 | author: //p[@class="author"]/a 3 | 4 | test_url: http://harryl.tweakblogs.net/blog/11988/voorstellen 5 | -------------------------------------------------------------------------------- /24.ae.txt: -------------------------------------------------------------------------------- 1 | title: //div[@id='DivTitle'] 2 | body: //div[@id='divImages' or @id='Divkhabarcontent'] 3 | author: //div[@id='DivAuthor'] 4 | 5 | prune: no 6 | 7 | test_url: http://24.ae/article.aspx?ArticleId=123304 8 | test_url: http://24.ae/rss.aspx?pageId=30 9 | -------------------------------------------------------------------------------- /24a11y.com.txt: -------------------------------------------------------------------------------- 1 | title: //h1 2 | author: substring-after(//div[contains(@class, "author-description")]//h2[@class="author-title"], 'About') 3 | 4 | test_url: https://www.24a11y.com/2018/web-components-still-need-to-be-accessible/ 5 | 
-------------------------------------------------------------------------------- /24joursdeweb.fr.txt: -------------------------------------------------------------------------------- 1 | author: substring-after(//h2[@class='post-author-title'], 'À propos de ') 2 | date: //p[@class="post-metas"]//time/@datetime 3 | 4 | test_url: https://www.24joursdeweb.fr/2020/impact-environnemental-du-numerique-quelles-regulations/ 5 | -------------------------------------------------------------------------------- /36kr.com.txt: -------------------------------------------------------------------------------- 1 | title: //h1[contains(@class, 'entry-title')] 2 | date: //meta[@name='weibo: article:create_at']/@content 3 | body: //div[contains(@class, 'mainContent')] 4 | strip_id_or_class: related_topics 5 | 6 | prune: no 7 | 8 | test_url: http://www.36kr.com/p/207879.html -------------------------------------------------------------------------------- /37signals.com.txt: -------------------------------------------------------------------------------- 1 | title: //div[@class='post_header']//h2/a 2 | author: //span[@class='author'] 3 | date: //span[@class='date'] 4 | body: //div[@id='Content'] 5 | 6 | test_url: http://37signals.com/svn/posts/2785-the-end-of-the-it-department -------------------------------------------------------------------------------- /43folders.com.txt: -------------------------------------------------------------------------------- 1 | body: //*[@class = 'content'] 2 | author: //*[@class = 'submitted']/a 3 | date: substring-after(//*[@class = 'submitted']/text(), '|') 4 | test_url: http://www.43folders.com/2011/04/22/cranking -------------------------------------------------------------------------------- /512pixels.net.txt: -------------------------------------------------------------------------------- 1 | title: //meta[@property='og:title']/@content 2 | test_url: http://www.512pixels.net/blog/2014/10/the-move 3 | 
-------------------------------------------------------------------------------- /5by5.tv.txt: -------------------------------------------------------------------------------- 1 | body: //*[@id="episode"] 2 | prune: no 3 | tidy: no 4 | 5 | autodetect_next_page: no 6 | strip_id_or_class: player 7 | 8 | strip://*[@id="header"] 9 | test_url: http://5by5.tv/buildanalyze/60 -------------------------------------------------------------------------------- /7newsbelize.com.txt: -------------------------------------------------------------------------------- 1 | title: //*[@id='sstitle'] 2 | body: //div[@id='sstory'] 3 | strip_id_or_class: newsoptions 4 | prune: no 5 | 6 | test_url: http://www.7newsbelize.com/sstory.php?nid=25654 7 | test_url: http://www.7newsbelize.com/7news.xml -------------------------------------------------------------------------------- /9to5mac.com.txt: -------------------------------------------------------------------------------- 1 | strip: //p[preceding::hr]/span[@class="embed-youtube"] 2 | strip: //hr 3 | 4 | test_url: https://9to5mac.com/2017/04/14/toshiba-semiconductor-business-apple-foxconn/ 5 | -------------------------------------------------------------------------------- /LICENSE.txt: -------------------------------------------------------------------------------- 1 | These files are released to the public domain. 2 | 3 | See https://creativecommons.org/publicdomain/zero/1.0/ for more information. 4 | -------------------------------------------------------------------------------- /RMT: -------------------------------------------------------------------------------- 1 | #!/usr/bin/env php 2 | ):

4 | 5 | single_page_link: //div[@class="up-header"]/a 6 | 7 | prune: no 8 | 9 | test_url: http://hvg.hu/w/20111125_sparta -------------------------------------------------------------------------------- /ianlewis.org.txt: -------------------------------------------------------------------------------- 1 | body: //div[contains(concat(' ',normalize-space(@class), ' '),' post-content ')] 2 | 3 | test_url: https://www.ianlewis.org/en/almighty-pause-container 4 | -------------------------------------------------------------------------------- /iansommerville.com.txt: -------------------------------------------------------------------------------- 1 | http_header(user-agent): PHP/5.3 2 | 3 | test_url: http://iansommerville.com/blog/a-guide-to-scottish-delicacies-for-tgo-challengers/ 4 | -------------------------------------------------------------------------------- /icannabis.tumblr.com.txt: -------------------------------------------------------------------------------- 1 | tidy:no 2 | prune:no 3 | 4 | body://div[contains(@id,'content')] 5 | 6 | strip_id_or_class:meta 7 | strip_id_or_class:notes 8 | strip_id_or_class:pagination 9 | test_url: http://icannabis.tumblr.com/post/28660592471/reviewmswireless3000 -------------------------------------------------------------------------------- /ilyabirman.ru.txt: -------------------------------------------------------------------------------- 1 | title: //div[@class='published visible e2-smart-title']//span 2 | author: //span[@id='e2-blog-title'] 3 | date: //p[@class='super-h'] 4 | body: //div[@class='text published visible'] 5 | test_url: http://ilyabirman.ru/meanwhile/2011/11/15/2/ -------------------------------------------------------------------------------- /indehekken.net.txt: -------------------------------------------------------------------------------- 1 | body: //div[@class='post-entry']/p 2 | 3 | test_url: http://www.indehekken.net/you-only-sing-when-youre-rowing/ 4 | 
-------------------------------------------------------------------------------- /indiatimes.com.txt: -------------------------------------------------------------------------------- 1 | body: //figure[@class='mainVideo'] 2 | strip: //figcaption 3 | 4 | prune: no 5 | 6 | test_url: http://www.indiatimes.com/bollywood/kareena-insecure-about-saif-working-with-bipasha-23386.html -------------------------------------------------------------------------------- /indiehackers.com.txt: -------------------------------------------------------------------------------- 1 | prune: no 2 | body: //div[@itemprop="articleBody"] 3 | strip: //aside 4 | strip_id_or_class: partner-spot 5 | 6 | test_url: https://www.indiehackers.com/businesses/paleo-meal-plans 7 | -------------------------------------------------------------------------------- /inessential.com.txt: -------------------------------------------------------------------------------- 1 | title: //div[@class='weblogPost']/h3[1] 2 | author: ("Brent Simmons") 3 | date: //span[@class="weblogPostDisplayDate"] 4 | body: //div[@class='weblogPostBody'] 5 | test_url: http://inessential.com/2011/10/25/why_just_store_the_app_data_on_dropbo -------------------------------------------------------------------------------- /information.dk.txt: -------------------------------------------------------------------------------- 1 | title: //meta[@property='og:title']/@content 2 | author: //*[@property='dc:creator'] 3 | date: //*[@property='dc:date']/@content 4 | body: //div[@id='page-content']//div[contains(@class, 'article-body')] 5 | 6 | tidy: no 7 | test_url: http://www.information.dk/282307 -------------------------------------------------------------------------------- /informationclearinghouse.info.txt: -------------------------------------------------------------------------------- 1 | title: //head/title 2 | body: //table[@id='table3']//div[@class='postContent'] 3 | prune: no 4 | tidy: no 5 | 6 | test_url: 
http://www.informationclearinghouse.info/article28238.htm -------------------------------------------------------------------------------- /inhabitat.com.txt: -------------------------------------------------------------------------------- 1 | # set body 2 | body: //div[@class='post-listing'] 3 | 4 | # remove clutter 5 | strip: //a/big 6 | strip: //a/em 7 | strip: //p/em 8 | test_url: http://inhabitat.com/2010/11/18/sliding-walls-transform-this-tokyo-house-into-an-office/ -------------------------------------------------------------------------------- /instagr.am.txt: -------------------------------------------------------------------------------- 1 | title: //div[@class='caption'] 2 | author: //p[@class='username'] 3 | 4 | strip: //div[@class='contents']/h3 5 | strip: //div[@class='location'] 6 | test_url: http://instagr.am/p/G-s_aciyDJ/ -------------------------------------------------------------------------------- /interconnected.org.txt: -------------------------------------------------------------------------------- 1 | body: //article[1] 2 | date: //meta[@property="og:updated_time"]/@content 3 | 4 | strip: //h2[1] 5 | strip: //h5[1] 6 | 7 | prune: no 8 | tidy: no 9 | 10 | test_url: https://interconnected.org/home/2020/09/10/streak 11 | -------------------------------------------------------------------------------- /interviewmagazine.com.txt: -------------------------------------------------------------------------------- 1 | title: //title 2 | body: //div[contains(@class, 'block')] 3 | 4 | test_url: http://www.interviewmagazine.com/film/spike-jonze -------------------------------------------------------------------------------- /iphonetweak.fr.txt: -------------------------------------------------------------------------------- 1 | title: //div[@class='fond_titre']/h1[@class='post-title'] 2 | body: //div[@class="post-chapo"] 3 | 4 | test_url: http://iphonetweak.fr/2016/05/20/apple-watch-deja-jailbreakee 5 | 
-------------------------------------------------------------------------------- /iplaysoft.com.txt: -------------------------------------------------------------------------------- 1 | body: //div[@id='content']//div[@class='entry-banner' or @class='entry-content'] 2 | test_url: http://www.iplaysoft.com/webbrowserpassview.html -------------------------------------------------------------------------------- /ishadeed.com.txt: -------------------------------------------------------------------------------- 1 | title: //h1 2 | author: //h2[@class="post-author__name"] 3 | 4 | test_url: https://ishadeed.com/article/cascade-layers/ 5 | -------------------------------------------------------------------------------- /isource.com.txt: -------------------------------------------------------------------------------- 1 | # Remove social buttons 2 | strip: //div[@id='temp_Content_Right'] 3 | 4 | # Remove duplicate article title 5 | strip: //*[(@class='storytitle')] 6 | test_url: http://isource.com/2010/10/24/swearch-a-cool-iphone-web-app/ -------------------------------------------------------------------------------- /itavisen.no.txt: -------------------------------------------------------------------------------- 1 | author: //p[@class = 'byline']//span[@class='author'] 2 | 3 | body: //div[@id = 'story-contents'] 4 | test_url: http://itavisen.no/2015/09/08/norske-nettleverandorer-vil-ikke-blokkere-pirate-bay/ 5 | -------------------------------------------------------------------------------- /itmedia.co.jp.txt: -------------------------------------------------------------------------------- 1 | body: //div[@id='cmsBody'] 2 | 3 | next_page_link: //span[@id='next']/a 4 | 5 | strip_id_or_class: cmsCopyright 6 | strip_id_or_class: masterSocialbuttonBtm 7 | 8 | test_url: http://www.itmedia.co.jp/enterprise/articles/0912/05/news002.html -------------------------------------------------------------------------------- /itsfoss.com.txt: 
-------------------------------------------------------------------------------- 1 | title: //h1 2 | body: //article[contains(@class,'type-post')]/div[@itemprop='text'] 3 | strip: //a[@rel='dofollow'] 4 | strip: //div[contains(@class,'zem_rp_wrap')] 5 | strip: //div[@id='shr_canvas2'] 6 | test_url: https://itsfoss.com/fix-gvfsd-smb-high-cpu-ubuntu/ 7 | -------------------------------------------------------------------------------- /itwire.com.txt: -------------------------------------------------------------------------------- 1 | author: //a[@rel="author"] 2 | date: //li[@class="itemDateCreated"] 3 | strip: //div[contains(@class, 'legend-rounded')] 4 | 5 | test_url: http://www.itwire.com/it-industry-news/market/59661-ibm-looks-to-high-value-solutions-to-meet-changing-demands 6 | -------------------------------------------------------------------------------- /izismile.com.txt: -------------------------------------------------------------------------------- 1 | body: //div[starts-with(@id, 'news-id-')] 2 | prune: no 3 | 4 | test_url: http://izismile.com/2011/06/13/uncanny_factoid_fashion_or_creepy_2_pics.html -------------------------------------------------------------------------------- /jacobin.com.txt: -------------------------------------------------------------------------------- 1 | body: //article[contains(@class, 'po__article')] 2 | 3 | strip: //aside 4 | strip: //footer 5 | 6 | prune: no 7 | 8 | test_url: https://www.jacobin.com/2019/07/noam-chomsky-interview-climate-change-imperialism 9 | -------------------------------------------------------------------------------- /jalopnik.com.txt: -------------------------------------------------------------------------------- 1 | title: //head/title 2 | author: //meta[@name="author"]/@content 3 | body: //div[contains(@class, 'js_post-content')] 4 | strip: //div[contains(@class, 'content-summary')] 5 | 6 | test_url: http://jalopnik.com/5892124/1955-porsche-550-spyder-sells-for-record-3685-million/ 7 | 
-------------------------------------------------------------------------------- /jamesclear.com.txt: -------------------------------------------------------------------------------- 1 | body: //div[contains(@class, 'entry-content')] 2 | 3 | test_url: https://jamesclear.com/procrastination 4 | -------------------------------------------------------------------------------- /jandan.net.txt: -------------------------------------------------------------------------------- 1 | body: //div[@id='content']//div[@class = 'post f'] 2 | strip_id_or_class: comment-big 3 | strip_id_or_class: avatar 4 | strip: //div[@class='time_s'] 5 | 6 | test_url: http://jandan.net/2011/04/03/iphone-5-sony.html -------------------------------------------------------------------------------- /je-suis-papa.com.txt: -------------------------------------------------------------------------------- 1 | strip: //noscript 2 | 3 | test_url: http://www.je-suis-papa.com/pandacraft-kit-educatif-creatif-abonnement-12-ans/ 4 | -------------------------------------------------------------------------------- /jjahnke.net.txt: -------------------------------------------------------------------------------- 1 | body: //div[@class='entry'] 2 | prune: no 3 | 4 | test_url: http://www.jjahnke.net/rundbr87.html#2514 -------------------------------------------------------------------------------- /jobbank.gc.ca.txt: -------------------------------------------------------------------------------- 1 | body: //div[@id='formatCont_en'] 2 | 3 | prune: no 4 | 5 | test_url: http://www.jobbank.gc.ca/detail-eng.aspx?Source=JobPosting&OrderNum=6397922 -------------------------------------------------------------------------------- /jollinger.com.txt: -------------------------------------------------------------------------------- 1 | body: //body 2 | 3 | test_url: http://www.jollinger.com/photo/enlargers/guide-to-enlargers.htm 4 | -------------------------------------------------------------------------------- 
/journal.markusthoma.com.txt: -------------------------------------------------------------------------------- 1 | body: //div[@class='entry-content'] 2 | strip_id_or_class: bcac-item 3 | strip_id_or_class: crp_related 4 | strip_id_or_class: optin-after-content 5 | strip: //h2 6 | 7 | test_url: https://journal.markusthoma.com/gegenlicht-fotografie/ 8 | 9 | -------------------------------------------------------------------------------- /juliareda.eu.txt: -------------------------------------------------------------------------------- 1 | body: //article 2 | 3 | strip: //aside[contains(@class, "mashsb-container")] 4 | 5 | test_url: https://juliareda.eu/2019/02/eu-copyright-final-text/ 6 | -------------------------------------------------------------------------------- /jungle-world.com.txt: -------------------------------------------------------------------------------- 1 | title: //h1 2 | body: //div[contains(@class,'story')] 3 | test_url: http://jungle-world.com/artikel/2015/02/51207.html 4 | -------------------------------------------------------------------------------- /jvt.me.txt: -------------------------------------------------------------------------------- 1 | author: //div[@class="post-details"]//a[contains(@class, "p-name")] 2 | 3 | test_url: https://www.jvt.me/posts/2019/10/20/indieweb-talk/ 4 | -------------------------------------------------------------------------------- /kachestvo.ru.txt: -------------------------------------------------------------------------------- 1 | body: //div[contains(@class, 'inner_content')] 2 | 3 | test_url: http://kachestvo.ru/promtovar/odezhda/denim.html -------------------------------------------------------------------------------- /kathimerini.gr.txt: -------------------------------------------------------------------------------- 1 | title: //td[contains(@class, 'articleTitlos')] 2 | body: //td[contains(@class, 'eelantext')] 3 | 4 | test_url: 
http://www.kathimerini.gr/4dcgi/_w_articles_kathremote_1_03/12/2013_530490 -------------------------------------------------------------------------------- /keyboardmag.com.txt: -------------------------------------------------------------------------------- 1 | body: //div[@class='article-inner'] 2 | strip_id_or_class: date 3 | author: //div[@class='author'] 4 | test_url: http://www.keyboardmag.com/gear/1183/review-dave-smith-instruments-ob-6/58802 5 | -------------------------------------------------------------------------------- /keycloak.org.txt: -------------------------------------------------------------------------------- 1 | body: //div[@id='content'] 2 | 3 | strip_id_or_class: preamble 4 | strip_id_or_class: sidebarblock 5 | 6 | test_url: https://www.keycloak.org/docs/12.0/authorization_services/ 7 | -------------------------------------------------------------------------------- /kickstarter.com.txt: -------------------------------------------------------------------------------- 1 | title: //h1[@id='name'] 2 | body: //*[@id='leftcol'] 3 | 4 | strip_id_or_class: 'share-box' 5 | strip_id_or_class: 'project-faqs' 6 | strip_id_or_class: 'report-issue-wrap' 7 | test_url: http://www.kickstarter.com/projects/hop/elevation-dock-the-best-dock-for-iphone -------------------------------------------------------------------------------- /kingarthurflour.com.txt: -------------------------------------------------------------------------------- 1 | title: //div[@class='post']/h2 2 | body: //div[@class='entry'] 3 | strip: //p[contains(.,'Tags:')] 4 | test_url: http://www.kingarthurflour.com/blog/2011/01/28/a-big-sandwich-for-the-big-game/ -------------------------------------------------------------------------------- /kont.me.txt: -------------------------------------------------------------------------------- 1 | http_header(User-agent): twitterbot 2 | 3 | test_url: https://kont.me/%C3%A9loge-d%C3%A9croissance-individuelle 4 | 
-------------------------------------------------------------------------------- /kotaku.com.txt: -------------------------------------------------------------------------------- 1 | title: //head/title 2 | author: //meta[@name="author"]/@content 3 | body: //div[contains(@class, 'js_post-content')] 4 | strip: //div[contains(@class, 'content-summary')] 5 | 6 | test_url: https://kotaku.com/tumblr-porn-ban-leaves-artists-and-fans-seeking-new-pla-1831056412 7 | -------------------------------------------------------------------------------- /kottke.org.txt: -------------------------------------------------------------------------------- 1 | title: //h2 2 | author: //*[@id='main']/div/a[1] 3 | date: substring-before(substring-after(//div[@class='meta'],'•'),'•') 4 | body: //div[@id='main'] 5 | strip: //div[@class='meta'] 6 | test_url: http://kottke.org/08/02/king-of-kong-a-fistful-of-quarters -------------------------------------------------------------------------------- /kresus.org.txt: -------------------------------------------------------------------------------- 1 | title: //h2[@class="entry-title"] 2 | date: //time[@class="published"]/@datetime 3 | 4 | test_url: https://kresus.org/blog/kresus-version-0-14-0.html 5 | -------------------------------------------------------------------------------- /krone.at.txt: -------------------------------------------------------------------------------- 1 | body: //div[contains(concat(' ',normalize-space(@class),' '),' kmm-article-box ')] 2 | 3 | test_url: https://www.krone.at/1941895 4 | -------------------------------------------------------------------------------- /kumailplus.com.txt: -------------------------------------------------------------------------------- 1 | body: //div[@class = "entry-full"] 2 | 3 | test_url: http://www.kumailplus.com/2011/12/02/24308 -------------------------------------------------------------------------------- /labs.bishopfox.com.txt: 
-------------------------------------------------------------------------------- 1 | title: //h1[contains(concat(' ',normalize-space(@class),' '),' blog-post__title ')] 2 | body: //div[contains(concat(' ',normalize-space(@class),' '),' blog-post__body ')] 3 | test_url: https://labs.bishopfox.com/tech-blog/bad-pods-kubernetes-pod-privilege-escalation 4 | -------------------------------------------------------------------------------- /labs.mwrinfosecurity.com.txt: -------------------------------------------------------------------------------- 1 | # Title is not detected automatically 2 | title: //section[contains(@class, 'section-intro')]//h1 3 | 4 | test_url: https://labs.mwrinfosecurity.com/blog/hp-nonstop-basics/ 5 | -------------------------------------------------------------------------------- /labs.ripe.net.txt: -------------------------------------------------------------------------------- 1 | body: //article[@class="prose"] 2 | 3 | test_url: https://labs.ripe.net/author/kathleen_moriarty/the-llm-misinformation-problem-i-was-not-expecting/ 4 | test_contains: The problems around vetting AI results won't be going away anytime soon. 
5 | -------------------------------------------------------------------------------- /lado.mx.txt: -------------------------------------------------------------------------------- 1 | single_page_link: //a[starts-with(@href, 'http') and contains(., 'Leer noticia completa')] 2 | 3 | test_url: https://lado.mx/noticia.php?id=15249243 4 | -------------------------------------------------------------------------------- /laughingsquid.com.txt: -------------------------------------------------------------------------------- 1 | title: //h1[@class='entry-title'] 2 | body: //div[@class='entry-content'] 3 | test_url: http://laughingsquid.com/mysterious-tiny-doors-appearing-around-san-francisco/ -------------------------------------------------------------------------------- /lawfareblog.com.txt: -------------------------------------------------------------------------------- 1 | body: //div[contains(@class, 'node-body')]//div[@class='field-items'] 2 | title: //div[@class='title'] 3 | 4 | test_url: https://lawfareblog.com/limits-panopticon 5 | -------------------------------------------------------------------------------- /leb.fbi.gov.txt: -------------------------------------------------------------------------------- 1 | body: //section[@id="main-content"] 2 | body: //div[@id="main-content-container"] 3 | 4 | prune: no 5 | 6 | test_url: https://leb.fbi.gov/articles/featured-articles/current-state-of-interview-and-interrogation 7 | -------------------------------------------------------------------------------- /lefilrouge.media.txt: -------------------------------------------------------------------------------- 1 | 2 | strip_id_or_class: the_champ_sharing_container 3 | 4 | test_url: https://lefilrouge.media/etats-unis-nevada-burning-man-festival/ 5 | -------------------------------------------------------------------------------- /lehollandaisvolant.net.txt: -------------------------------------------------------------------------------- 1 | title: 
//h1[@class="blog-post-title"] 2 | date: //time[contains(@itemprop, "datePublished")]/@datetime 3 | 4 | test_url: https://lehollandaisvolant.net/?d=2019/12/07/11/41/38-non-respirer-nemet-pas-plus-de-co2-dans-latmosphere 5 | -------------------------------------------------------------------------------- /lesecolohumanistes.fr.txt: -------------------------------------------------------------------------------- 1 | body: //div[contains(concat(' ',normalize-space(@class),' '),' single ')]/*[not(self::figure)] 2 | 3 | test_url: https://lesecolohumanistes.fr/interdependance/ 4 | -------------------------------------------------------------------------------- /lesswrong.com.txt: -------------------------------------------------------------------------------- 1 | body: //div[contains(concat(' ',normalize-space(@class),' '),' PostsPage-postContent ')] 2 | title: //h1[contains(@class, "PostsPageTitle-root")] 3 | 4 | prune: no 5 | 6 | test_url: https://www.lesswrong.com/posts/FfrWGCEhZJbkeFgww/the-power-to-demolish-bad-arguments 7 | -------------------------------------------------------------------------------- /letraslibres.com.txt: -------------------------------------------------------------------------------- 1 | single_page_link: concat(//link[@rel="canonical"]/@href, "?page=full") 2 | 3 | test_url: http://www.letraslibres.com/revista/dossier/quien-manda-en-europa 4 | -------------------------------------------------------------------------------- /lezephyrmag.com.txt: -------------------------------------------------------------------------------- 1 | 2 | body: //div[contains(concat(' ',normalize-space(@class),' '),' entry-content ')] 3 | 4 | strip_id_or_class: swp_social_panel 5 | 6 | test_url: https://lezephyrmag.com/libre/paroles/jean-roch-waro-voyager-avec-la-musique-est-un-acte-poetique/ 7 | -------------------------------------------------------------------------------- /libcom.org.txt: -------------------------------------------------------------------------------- 1 
| date: //span[contains(@class, 'page-date')] 2 | body: //div[@id='node-page'] 3 | strip_id_or_class: book-navigation 4 | prune: no 5 | 6 | test_url: http://libcom.org/library/what-was-the-ussr-aufheben-1 7 | test_url: http://libcom.org/library-latest/feed -------------------------------------------------------------------------------- /lifehack.org.txt: -------------------------------------------------------------------------------- 1 | # Two articles appear, so we always want to pick the first. 2 | body: (//div[contains(@class, 'article-content')])[1] 3 | 4 | test_url: https://www.lifehack.org/566117/how-meditate-for-beginners 5 | -------------------------------------------------------------------------------- /linux.com.txt: -------------------------------------------------------------------------------- 1 | body: //div[contains(concat(' ',normalize-space(@class),' '),' article-content ')] 2 | 3 | author: //div[contains(concat(' ',normalize-space(@class),' '),' td-post-author-name ')]/a 4 | 5 | test_url: https://www.linux.com/tutorials/lf-networking-releases-onap-dublin/ 6 | -------------------------------------------------------------------------------- /linuxjournal.com.txt: -------------------------------------------------------------------------------- 1 | body: //div[@class='content-area'] 2 | next_page_link: //a[@title='Go to next page'] 3 | author: //a[@title='View user profile.'] 4 | strip_id_or_class: comments 5 | 6 | test_url: http://www.linuxjournal.com/content/be-mechanicwith-android-and-linux 7 | -------------------------------------------------------------------------------- /linuxnix.com.txt: -------------------------------------------------------------------------------- 1 | body: //div[contains(concat(' ',normalize-space(@class),' '),' entry-content ')] 2 | strip_id_or_class: ts-fab-wrapper 3 | 4 | test_url: https://www.linuxnix.com/how-to-rotate-logs-manually-in-linux/ 5 | 
-------------------------------------------------------------------------------- /literaryreview.co.uk.txt: -------------------------------------------------------------------------------- 1 | date: //meta[@itemprop="datePublished"]/@content 2 | title: //meta[@property="og:title"]/@content 3 | author: (//h1[@itemprop="author"])[1] 4 | 5 | test_url: https://literaryreview.co.uk/the-woolworths-poltergeist 6 | -------------------------------------------------------------------------------- /longform.org.txt: -------------------------------------------------------------------------------- 1 | single_page_link: //div[@class="post"]/div[@class="title"]/a 2 | 3 | test_url: http://longform.org/2011/05/06/disconcerting-new-answers-in-models-suicide/ -------------------------------------------------------------------------------- /lostgarden.com.txt: -------------------------------------------------------------------------------- 1 | prune: no 2 | convert_double_br_tags: yes 3 | test_url: http://www.lostgarden.com/2012/04/loops-and-arcs.html -------------------------------------------------------------------------------- /lukew.com.txt: -------------------------------------------------------------------------------- 1 | title: //h1 2 | 3 | test_url: https://www.lukew.com/ff/entry.asp?1995 4 | -------------------------------------------------------------------------------- /luminous-landscape.com.txt: -------------------------------------------------------------------------------- 1 | title: //h2 2 | 3 | body: // div[@id='content'] 4 | 5 | strip: //div[@class='sidebar_wrapper'] 6 | test_url: http://www.luminous-landscape.com/tutorials/optimizing_exposure.shtml -------------------------------------------------------------------------------- /lupa.cz.txt: -------------------------------------------------------------------------------- 1 | strip_id_or_class: promo-in-article 2 | strip_id_or_class: element-print-hidden 3 | 4 | test_url: 
http://www.lupa.cz/clanky/michal-zamec-parfums-za-dva-roky-presahneme-obrat-6-miliard-korun/ 5 | -------------------------------------------------------------------------------- /luxuo.com.txt: -------------------------------------------------------------------------------- 1 | body: //div[@class='post-content'] 2 | prune: no 3 | 4 | test_url: http://www.luxuo.com/watches/feed -------------------------------------------------------------------------------- /lvsl.fr.txt: -------------------------------------------------------------------------------- 1 | title: //h1[contains(@class,'entry-title')] 2 | body: //div[contains(@class,'body-content')] 3 | test_url: http://lvsl.fr/peuple-manifestant-saez-a-t-pondu-hexagone 4 | -------------------------------------------------------------------------------- /lwlies.com.txt: -------------------------------------------------------------------------------- 1 | body: //div[contains(concat(' ',normalize-space(@class),' '),' singleColRight ')] 2 | 3 | test_url: https://lwlies.com/articles/rope-alfred-hitchcock-masterpiece/ 4 | -------------------------------------------------------------------------------- /m.theregister.co.uk.txt: -------------------------------------------------------------------------------- 1 | strip: //div[@class='wptl btm'] 2 | body: //div[@id='article']//h2 | //div[@id='body'] 3 | 4 | test_url: http://m.theregister.co.uk/2015/07/06/geeks_guide_spaceguard_center/ 5 | -------------------------------------------------------------------------------- /m.xkcd.com.txt: -------------------------------------------------------------------------------- 1 | body: //body 2 | prune: no 3 | strip_id_or_class: navButtons 4 | strip_id_or_class: news 5 | strip_id_or_class: footerLinks 6 | strip_id_or_class: altTextLink 7 | test_url: https://m.xkcd.com/2057/ 8 | -------------------------------------------------------------------------------- /macdrifter.com.txt: 
-------------------------------------------------------------------------------- 1 | title: substring-before(//title,' « Macdrifter') 2 | test_url: http://www.macdrifter.com/2012/03/instacast-on-my-mac/ -------------------------------------------------------------------------------- /macg.co.txt: -------------------------------------------------------------------------------- 1 | body: //div[contains(concat(' ',normalize-space(@class),' '),' print:shadow-none ')]//article 2 | strip: //footer 3 | strip_id_or_class: comments 4 | 5 | test_url: https://www.macg.co/ailleurs/2024/10/microsoft-donne-des-yeux-et-une-voix-lia-de-copilot-146279 6 | -------------------------------------------------------------------------------- /mactechnews.de.txt: -------------------------------------------------------------------------------- 1 | title: substring-after(substring-after(//title, '>'), '>') 2 | body: //div[@class='NewsArticleContent'] 3 | test_url: http://www.mactechnews.de/news/index/Apple-Pressekonferenz-zum-iPhone-4-147316.html -------------------------------------------------------------------------------- /maitre-eolas.fr.txt: -------------------------------------------------------------------------------- 1 | body: //div[@class="post-content"] 2 | author: //meta[@name="author"]/@content 3 | date: //meta[@name="date"]/@content 4 | 5 | test_url: http://www.maitre-eolas.fr/post/2018/05/13/Pour-en-finir-avec-les-fiches-S 6 | -------------------------------------------------------------------------------- /make.wordpress.org.txt: -------------------------------------------------------------------------------- 1 | strip_id_or_class: glossary-item-hidden-content 2 | 3 | test_url: https://make.wordpress.org/core/2020/12/21/bug-scrub-schedule-for-5-7/ 4 | -------------------------------------------------------------------------------- /manga-news.com.txt: -------------------------------------------------------------------------------- 1 | title: //h2[@class='actu-title'] 2 | 3 | 
body: //div[@class='actu-content'] 4 | 5 | prune: no 6 | 7 | test_url: http://www.manga-news.com/index.php/actus/2016/02/02/Deux-retours-dans-le-planning-des-editions-Pika 8 | -------------------------------------------------------------------------------- /marco.org.txt: -------------------------------------------------------------------------------- 1 | tidy: no 2 | prune: no 3 | date: //article//time[@pubdate] 4 | title: //article/header/h2 5 | body: //article 6 | strip: //header 7 | test_url: http://www.marco.org/2012/09/08/businessweek-gruber 8 | test_url: http://www.marco.org/2012/04/24/might-upgrade-someday -------------------------------------------------------------------------------- /marcvidal.net.txt: -------------------------------------------------------------------------------- 1 | title: //div[contains(@class, 'post-title')] 2 | body: //article/div 3 | 4 | skip_json_ld: yes 5 | 6 | test_url: https://www.marcvidal.net/blog/2019/1/8/google-ya-es-un-banco-europeo-y-ahora-que 7 | -------------------------------------------------------------------------------- /marigold.cz.txt: -------------------------------------------------------------------------------- 1 | http_header(accept): */* 2 | 3 | test_url: https://www.marigold.cz/item/projektovy-manazer-je-v-cesku-sproste-slovo-ke-skode-projektu 4 | -------------------------------------------------------------------------------- /maritimedanmark.dk.txt: -------------------------------------------------------------------------------- 1 | body: //main[contains(concat(' ',normalize-space(@class),' '),' relative ')] 2 | 3 | strip: //div[contains(@class, 'js-banner-promoted')] 4 | 5 | test_url: https://www.maritimedanmark.dk/nkts-nye-kabelskib-kan-operere-pa-metanol 6 | -------------------------------------------------------------------------------- /marketresearchdirect.com.txt: -------------------------------------------------------------------------------- 1 | body: //div[@id="product_tabs-0"] 2 | 3 | 
test_url: https://www.marketresearchdirect.com/consumer-goods/smart-lighting-market-in-india-2018-2023-market-report 4 | -------------------------------------------------------------------------------- /marksdailyapple.com.txt: -------------------------------------------------------------------------------- 1 | strip_id_or_class: wwsgd 2 | test_url: http://www.marksdailyapple.com/are-detoxes-and-cleanses-safe-and-effective/ -------------------------------------------------------------------------------- /marmiton.org.txt: -------------------------------------------------------------------------------- 1 | title: //h1[@class="main-title"] 2 | author: //span[@class="recipe-author__name"] 3 | body: //div[@id="sticky-desktop-only"] 4 | strip: //div[@id="bloc-video"] 5 | 6 | test_url: http://www.marmiton.org/recettes/recette_gateau-au-chocolat-fondant-rapide_166352.aspx 7 | -------------------------------------------------------------------------------- /marriedtothesea.com.txt: -------------------------------------------------------------------------------- 1 | body: //img[contains(@src, '.gif')] 2 | 3 | test_url: http://www.marriedtothesea.com 4 | test_url: http://www.marriedtothesea.com/index.php?date=010818 5 | -------------------------------------------------------------------------------- /matt.might.net.txt: -------------------------------------------------------------------------------- 1 | title: //h1 2 | author: string("Matt Might") 3 | strip: //h1/following-sibling::div 4 | 5 | test_url: http://matt.might.net/articles/oo-cesk/ -------------------------------------------------------------------------------- /mattcutts.com.txt: -------------------------------------------------------------------------------- 1 | date: //*[@class = 'published'] 2 | test_url: http://www.mattcutts.com/blog/internet-censorship-sopa/ -------------------------------------------------------------------------------- /maxim.com.txt: 
-------------------------------------------------------------------------------- 1 | body: //div[contains(@class, 'field-name-body') or contains(@class, 'featured-image')] 2 | 3 | test_url: http://www.maxim.com/rss-feeds.xml 4 | test_url: http://www.maxim.com/entertainment/article/second-city-chicago-goes-flames -------------------------------------------------------------------------------- /mbk-news.appspot.com.txt: -------------------------------------------------------------------------------- 1 | body: //div[contains(@class, 'evo-entry-content')] 2 | 3 | prune: no 4 | 5 | test_url: https://mbk-news.appspot.com/suzhet/ee-imya-budet/ 6 | -------------------------------------------------------------------------------- /mbl.is.txt: -------------------------------------------------------------------------------- 1 | body: //div[@class="frett-main"] 2 | test_url: http://mbl.is/frettir/innlent/2012/02/21/litill_munur_a_fargjaldaverdi/ -------------------------------------------------------------------------------- /mcorbin.fr.txt: -------------------------------------------------------------------------------- 1 | title: //div[contains(concat(' ',normalize-space(@class),' '),' post-header ')]//h2 2 | body: //div[@id="post"]/div[2] 3 | test_url: https://www.mcorbin.fr/posts/2023-07-04-metriques/ -------------------------------------------------------------------------------- /mebedo.de.txt: -------------------------------------------------------------------------------- 1 | body: //div[contains(concat(' ',normalize-space(@class),' '),' av_two_third ')] 2 | 3 | test_url: https://www.mebedo.de/themen/faq-zur-verantwortlichen-elektrofachkraft-vefk/ 4 | -------------------------------------------------------------------------------- /medialens.org.txt: -------------------------------------------------------------------------------- 1 | author: //meta[@property="og:site_name"]/@content 2 | prune: no 3 | test_url: https://www.medialens.org/2012/the-illusion-of-democracy/ 4 | 
test_contains: In an era of permanent war, economic meltdown 5 | -------------------------------------------------------------------------------- /mein-mmo.de.txt: -------------------------------------------------------------------------------- 1 | body: //div[@class='gp-entry-text'] 2 | strip: //aside 3 | 4 | test_url: http://mein-mmo.de/pokemon-go-15-staerksten-pokemon-der-2-generation/ 5 | -------------------------------------------------------------------------------- /mentalfloss.com.txt: -------------------------------------------------------------------------------- 1 | body: //div[contains(@class, 'article-content')][1] 2 | author: //div[contains(@class, 'author')][1] 3 | 4 | strip_id_or_class: date-text 5 | strip_id_or_class: after-article-subscribe-nl 6 | strip_id_or_class: eyebrow-text 7 | strip_id_or_class: eyebrow-tail 8 | -------------------------------------------------------------------------------- /meowni.ca.txt: -------------------------------------------------------------------------------- 1 | author: //meta[@name="author"]/@content 2 | 3 | test_url: https://meowni.ca/posts/2017-puppeteer-tests/ 4 | -------------------------------------------------------------------------------- /mesec.cz.txt: -------------------------------------------------------------------------------- 1 | body: //div[@class='urs'] | //div[@itemprop='articleBody'] 2 | strip_id_or_class: promo-in-article 3 | 4 | test_url: http://www.mesec.cz/aktuality/ceske-drahy-pridaji-zamestnancum-jejich-mzdy-vzrostou-o-1-7/ 5 | -------------------------------------------------------------------------------- /mforum.cari.com.my.txt: -------------------------------------------------------------------------------- 1 | body: (//td[starts-with(@id, 'postmessage_')])[1] 2 | 3 | prune: no 4 | 5 | test_url: http://mforum.cari.com.my/forum.php?mod=viewthread&tid=788033 6 | test_url: http://mforum.cari.com.my/forum.php?mod=rss&fid=265&auth=0 
-------------------------------------------------------------------------------- /microsiervos.com.txt: -------------------------------------------------------------------------------- 1 | title: //h1 2 | body: //article 3 | 4 | strip: //div[@class='compartir-post'] 5 | 6 | test_url: https://www.microsiervos.com/archivo/espacio/pequeno-vistazo-interior-edificio-ensamblado-vehiculos-chino.html 7 | -------------------------------------------------------------------------------- /mikeash.com.txt: -------------------------------------------------------------------------------- 1 | title: //div[@class="blogtitle"] 2 | strip: //div[@class="blogtitle"] 3 | 4 | author: substring-after(//span[@class="blogheader"], 'Author: ') 5 | test_url: http://www.mikeash.com/pyblog/friday-qa-2012-01-13-the-mac-toolbox.html -------------------------------------------------------------------------------- /mintpressnews.com.txt: -------------------------------------------------------------------------------- 1 | body: //div[contains(concat(' ',normalize-space(@class),' '),' entry-content ')] 2 | 3 | test_url: https://www.mintpressnews.com/mega-group-maxwells-mossad-spy-story-jeffrey-epstein-scandal/261172/ 4 | test_contains: One of those businessmen 5 | -------------------------------------------------------------------------------- /miops.com.txt: -------------------------------------------------------------------------------- 1 | strip: //div[@id="relatedblogs"] 2 | strip: //div[@class="product-card"] 3 | 4 | test_url: https://www.miops.com/blogs/news/master-tips-to-take-lightning-photos 5 | -------------------------------------------------------------------------------- /mirrorfootball.co.uk.txt: -------------------------------------------------------------------------------- 1 | # Remove extra links 2 | strip: //*[@class='appended_html'] 3 | test_url: 
http://www.mirrorfootball.co.uk/news/West-Ham-crisis-Carlton-Cole-slams-diabolical-performance-and-rips-into-Avram-Grant-lack-of-tactical-nous-following-Liverpool-mauling-article636151.html -------------------------------------------------------------------------------- /mises.org.txt: -------------------------------------------------------------------------------- 1 | strip_id_or_class: 'book-ad' 2 | strip_id_or_class: 'bigger pullquote' 3 | strip_id_or_class: 'subscribe' 4 | strip_id_or_class: 'blog-link' 5 | test_url: http://mises.org/daily/4804 -------------------------------------------------------------------------------- /missnumerique.com.txt: -------------------------------------------------------------------------------- 1 | strip: //figure/noscript 2 | 3 | test_url: https://www.missnumerique.com/blog/la-proxiphotographie-la-solution-nature-pour-exprimer-son-sens-artistique/ 4 | -------------------------------------------------------------------------------- /mlssoccer.com.txt: -------------------------------------------------------------------------------- 1 | title: //*[@class="header_title"]/h1 2 | date: //*[@class="field-date"] 3 | author: //*[@class="field-author"] 4 | body: //div[contains(@class, 'content')] 5 | 6 | test_url: http://www.mlssoccer.com/news/article/2012/06/19/lack-depth-front-forces-arena-alter-las-formation -------------------------------------------------------------------------------- /mobilenet.cz.txt: -------------------------------------------------------------------------------- 1 | strip_id_or_class: inarticle--tip 2 | 3 | next_page_link: //a[@class='navChapters__next'] 4 | 5 | test_url: http://mobilenet.cz/clanky/recenze-apple-ipad-pro-tesne-pod-vrcholem-28955 6 | -------------------------------------------------------------------------------- /monkeyuser.com.txt: -------------------------------------------------------------------------------- 1 | body: //div[contains(concat(' ', normalize-space(@class), ' '), ' content ')] 2 
| 3 | test_url: https://www.monkeyuser.com/2019/v-201/ 4 | -------------------------------------------------------------------------------- /monkeyzen.com.txt: -------------------------------------------------------------------------------- 1 | body: //*[(@class = "historia")] 2 | test_url: http://monkeyzen.com/2011/09/siluetas-de-clasicos-a-modo-de-vinilos -------------------------------------------------------------------------------- /moo.nac.uci.edu.txt: -------------------------------------------------------------------------------- 1 | title: //div[@id='header']//h1[1] 2 | 3 | body: //div[@id='content'] 4 | 5 | strip_id_or_class: toc 6 | 7 | prune: no 8 | 9 | test_url: http://moo.nac.uci.edu/~hjm/HOWTO_move_data.html 10 | -------------------------------------------------------------------------------- /motorcyclistonline.com.txt: -------------------------------------------------------------------------------- 1 | http_header(cookie): bonnier_consent=true 2 | 3 | strip_id_or_class: arcAdsBox 4 | 5 | author: //div[contains(concat(' ',normalize-space(@class),' '),' by_author ')] 6 | -------------------------------------------------------------------------------- /motorfull.com.txt: -------------------------------------------------------------------------------- 1 | body: //*[(@class = "historia")] 2 | test_url: http://motorfull.com/2011/09/aparca-valeo-park4u-remote -------------------------------------------------------------------------------- /msdn.microsoft.com.txt: -------------------------------------------------------------------------------- 1 | body: //div[@id="mainBody"] 2 | prune: no 3 | test_url: http://msdn.microsoft.com/en-us/library/hh542796(VS.103).aspx 4 | test_url: https://msdn.microsoft.com/library/hh191443(vs.110).aspx 5 | test_contains: An async method typically contains 6 | -------------------------------------------------------------------------------- /muycomputerpro.com.txt: 
-------------------------------------------------------------------------------- 1 | title: //h1[@class='entry-title'] 2 | body: //div[@id='mvp-content-main'] 3 | 4 | strip: //div[@class='recomienda-wrap'] 5 | 6 | test_url: https://www.muycomputerpro.com/2017/09/20/fundacion-universidad-empresa-hyperloop-one 7 | -------------------------------------------------------------------------------- /mysqlblog.fivefarmers.com.txt: -------------------------------------------------------------------------------- 1 | http_header(User-Agent): Mozilla/5.0 (compatible; Googlebot/2.1; +http://www.google.com/bot.html) 2 | 3 | test_url: http://mysqlblog.fivefarmers.com/2012/08/16/understanding-mysql_config_editors-security-aspects/ 4 | 5 | -------------------------------------------------------------------------------- /mytotalretail.com.txt: -------------------------------------------------------------------------------- 1 | title: //h1 2 | body: //div[@itemprop="content"] 3 | 4 | test_url: https://www.mytotalretail.com/article/how-site-search-could-kill-amazon/ 5 | -------------------------------------------------------------------------------- /n-tv.de.txt: -------------------------------------------------------------------------------- 1 | date: //span[@class='article__date'] 2 | title: //title 3 | body: //div[@class='article__text'] 4 | 5 | test_url: https://www.n-tv.de/politik/Die-alten-Maenner-werden-es-nie-blicken-article21447318.html 6 | 7 | # Last update: 2019-12-12 8 | # Tested with: Wallabag 2.3.8 -------------------------------------------------------------------------------- /n.survol.fr.txt: -------------------------------------------------------------------------------- 1 | title: //h1 2 | date: //header//time/@datetime 3 | 4 | test_url: https://n.survol.fr/n/gerer-son-potager 5 | -------------------------------------------------------------------------------- /najlepsze-ksiazki.pl.txt: -------------------------------------------------------------------------------- 
1 | body: //article 2 | 3 | strip: //footer 4 | 5 | test_url: https://najlepsze-ksiazki.pl/najlepsze-ksiazki-science-fiction/ 6 | -------------------------------------------------------------------------------- /nakedsecurity.sophos.com.txt: -------------------------------------------------------------------------------- 1 | body: //div[@class='entry-content'] 2 | title: //div[@class='entry-title'] 3 | strip: //div[@class='entry-sharing'] 4 | 5 | test_url: https://nakedsecurity.sophos.com/2016/04/04/new-ransomware-with-an-old-trick-petya-parties-like-its-1989/ 6 | -------------------------------------------------------------------------------- /neunetz.com.txt: -------------------------------------------------------------------------------- 1 | body: //div[contains(@class, 'entry-content')] 2 | prune: no 3 | 4 | strip_id_or_class: sharedaddy 5 | 6 | test_url: https://neunetz.com/2019/09/13/apple-tv-quasi-geschenkt/ 7 | test_contains: Apple muss hier noch aufholen 8 | -------------------------------------------------------------------------------- /newcriterion.com.txt: -------------------------------------------------------------------------------- 1 | body: //div[contains(concat(' ',normalize-space(@class),' '),' article-text-column ')] 2 | title: //meta[@property="og:title"]/@content 3 | 4 | prune: no 5 | 6 | test_url: https://newcriterion.com/issues/2020/12/acheiropoieta 7 | -------------------------------------------------------------------------------- /news.rambler.ru.txt: -------------------------------------------------------------------------------- 1 | body: //article 2 | title: //h1 3 | author: //span[@class='b-article-source-dropdown'] 4 | strip: //span[@class='b-article-photo-incut__source'] 5 | strip: //a[@class='b-read-more b-read-more_bottom'] 6 | 7 | 8 | tidy:no 9 | test_url: http://news.rambler.ru/12972208/ -------------------------------------------------------------------------------- /news.rub.de.txt: 
-------------------------------------------------------------------------------- 1 | body: //div[contains(concat(' ',normalize-space(@class),' '),' content-inner-inner-wrapper ')] 2 | 3 | http_header(Cookie): has_js=1 4 | -------------------------------------------------------------------------------- /news.techmeme.com.txt: -------------------------------------------------------------------------------- 1 | body: //div[@class='main']/div[@class='item'] 2 | strip: //div[@class='right'] 3 | 4 | test_url: http://news.techmeme.com/110516/fh-rip -------------------------------------------------------------------------------- /nextcloud.com.txt: -------------------------------------------------------------------------------- 1 | title: //div[@class="blog-title-and-subtitle"]//h1 2 | date: //time/@datetime 3 | 4 | test_url: https://nextcloud.com/blog/celebrating-2-years-nextcloud/ 5 | -------------------------------------------------------------------------------- /nextdraft.com.txt: -------------------------------------------------------------------------------- 1 | body: //section[contains(concat(' ',normalize-space(@class),' '),' page-content-wrap ')] 2 | strip_id_or_class: social-sharing-wrap 3 | strip_id_or_class: current-edition-title-date 4 | 5 | test_url: https://nextdraft.com/archives/n20221208/ 6 | 7 | -------------------------------------------------------------------------------- /nf-farn.de.txt: -------------------------------------------------------------------------------- 1 | body: //article[contains(concat(" ",normalize-space(@class)," ")," view-mode-full ")] 2 | 3 | prune: no 4 | 5 | test_url: https://www.nf-farn.de/maer-ueberbevoelkerung 6 | -------------------------------------------------------------------------------- /nicj.net.txt: -------------------------------------------------------------------------------- 1 | strip: //h1 2 | strip: //div[@class="info"] 3 | strip: //div[@class="osd-sms-wrapper"] 4 | strip: //div[@id="sidebar"] 5 | strip: 
//div[@id="postnavi"] 6 | strip: //form[@id="commentform"] 7 | 8 | test_url: https://nicj.net/cumulative-layout-shift-in-practice/ 9 | -------------------------------------------------------------------------------- /nifi.apache.org.txt: -------------------------------------------------------------------------------- 1 | body: //div[@id='content'] 2 | 3 | test_url: https://nifi.apache.org/docs/nifi-docs/html/getting-started.html 4 | -------------------------------------------------------------------------------- /nj.com.txt: -------------------------------------------------------------------------------- 1 | body: //div[@id='article_container'] 2 | strip_id_or_class: social 3 | 4 | test_url: http://www.nj.com/eagles/index.ssf/2018/04/should_eagles_trade_brandon_graham_observations.html#incart_river_index 5 | -------------------------------------------------------------------------------- /nojesguiden.se.txt: -------------------------------------------------------------------------------- 1 | author: //span[@class='meta']/span[@class='username'] 2 | body: //div[@class='article-content'] 3 | 4 | strip_id_or_class: 'article-actions' 5 | test_url: http://nojesguiden.se/blogg/maja-bredberg/maja-laser-tidningen-en-helt-vanlig-lordag-i -------------------------------------------------------------------------------- /nosalty.hu.txt: -------------------------------------------------------------------------------- 1 | title: //div[@id='tab-recept']//h1 2 | body: //div[@id='tab-recept']//div[contains(@class, 'column-container')] 3 | strip_id_or_class: ajanlo-box 4 | prune: no 5 | 6 | test_url: http://www.nosalty.hu/recept/szupergyors-fank -------------------------------------------------------------------------------- /novinky.cz.txt: -------------------------------------------------------------------------------- 1 | body: //div[contains(@class, 'tpl-king-top-content')] 2 | 3 | prune: no 4 | strip_id_or_class: ogm-advert 5 | 6 | test_url: 
https://www.novinky.cz/koronavirus/clanek/zlom-v-boji-s-koronavirem-svycari-chteji-ockovat-uz-na-podzim-40321864 7 | -------------------------------------------------------------------------------- /nplusonemag.com.txt: -------------------------------------------------------------------------------- 1 | body: //div[contains(concat(' ',normalize-space(@class),' '),' post-body ')] 2 | 3 | prune: no 4 | 5 | test_url: https://www.nplusonemag.com/online-only/online-only/the-outskirts-of-progress/ 6 | -------------------------------------------------------------------------------- /omiliya.org.txt: -------------------------------------------------------------------------------- 1 | title: //div[@id='squeeze']/h1 2 | strip: //div[@id='squeeze']/h1 3 | author: //div[@class='submitted']/a 4 | strip: //div[@class='submitted']/a 5 | convert_double_br_tags: yes 6 | 7 | 8 | 9 | test_url: http://omiliya.org/content/predchuvstvie.html -------------------------------------------------------------------------------- /onlinewelten.com.txt: -------------------------------------------------------------------------------- 1 | body: //div[@id='news_detail']//div[@class='contents clearfix'] 2 | test_url: http://www.onlinewelten.com/games/aliens-colonial-marines/news/offizielle-spiel-ankuendigung-nintendos-wii-u-103690/ -------------------------------------------------------------------------------- /openai.com.txt: -------------------------------------------------------------------------------- 1 | body: //main 2 | strip: //nav 3 | strip: //*[@aria-hidden="true"] 4 | 5 | # strip additional header-line in text 6 | strip: //main/text() 7 | 8 | prune: no 9 | 10 | test_url: https://openai.com/index/learning-to-reason-with-llms/ 11 | -------------------------------------------------------------------------------- /opensource.org.txt: -------------------------------------------------------------------------------- 1 | body: //div[@class='content clear-block'] 2 | test_url: 
http://opensource.org/node/537 -------------------------------------------------------------------------------- /openstreetmap.org.txt: -------------------------------------------------------------------------------- 1 | body: //div[@id='content'] 2 | strip: //div[@class='standard-form'] 3 | test_url: https://www.openstreetmap.org/user/woodpeck/diary/393947 4 | -------------------------------------------------------------------------------- /openthemagazine.com.txt: -------------------------------------------------------------------------------- 1 | body: //div[@id = 'content-inner'] 2 | strip: //div[@id = 'content-bottom'] 3 | strip_id_or_class: print_sharebutton 4 | test_url: http://openthemagazine.com/article/nation/sania-vs-saina -------------------------------------------------------------------------------- /optimizesmart.com.txt: -------------------------------------------------------------------------------- 1 | body: //div[@id="content"] 2 | 3 | prune: no 4 | 5 | test_url: https://www.optimizesmart.com/how-to-set-up-conversion-tracking-in-google-analytics-4/ 6 | -------------------------------------------------------------------------------- /oschina.net.txt: -------------------------------------------------------------------------------- 1 | title: //h1 2 | strip_id_or_class: syntaxhighlighter 3 | test_url: http://www.oschina.net/translate/event-based-programming-what-async-has-over-sync?print -------------------------------------------------------------------------------- /osmand.net.txt: -------------------------------------------------------------------------------- 1 | title: //div[@class="article"]//h2 2 | date: //meta/@pubdate 3 | 4 | test_url: https://osmand.net/blog/guideline-pt 5 | -------------------------------------------------------------------------------- /osmc.tv.txt: -------------------------------------------------------------------------------- 1 | title: //h1[@class="post-title"] 2 | date: //time[@class="post-date"]/@datetime 3 | 4 | 
test_url: https://osmc.tv/2019/11/osmcs-november-update-is-here-with-kodi-18-5/ 5 | -------------------------------------------------------------------------------- /palmbeachpost.com.txt: -------------------------------------------------------------------------------- 1 | body: //div[contains(concat(' ',normalize-space(@class),' '),' story-text ')] 2 | 3 | test_url: http://www.palmbeachpost.com/news/crime--law/new-pbso-releases-sketch-person-interest-shooting/IcToH2Mij0hAw3EIFnw5tL/ 4 | -------------------------------------------------------------------------------- /pandemicequityinitiative.com.txt: -------------------------------------------------------------------------------- 1 | body: //main 2 | 3 | strip: //svg 4 | 5 | test_url: https://www.pandemicequityinitiative.com/hold-misinformation-lies-betrayal 6 | test_contains: Here’s the truth: the pandemic is not over 7 | -------------------------------------------------------------------------------- /pandodaily.com.txt: -------------------------------------------------------------------------------- 1 | tidy: no 2 | body: //article 3 | date: //time/@datetime 4 | strip_id_or_class: sharedaddy 5 | test_url: http://pandodaily.com/2012/01/19/ibooks-author-is-not-going-to-hurt-publishers-it-might-even-help-them/ -------------------------------------------------------------------------------- /panic.com.txt: -------------------------------------------------------------------------------- 1 | body: //div[@class='entry'] 2 | date: //h3[@class='postDate'] 3 | test_url: http://www.panic.com/blog/2011/07/panic-is-ready-for-lion/ -------------------------------------------------------------------------------- /papodehomem.com.br.txt: -------------------------------------------------------------------------------- 1 | title: //h2[@class="page_title"] 2 | body: //div[@class="entry arquivo"] 3 | author: //span[@class="author"] 4 | footnotes: yes 5 | prune: yes 6 | test_url: 
http://papodehomem.com.br/um-relato-confessional-sobre-a-maioridade-penal/ -------------------------------------------------------------------------------- /paquier.xyz.txt: -------------------------------------------------------------------------------- 1 | body: //div[@class='post'] 2 | 3 | test_url: http://paquier.xyz/postgresql-2/postgres-10-incompatible-changes/ 4 | -------------------------------------------------------------------------------- /parislemon.com.txt: -------------------------------------------------------------------------------- 1 | title: //h2[@class="post-title"] 2 | author: substring-after(//div[@class="description"],'Words by ') 3 | date: //li[@class="date"] 4 | strip: //h2[@class="post-title"] 5 | body: //div[@class="copy"] 6 | test_url: http://parislemon.com/post/13462682469/the-15-inch-air -------------------------------------------------------------------------------- /parliament.uk.txt: -------------------------------------------------------------------------------- 1 | title: //h1 2 | body: //div[@id='news-article'] 3 | test_url: http://www.parliament.uk/business/committees/committees-a-z/commons-select/backbench-business-committee/news/guidance-for-e-petitioners/ -------------------------------------------------------------------------------- /pastebin.com.txt: -------------------------------------------------------------------------------- 1 | title://div[@class="paste_box_line1"]/h1 2 | author://div[@class="paste_box_line2"]/a 3 | body://div[@class="text"] 4 | date:substring-before(substring-after(//div[@class="paste_box_line2"],'|'),'|') 5 | dissolve://li 6 | test_url: http://pastebin.com/LAykd1es -------------------------------------------------------------------------------- /pastepad.fivefilters.org.txt: -------------------------------------------------------------------------------- 1 | title: //h1 2 | body: //div[@id='ff-pastepad-content'] 3 | prune: no 4 | # todo: add test file 5 | test_url: 
http://pastepad.fivefilters.org/test.html -------------------------------------------------------------------------------- /pentaxforums.com.txt: -------------------------------------------------------------------------------- 1 | next_page_link: //a[contains(., 'Next:')] 2 | test_url: http://www.pentaxforums.com/reviews/long-exposure-handhelds/introduction.html -------------------------------------------------------------------------------- /perell.com.txt: -------------------------------------------------------------------------------- 1 | body: //section[contains(@class, 'BlogItem-main')] 2 | 3 | test_url: https://www.perell.com/blog/50-ideas-that-changed-my-life 4 | -------------------------------------------------------------------------------- /philosophyforlife.org.txt: -------------------------------------------------------------------------------- 1 | body: //article 2 | replace_string(data-src=):src= 3 | 4 | test_url: https://www.philosophyforlife.org/blog/mind-palaces-the-art-of-psycho-technics-or-soul-craft 5 | -------------------------------------------------------------------------------- /philosophynow.org.txt: -------------------------------------------------------------------------------- 1 | strip_id_or_class: welcome_box 2 | 3 | test_url: https://philosophynow.org/issues/141/Time_and_Being 4 | -------------------------------------------------------------------------------- /philstar.com.txt: -------------------------------------------------------------------------------- 1 | body: //div[@property="content:encoded"] 2 | 3 | test_url: http://www.philstar.com/headlines/2017/03/06/1678561/samuel-martires-named-new-sc-justice 4 | test_url: http://www.philstar.com/rss/breakingnews 5 | -------------------------------------------------------------------------------- /photopills.com.txt: -------------------------------------------------------------------------------- 1 | title: //h2 2 | body: //article[contains(@class, 'post')] 3 | author: 
//p[@class="author"]//a 4 | 5 | strip: //p[@class="tags"] 6 | strip: //div[@class="freebie"] 7 | 8 | test_url: https://www.photopills.com/articles/depth-of-field-guide 9 | -------------------------------------------------------------------------------- /phototrend.fr.txt: -------------------------------------------------------------------------------- 1 | author: //div[contains(@class, "vcard")] 2 | 3 | test_url: https://phototrend.fr/2019/04/mise-a-jour-luminar-3-1-0-accent-ai-2-0/ 4 | -------------------------------------------------------------------------------- /php.net.txt: -------------------------------------------------------------------------------- 1 | body: //div[@id='content'] 2 | strip_id_or_class: manualnavbar 3 | 4 | prune: no 5 | 6 | test_url: http://www.php.net/manual/en/migration5.incompatible.php -------------------------------------------------------------------------------- /phys.org.txt: -------------------------------------------------------------------------------- 1 | http_header(User-Agent): Mastodon/4.3.2 (http.rb/5.2.0; +https://mastodon.social/) Bot 2 | 3 | test_url: https://phys.org/news/2025-03-dark-universe-telescope.html 4 | test_url: https://phys.org/rss-feed/breaking/space-news/ 5 | -------------------------------------------------------------------------------- /pinterest.com.txt: -------------------------------------------------------------------------------- 1 | title: //title 2 | body: //div[contains(@class, 'imageContainer')] 3 | 4 | test_url: http://pinterest.com/pin/380906080954441188/ 5 | test_url: http://pinterest.com/michaelsorm/architecture.rss 6 | -------------------------------------------------------------------------------- /pixellibre.net.txt: -------------------------------------------------------------------------------- 1 | title: //h1[@class="entry-title"] 2 | author: //a[@class='url fn n'] 3 | 4 | test_url: https://pixellibre.net/2017/10/vie-privee-smartphones-applications/ 5 | 
-------------------------------------------------------------------------------- /pjmedia.com.txt: -------------------------------------------------------------------------------- 1 | find_string:display:none 2 | replace_string: .. 3 | 4 | single_page_link: //div[@class='single-page-button']//a 5 | 6 | test_url: https://pjmedia.com/eddriscoll/2016/08/31/tom-wolfe-kingdom-of-speech/ 7 | -------------------------------------------------------------------------------- /plzkthxbai.com.txt: -------------------------------------------------------------------------------- 1 | title: //h2[@class='jcw-pagetitle'] 2 | date: //p[@class='postinfo'] 3 | body: //div[@class='contenttext'] 4 | test_url: http://plzkthxbai.com/blog/2011/06/28/1password-and-internet-security/ -------------------------------------------------------------------------------- /pmf.silvrback.com.txt: -------------------------------------------------------------------------------- 1 | body: //div[contains(concat(' ',normalize-space(@class),' '),' all_external_links ')] 2 | test_url: https://pmf.silvrback.com/fixing-tethering-on-android-kitkat -------------------------------------------------------------------------------- /pogue.blogs.nytimes.com.txt: -------------------------------------------------------------------------------- 1 | body: //div[@id="content"]/div[1] 2 | 3 | title: //h1[@class="entry-title"] 4 | test_url: http://pogue.blogs.nytimes.com/2011/05/12/the-future-of-skype/ -------------------------------------------------------------------------------- /politifact.com.txt: -------------------------------------------------------------------------------- 1 | body: //div[@id="content"] 2 | 3 | strip: //div[@class="pfcontentmid"]/div[position()>4]|//div[@class="pfad"] 4 | test_url: http://www.politifact.com/truth-o-meter/statements/2011/may/30/barbara-boxer/barbara-boxer-says-medicare-overhead-far-lower-pri/ --------------------------------------------------------------------------------
/popehat.com.txt: -------------------------------------------------------------------------------- 1 | title: //div[@class='entry-title'] 2 | author: //div[@class='entry-author'] 3 | date: //div[@class='entry-time'] 4 | body: //div[@class='entry-content'] 5 | 6 | test_url: https://popehat.com/2015/12/16/eric-posner-the-first-amendments-nemesis/ 7 | -------------------------------------------------------------------------------- /portertech.ca.txt: -------------------------------------------------------------------------------- 1 | author: //*[(@class = "author")] 2 | date: //*[(@class = "date")] 3 | test_url: http://portertech.ca/2012/12/10/iac-morning-market/ -------------------------------------------------------------------------------- /prolost.com.txt: -------------------------------------------------------------------------------- 1 | body: //div[@class='body'] 2 | title: //h2[@class='title'] 3 | date: //span[@class='posted-on'] 4 | test_url: http://prolost.com/blog/2011/10/13/real-men-comp-with-film.html -------------------------------------------------------------------------------- /propakistani.pk.txt: -------------------------------------------------------------------------------- 1 | body: //div[contains(concat(' ',normalize-space(@class),' '),' content-post ')] 2 | test_url: https://propakistani.pk/2017/06/23/eid-mubarak-happy-holidays-everyone/ 3 | test_contains: away from work for Eid Holidays 4 | -------------------------------------------------------------------------------- /proskauer.com.txt: -------------------------------------------------------------------------------- 1 | body: //div[contains(@class, 'article-content__copy')] 2 | strip: //section[@id='cookie'] 3 | 4 | insert_detected_image: no 5 | 6 | test_url: https://www.proskauer.com/pub/launching-a-hedge-fund-in-a-crisis 7 | -------------------------------------------------------------------------------- /protonmail.com.txt: 
-------------------------------------------------------------------------------- 1 | title: //h1[@class="entry-title"] 2 | author: //header[@class="entry-header"]//a[@class="url fn n"] 3 | 4 | strip: //div[@class="csbtns"] 5 | 6 | test_url: https://protonmail.com/blog/biometric-authentication/ 7 | -------------------------------------------------------------------------------- /publications.parliament.uk.txt: -------------------------------------------------------------------------------- 1 | author: //meta[@name="Author"] 2 | date: //meta[@name="Date"] 3 | strip: //h5 4 | test_url: http://www.publications.parliament.uk/pa/ld201011/ldhansrd/text/111109-0003.htm -------------------------------------------------------------------------------- /pxlnv.com.txt: -------------------------------------------------------------------------------- 1 | date: //main//time/@datetime 2 | 3 | test_url: https://pxlnv.com/blog/bullshit-web/ 4 | -------------------------------------------------------------------------------- /pymotw.com.txt: -------------------------------------------------------------------------------- 1 | body: //div[starts-with(@id, 'module-')] 2 | 3 | test_url: https://pymotw.com/3/configparser/ 4 | test_url: https://pymotw.com/3/shlex/ 5 | test_url: https://pymotw.com/3/sys/ 6 | -------------------------------------------------------------------------------- /python.org.txt: -------------------------------------------------------------------------------- 1 | body: //article[contains(concat(' ',normalize-space(@class),' '),' text ')] 2 | 3 | test_url: https://www.python.org/about/success/cog/ 4 | -------------------------------------------------------------------------------- /queerty.com.txt: -------------------------------------------------------------------------------- 1 | body: //div[@class='copy'] 2 | title: //h1[@class='hed'] 3 | test_url: http://www.queerty.com/rawhide-radicals-meet-five-heroes-from-the-leather-community-20120302/ 
-------------------------------------------------------------------------------- /rachelandrew.co.uk.txt: -------------------------------------------------------------------------------- 1 | date: //time/@datetime 2 | 3 | strip: //aside[@class="article-meta"] 4 | strip: //div[@class="keep-in-touch"] 5 | 6 | test_url: https://www.rachelandrew.co.uk/archives/2019/01/30/html-css-and-our-vanishing-industry-entry-points/ 7 | -------------------------------------------------------------------------------- /racjonalista.pl.txt: -------------------------------------------------------------------------------- 1 | author: /html/body/center/b 2 | date: /html/body/table/tr[2]/td/i 3 | single_page_link: //*[@id='oTxt']/table[3]/tr[2]/td/a[1] 4 | 5 | test_url: http://www.racjonalista.pl/kk.php/s,7214/q,Geneza.szubrawstwa -------------------------------------------------------------------------------- /radar.oreilly.com.txt: -------------------------------------------------------------------------------- 1 | date://span[@class='date'] 2 | body://div[@class='entry-body'] 3 | test_url: http://radar.oreilly.com/2012/01/genome-cloud-digital-humanities-hadoop-world-strata.html -------------------------------------------------------------------------------- /radionz.co.nz.txt: -------------------------------------------------------------------------------- 1 | body: //div[@class='body'] 2 | title: //div[@class='newsstory']/h2 3 | test_url: http://www.radionz.co.nz/news/stories/2010/07/18/12481029a86d -------------------------------------------------------------------------------- /radishzz.cc.txt: -------------------------------------------------------------------------------- 1 | body: //div[contains(concat(' ',normalize-space(@class),' '),' article-content ')] 2 | 3 | prune: no 4 | 5 | test_url: https://radishzz.cc/posts/384776b2/ 6 | -------------------------------------------------------------------------------- /rancher.com.txt: 
-------------------------------------------------------------------------------- 1 | body: //div[contains(concat(' ',normalize-space(@class),' '),' wrap ')] 2 | 3 | test_url: https://rancher.com/blog/2019/2019-03-21-comparing-kubernetes-cni-providers-flannel-calico-canal-and-weave/ 4 | -------------------------------------------------------------------------------- /rasgolatente.es.txt: -------------------------------------------------------------------------------- 1 | title: //div[@class='entry-title'] 2 | author: //div[@class='entry-author'] 3 | date: //div[@class='entry-time'] 4 | body: //div[@class='entry-content'] 5 | 6 | test_url: http://rasgolatente.es/estupidez-psicologia-estupidos/ 7 | -------------------------------------------------------------------------------- /reactjs.org.txt: -------------------------------------------------------------------------------- 1 | body: //article 2 | 3 | strip: //header 4 | strip: //aside 5 | 6 | prune: no 7 | 8 | test_url: https://reactjs.org/docs/uncontrolled-components.html 9 | -------------------------------------------------------------------------------- /real.gr.txt: -------------------------------------------------------------------------------- 1 | body: //div[contains(@class, 'article-photo-wrapper')] 2 | prune: no 3 | 4 | test_url: http://www.real.gr/DefaultArthro.aspx?page=arthro&id=360962&catID=1 5 | test_contains: Επισήμως το αποψινό υπουργικό 6 | -------------------------------------------------------------------------------- /redalemeden.com.txt: -------------------------------------------------------------------------------- 1 | author: //header//h1[@class="full-name"] 2 | date: //div[@class="post-metadata"]//time/@date 3 | 4 | test_url: https://redalemeden.com/blog/2019/we-need-chrome-no-more 5 | -------------------------------------------------------------------------------- /redmas.com.co.txt: -------------------------------------------------------------------------------- 1 | 
http_header(user-agent): Mozilla/5.0 (X11; Ubuntu; Linux x86_64; rv:122.0) Gecko/20100101 Firefox/122.0 2 | 3 | test_url: https://redmas.com.co/tecnologia/Clientes-prepago-pospago-y-hogar-de-Claro-tendran-acceso-sin-costo-a-100-GB-en-la-nube-20231004-0032.html 4 | -------------------------------------------------------------------------------- /redtimmy.com.txt: -------------------------------------------------------------------------------- 1 | title: //h4[@class='entry-title'] 2 | body: //div[@class='post-content'] 3 | 4 | test_url: https://www.redtimmy.com/docker/a-tale-of-escaping-a-hardened-docker-container/ 5 | -------------------------------------------------------------------------------- /renenekuda.cz.txt: -------------------------------------------------------------------------------- 1 | title: //*[@class='entry-title'] 2 | body: //div[@class='entry-content'] 3 | test_url: http://www.renenekuda.cz/recept-na-produktivitu/ -------------------------------------------------------------------------------- /renverse.co.txt: -------------------------------------------------------------------------------- 1 | body: //div[contains(@class, 'article-texte')] 2 | 3 | prune: no 4 | 5 | test_url: https://renverse.co/infos-locales/article/rejoignez-la-zad-du-geissberg-3486 6 | -------------------------------------------------------------------------------- /researchandmarkets.com.txt: -------------------------------------------------------------------------------- 1 | body: //div[contains(concat(' ',normalize-space(@class),' '),' order-description-container ')] 2 | 3 | prune: no 4 | 5 | test_url: https://www.researchandmarkets.com/reports/5264361/retail-point-of-sale-market-by-product-fixed 6 | -------------------------------------------------------------------------------- /resilience.org.txt: -------------------------------------------------------------------------------- 1 | # Article's main content 2 | body: //section[@class="post-content"] 3 | 4 | # A test URL, 
e.g. the article you used to write the file 5 | test_url: https://www.resilience.org/stories/2021-10-14/rural-resilience-all-in-good-time/ 6 | -------------------------------------------------------------------------------- /retractionwatch.com.txt: -------------------------------------------------------------------------------- 1 | title: //h1 2 | body: //div[contains(concat(' ',normalize-space(@class),' '),' entry-content ')] 3 | test_url: https://retractionwatch.com/2018/07/30/how-institutions-gaslight-whistleblowers-and-what-can-be-done/ 4 | -------------------------------------------------------------------------------- /retro-games.fr.txt: -------------------------------------------------------------------------------- 1 | single_page_link: //link[@rel='amphtml'] 2 | 3 | test_url: https://www.retro-games.fr/shadow-hearts-ps2-7476 4 | 5 | -------------------------------------------------------------------------------- /revdennismccarty.com.txt: -------------------------------------------------------------------------------- 1 | body: //div[contains(concat(' ',normalize-space(@class),' '),' entry-content ')] 2 | 3 | prune: no 4 | 5 | test_url: https://revdennismccarty.com/understanding-gadflies-as-ga-approaches/ 6 | -------------------------------------------------------------------------------- /rezeptwelt.de.txt: -------------------------------------------------------------------------------- 1 | body: //div[@class='step-content'] | //div[@class='global-active ingredients-box'] 2 | title: //div[@class='step-1-container'] 3 | 4 | tidy: no 5 | test_url: http://www.rezeptwelt.de/backen-herzhaft-rezepte/w%C3%BCrstchen-schlangen/530372 -------------------------------------------------------------------------------- /riffreporter.de.txt: -------------------------------------------------------------------------------- 1 | body: //article 2 | strip: //svg 3 | prune: no 4 | 5 | test_url: 
https://www.riffreporter.de/de/wissen/klimakrise-artensterben-biodiversitaet-droht-sechstes-massenaussterben 6 | -------------------------------------------------------------------------------- /rnd.de.txt: -------------------------------------------------------------------------------- 1 | body: //article/div[contains(concat(' ',normalize-space(@class),' '),' a__in ')] 2 | 3 | strip_id_or_class: a__rel-a-li 4 | strip_id_or_class: ord--0 5 | strip_id_or_class: a-hd__aut 6 | -------------------------------------------------------------------------------- /robertsspaceindustries.com.txt: -------------------------------------------------------------------------------- 1 | strip_id_or_class: 'sharedaddy' 2 | strip_id_or_class: 'respond' 3 | strip_id_or_class: 'meta' 4 | test_url: http://www.robertsspaceindustries.com/news-update-ai-pilots/ -------------------------------------------------------------------------------- /robots.thoughtbot.com.txt: -------------------------------------------------------------------------------- 1 | body: //section[@class='post text'] 2 | title: //h1[@class='title'] 3 | date: //p[@class='post-date'] 4 | strip: //section[@class='meta-info'] 5 | test_url: http://robots.thoughtbot.com/post/32455387133/four-phase-test -------------------------------------------------------------------------------- /rom-game.fr.txt: -------------------------------------------------------------------------------- 1 | author: //div[@id="main"]//a[contains(@href, "/auteurs/")] 2 | date: //meta[@itemprop="datePublished"]/@content 3 | 4 | test_url: https://www.rom-game.fr/news/3371-Goldeneye+007+devient+Goldeneye+25.html 5 | -------------------------------------------------------------------------------- /roomescapeartist.com.txt: -------------------------------------------------------------------------------- 1 | prune: no 2 | 3 | strip: //svg 4 | 5 | test_url: https://roomescapeartist.com/2020/05/18/locked-amsterdam-submarine-hivemind-review/ 6 | 
-------------------------------------------------------------------------------- /roughtype.com.txt: -------------------------------------------------------------------------------- 1 | body: //div[@class='content'] 2 | strip: //p[@class='postmeta']/following::* 3 | strip: //p[@class='postmeta'] 4 | strip: //p[@align='left'] 5 | test_url: http://www.roughtype.com/archives/2012/01/power_to_the_da.php -------------------------------------------------------------------------------- /roy.gbiv.com.txt: -------------------------------------------------------------------------------- 1 | strip_comments: no 2 | test_url: http://roy.gbiv.com/untangled/2008/rest-apis-must-be-hypertext-driven -------------------------------------------------------------------------------- /rpgsite.net.txt: -------------------------------------------------------------------------------- 1 | body: //div[@id='news-text'] 2 | prune: no 3 | test_url: http://www.rpgsite.net/news/1964-tetsuya-nomura-says-hell-soon-show-the-future-of-final-fantasy 4 | test_url: http://www.rpgsite.net/news/1965-new-atelier-totori-plus-screens-and-artwork -------------------------------------------------------------------------------- /ruhlman.com.txt: -------------------------------------------------------------------------------- 1 | title: //h1[@class='entry-title'] 2 | author: //span[@class='author vcard'] 3 | date: //abbr[@class='published'] 4 | body: //div[@class='entry-content'] 5 | 6 | test_url: http://ruhlman.com/2009/05/cookbooks-that-teach/ -------------------------------------------------------------------------------- /rust-lang-nursery.github.io.txt: -------------------------------------------------------------------------------- 1 | body: //main 2 | 3 | test_url: https://rust-lang-nursery.github.io/rust-cookbook/web/clients/apis.html 4 | -------------------------------------------------------------------------------- /saltyworld.net.txt: 
-------------------------------------------------------------------------------- 1 | body: //article[contains(@class, 'hentry')] 2 | 3 | prune: no 4 | # remove related 5 | strip_id_or_class: relpost 6 | 7 | test_url: https://saltyworld.net/contrapoints/ 8 | -------------------------------------------------------------------------------- /sayidaty.net.txt: -------------------------------------------------------------------------------- 1 | date: //meta[@property='article:published_time']/@content 2 | body: (//div[contains(@class, 'article-slider')]//img)[1] | //div[contains(@class, 'bottom-article-con')] 3 | 4 | test_url: http://www.sayidaty.net/taxonomy/term/10/all/feed -------------------------------------------------------------------------------- /scinfolex.com.txt: -------------------------------------------------------------------------------- 1 | author: //div[@class="entry-meta"]//a[contains(@class, "url")] 2 | 3 | test_url: https://scinfolex.com/2018/09/15/la-directive-copyright-nest-pas-une-defaite-pour-linternet-libre-et-ouvert/ 4 | -------------------------------------------------------------------------------- /scnsrc.me.txt: -------------------------------------------------------------------------------- 1 | body: //div[@class='storycontent'] 2 | tidy: no 3 | test_url: http://www.scnsrc.me/assassins-creed-2016-720p-bluray-x264-sparks/ 4 | replace_string(height="240"): width="240" height="240" 5 | -------------------------------------------------------------------------------- /scotthelme.co.uk.txt: -------------------------------------------------------------------------------- 1 | body: //div[@class='post-content'] 2 | 3 | test_url: https://scotthelme.co.uk/can-you-get-pwned-with-css/ -------------------------------------------------------------------------------- /scottohara.me.txt: -------------------------------------------------------------------------------- 1 | title: //h1 2 | author: "Scott O'Hara" 3 | date: 
//time[@itemprop="datePublished"]/@datetime 4 | 5 | test_url: https://www.scottohara.me/blog/2019/01/21/how-do-you-figure.html 6 | -------------------------------------------------------------------------------- /sdxcentral.com.txt: -------------------------------------------------------------------------------- 1 | body: //div[@class='entry-content'] 2 | author: //div[@class='entry-byline']//a[@class='entry-author'] 3 | strip: //aside 4 | 5 | test_url: https://www.sdxcentral.com/articles/news/pandemic-muddles-sd-wan-supply-chain/2020/05/ 6 | -------------------------------------------------------------------------------- /searchenginejournal.com.txt: -------------------------------------------------------------------------------- 1 | strip: //ul[contains(@id, "social")] 2 | strip: //div[contains(@class, "ts-fab-wrapper")] 3 | strip: //div[contains(@id, 'gpt-ad')] 4 | 5 | test_url: http://www.searchenginejournal.com/web-design-vs-seo-it-doesnt-make-much-sense/62294/ 6 | -------------------------------------------------------------------------------- /seattletransitblog.com.txt: -------------------------------------------------------------------------------- 1 | title: //h3[@class="storytitle"] 2 | date: //div[@class='meta'] 3 | body: //div[@class='storycontent'] 4 | 5 | test_url: http://seattletransitblog.com/2012/06/19/times-st-louis-interested-in-buying-waterfront-streetcars/ -------------------------------------------------------------------------------- /sfweekly.com.txt: -------------------------------------------------------------------------------- 1 | body: //div[contains(@class, 'content_body')] 2 | strip_id_or_class: det_rel 3 | test_url: http://www.sfweekly.com/2012-03-14/news/cia-lsd-wayne-ritchie-george-h-white-mk-ultra/ -------------------------------------------------------------------------------- /shahinkalantari.com.txt: -------------------------------------------------------------------------------- 1 | body: //main 2 | 3 | # force right-to-left 
text orientation, needed for wallabag 4 | find_string:
): 2 | replace_string(): 3 | 4 | test_url: https://www.slrlounge.com/flash-outdoors-ambient-balancing-natural/ 5 | -------------------------------------------------------------------------------- /smarthomebeginner.com.txt: -------------------------------------------------------------------------------- 1 | body: //div[contains(concat(' ',normalize-space(@class),' '),' inner-post-entry ')] 2 | 3 | test_url: https://www.smarthomebeginner.com/docker-home-media-server-2018-basic/ 4 | -------------------------------------------------------------------------------- /sme.sk.txt: -------------------------------------------------------------------------------- 1 | title: //meta[@property='og:title']/@content 2 | date: //p[@class='autor_line']/b/text() 3 | test_url: http://www.sme.sk/c/6268206/lipsic-vidi-malcharkove-uplatky.html -------------------------------------------------------------------------------- /snip.ly.txt: -------------------------------------------------------------------------------- 1 | single_page_link: //meta[@property="og:url"]/@content 2 | 3 | test_url: http://snip.ly/qa1R -------------------------------------------------------------------------------- /snob.ru.txt: -------------------------------------------------------------------------------- 1 | body: //article[contains(concat(' ',normalize-space(@class),' '),' entry__body ')] 2 | 3 | strip_id_or_class: entry__tags 4 | strip_id_or_class: entry__likes 5 | 6 | prune: no 7 | 8 | test_url: https://snob.ru/society/masony-v-lozhe-i-vokrug-nee-chast-1/ 9 | -------------------------------------------------------------------------------- /soundcity.tv.txt: -------------------------------------------------------------------------------- 1 | strip_id_or_class: sharing 2 | 3 | test_url: http://soundcity.tv/feed/ 4 | -------------------------------------------------------------------------------- /soundonsound.com.txt: -------------------------------------------------------------------------------- 1 | body: 
//article[@role="article"] 2 | prune: no 3 | 4 | test_url: https://www.soundonsound.com/people/massive-attacks-new-studio 5 | test_contains: We usually start with a few basic ideas 6 | -------------------------------------------------------------------------------- /sourcebooks.com.txt: -------------------------------------------------------------------------------- 1 | #grab the actual content div 2 | body: //div[@class='rt-article'] 3 | 4 | test_url: http://www.sourcebooks.com/blog/happy-27th-birthday-sourcebooks.html 5 | -------------------------------------------------------------------------------- /spectrejournal.com.txt: -------------------------------------------------------------------------------- 1 | body: //main 2 | 3 | prune: no 4 | 5 | strip_id_or_class: elementor-widget-share-buttons 6 | 7 | test_url: https://spectrejournal.com/roundtable-on-china/ 8 | test_contains: I know you write in pretty mainstream media 9 | -------------------------------------------------------------------------------- /spiderum.com.txt: -------------------------------------------------------------------------------- 1 | body: //div[contains(concat(' ',normalize-space(@class),' '),' editor ')] 2 | 3 | prune: no 4 | 5 | test_url: https://spiderum.com/bai-dang/Dung-luot-mang-xa-hoi-trong-thoi-gian-ranh-nua-Hay-lam-5-dieu-nay-PvXeTJ9tAR3D 6 | -------------------------------------------------------------------------------- /spin.com.txt: -------------------------------------------------------------------------------- 1 | tidy: no 2 | body: //section[contains(@class, 'main')] 3 | strip: //footer 4 | strip: //a[@class='paginated'] 5 | test_url: http://www.spin.com/articles/bathlands-deep-heart-americas-new-drug-nightmare -------------------------------------------------------------------------------- /splinternews.com.txt: -------------------------------------------------------------------------------- 1 | title: //head/title 2 | author: //meta[@name="author"]/@content 3 | body: 
//div[contains(@class, 'post-content')] 4 | strip: //div[contains(@class, 'content-summary')] 5 | 6 | test_url: https://splinternews.com/jonathan-chait-has-no-excuse-1831076209 7 | -------------------------------------------------------------------------------- /sports.ru.txt: -------------------------------------------------------------------------------- 1 | title: //meta[@property="twitter:title"]/@content 2 | date: //time/@datetime 3 | 4 | test_url: https://www.sports.ru/football/blogs/3326825.html 5 | -------------------------------------------------------------------------------- /sprengsatz.de.txt: -------------------------------------------------------------------------------- 1 | title: //h2 2 | author: string('Michael Spreng') 3 | date: //div[@class='date'] 4 | body: //div[@class='entry'] 5 | test_url: http://www.sprengsatz.de/?p=3691 -------------------------------------------------------------------------------- /sqlite.org.txt: -------------------------------------------------------------------------------- 1 | body: //div[@id='ff-body'] 2 | 3 | replace_string(

):

4 | 5 | prune: no 6 | 7 | test_url: http://www.sqlite.org/fileformat2.html -------------------------------------------------------------------------------- /squashed.tumblr.com.txt: -------------------------------------------------------------------------------- 1 | body: //div[@class='content'] 2 | date: substring-before( //div[@class='unit dateAndNotes'], 'with') 3 | title: //h3 4 | test_url: http://squashed.tumblr.com/post/17613522228/lets-stop-blaming-the-victims-of-predatory-lending -------------------------------------------------------------------------------- /stadt-muenster.de.txt: -------------------------------------------------------------------------------- 1 | body: //div[@id='inhalts-spalte'] 2 | prune: no 3 | strip: //div[@class='footerlinks'] 4 | test_url: https://www.stadt-muenster.de/immobilien/wohnbaupotenzialflaechen/sozialgerechte-bodennutzung.html 5 | -------------------------------------------------------------------------------- /staltz.com.txt: -------------------------------------------------------------------------------- 1 | author: //h2[@class="name-title"] 2 | 3 | test_url: https://staltz.com/a-plan-to-rescue-the-web-from-the-internet.html 4 | -------------------------------------------------------------------------------- /stefanjudis.com.txt: -------------------------------------------------------------------------------- 1 | title: //h1 2 | body: //div[@class="c-markdown"] 3 | date: (//dl[@class="c-pageDetails"]//time[@class="c-prettyDate"]/@datetime)[1] 4 | 5 | test_url: https://www.stefanjudis.com/today-i-learned/css-content-accepts-alternative-text/ 6 | -------------------------------------------------------------------------------- /stjv.fr.txt: -------------------------------------------------------------------------------- 1 | date: //time[contains(@class, 'published')]/@datetime 2 | 3 | test_url: https://www.stjv.fr/2018/01/au-sujet-quantic-dream/ 4 | 
-------------------------------------------------------------------------------- /stopgame.ru.txt: -------------------------------------------------------------------------------- 1 | body: //section[contains(concat(' ',normalize-space(@class),' '),' article ')] 2 | 3 | test_url: https://stopgame.ru/show/113377/phoenotopia_awakening_review 4 | -------------------------------------------------------------------------------- /stumbleupon.com.txt: -------------------------------------------------------------------------------- 1 | single_page_link: //iframe[@id='tb-stumble-frame']/@src 2 | 3 | test_url: http://www.stumbleupon.com/su/35V0wB/zouchmagazine.com/poetry-violet/ -------------------------------------------------------------------------------- /summitroute.com.txt: -------------------------------------------------------------------------------- 1 | prune: no 2 | 3 | test_url: https://summitroute.com/blog/2015/12/24/instagram_bounty_case_study_for_defense/ 4 | -------------------------------------------------------------------------------- /swcarpentry.github.io.txt: -------------------------------------------------------------------------------- 1 | body: //article 2 | 3 | prune: no 4 | 5 | test_url: https://swcarpentry.github.io/shell-novice/02-filedir/index.html 6 | -------------------------------------------------------------------------------- /tbray.org.txt: -------------------------------------------------------------------------------- 1 | body: //div[@id='centercontent'] 2 | strip: //div[@id='rightcontent'] 3 | date: substring-before( //div[@id='cats'], '·') 4 | title: //h1 5 | test_url: http://www.tbray.org/ongoing/When/201x/2012/03/04/Mobile-Money -------------------------------------------------------------------------------- /techcommunity.microsoft.com.txt: -------------------------------------------------------------------------------- 1 | body: //div[contains(concat(' ',normalize-space(@class),' '),' lia-message-body-content ')] 2 | 3 | 
test_url: https://techcommunity.microsoft.com/t5/Azure-Active-Directory-Identity/Your-Pa-word-doesn-t-matter/ba-p/731984 4 | -------------------------------------------------------------------------------- /techmeme.com.txt: -------------------------------------------------------------------------------- 1 | single_page_link_in_feed: //b/a 2 | 3 | test_url: http://www.techmeme.com/feed.xml 4 | -------------------------------------------------------------------------------- /techno-science.net.txt: -------------------------------------------------------------------------------- 1 | title://div[@class="news"]/div[@class="titre"] 2 | body://div[@class="news"]/div[@class="texte"] 3 | test_url: http://www.techno-science.net/?onglet=news&news=14808 4 | -------------------------------------------------------------------------------- /techpinions.com.txt: -------------------------------------------------------------------------------- 1 | body: //div[@class="post"] 2 | 3 | strip: //div[@class="post-meta"] 4 | strip: //div[@id="socialicons"] 5 | strip: //div[@id="authorbox"] 6 | 7 | test_url: http://techpinions.com/why-google-and-microsoft-hate-siri/3572 -------------------------------------------------------------------------------- /terrestres.org.txt: -------------------------------------------------------------------------------- 1 | body: //div[contains(concat(' ',normalize-space(@class),' '),' td-post-content ')] 2 | 3 | strip_id_or_class: td-tags 4 | 5 | test_url: https://www.terrestres.org/2020/06/04/lutter-avec-le-droit-contre-les-derives-de-letat-durgence-sanitaire/ 6 | -------------------------------------------------------------------------------- /the-magazine.org.txt: -------------------------------------------------------------------------------- 1 | tidy: no 2 | 3 | test_url: http://the-magazine.org/1/alone-together-again -------------------------------------------------------------------------------- /the-tls.co.uk.txt: 
-------------------------------------------------------------------------------- 1 | body: //div[contains(@class, 'tls-article-body')] 2 | 3 | test_url: https://www.the-tls.co.uk/articles/katrina-history-1915-2015-andy-horowitz-review-peter-coates/ 4 | -------------------------------------------------------------------------------- /thebaffler.com.txt: -------------------------------------------------------------------------------- 1 | body: //div[@id='pico'] 2 | 3 | strip_id_or_class: wp-block-pullquote 4 | 5 | test_url: https://thebaffler.com/latest/hong-kong-literatures-growing-pains-chu 6 | -------------------------------------------------------------------------------- /thecounter.org.txt: -------------------------------------------------------------------------------- 1 | body: //section[@id="main-article-content"] 2 | 3 | strip_id_or_class: article-pullquote 4 | strip_id_or_class: hide-on-amp 5 | 6 | prune: no 7 | 8 | test_url: https://thecounter.org/familiar-refrain-united-farm-workers-grapples-how-grow-ufw/ 9 | -------------------------------------------------------------------------------- /thefilmexperience.net.txt: -------------------------------------------------------------------------------- 1 | body: //div[@class='body'] 2 | test_url: http://thefilmexperience.net/blog/2011/12/30/distant-relatives-2001-a-space-odyssey-and-the-tree-of-life.html -------------------------------------------------------------------------------- /theintercept.com.txt: -------------------------------------------------------------------------------- 1 | title: //h1[@class="Headline"] 2 | body: //div[@class="PostContent"] 3 | 4 | test_url: https://theintercept.com/2014/10/30/inside-story-matt-taibbis-departure-first-look-media/ 5 | -------------------------------------------------------------------------------- /thenetworkgarden.blogs.com.txt: -------------------------------------------------------------------------------- 1 | body: //div[@id="beta-inner"] 2 | title: 
//h3[@class="entry-header"] 3 | 4 | test_url: http://thenetworkgarden.blogs.com/weblog/2011/09/microsoft-metro-and-the-next-wave-in-computing.html -------------------------------------------------------------------------------- /thenews.coop.txt: -------------------------------------------------------------------------------- 1 | body: //div[@itemprop='articleBody'] 2 | 3 | test_url: http://www.thenews.coop/98221/news/co-operatives/jeremy-corbyn-needs-co-op-movement/ 4 | -------------------------------------------------------------------------------- /theoaklandpress.com.txt: -------------------------------------------------------------------------------- 1 | body: //div[@id='fullstory'] 2 | strip: //div[@id='page_leftbar'] 3 | test_url: http://theoaklandpress.com/articles/2011/04/25/news/doc4db5330e0bce9220005852.txt -------------------------------------------------------------------------------- /theodinproject.com.txt: -------------------------------------------------------------------------------- 1 | body: //div[contains(concat(' ',normalize-space(@class),' '),' lesson-content ')] 2 | 3 | prune: no 4 | 5 | test_url: https://www.theodinproject.com/lessons/foundations-command-line-basics 6 | -------------------------------------------------------------------------------- /thepointmag.com.txt: -------------------------------------------------------------------------------- 1 | body: //div[@class='article'] 2 | strip_id_or_class: z-max 3 | strip_id_or_class: readLaterMenu 4 | 5 | test_url: https://thepointmag.com/2016/examined-life/can-liberal-education-save-the-sciences 6 | -------------------------------------------------------------------------------- /therumpus.net.txt: -------------------------------------------------------------------------------- 1 | title: /html/body/div/div[2]/div/div/h1 2 | 3 | body: /html/body/div/div[2]/div/div/div[2] 4 | test_url: http://therumpus.net/2010/07/the-rumpus-interview-with-david-means/?full=yes 
-------------------------------------------------------------------------------- /theses.enc.sorbonne.fr.txt: -------------------------------------------------------------------------------- 1 | title: //h1[@class="head"] 2 | author: //div[@class="name"] 3 | body: //article[@id="text"] 4 | 5 | test_url: http://theses.enc.sorbonne.fr/2014/sidre 6 | -------------------------------------------------------------------------------- /thesimpledollar.com.txt: -------------------------------------------------------------------------------- 1 | title: //h3[@class='post-title']/a[@class='post-title-link'] 2 | body: //div[@class='post-content'] 3 | author: //div[@class='post-meta-under-title']/a 4 | test_url: http://www.thesimpledollar.com/2011/09/13/determining-the-size-of-your-emergency-fund/ -------------------------------------------------------------------------------- /thesocialitefamily.com.txt: -------------------------------------------------------------------------------- 1 | body: //div[contains(concat(' ',normalize-space(@class),' '),' strates-single ')] 2 | 3 | test_url: https://www.thesocialitefamily.com/familles/mulhouse/chez-anne-hubert-la-cerise-sur-le-gateau/ 4 | -------------------------------------------------------------------------------- /theteaspot.com.txt: -------------------------------------------------------------------------------- 1 | body: //main[@id='MainContent'] 2 | 3 | prune: no 4 | 5 | test_url: https://www.theteaspot.com/pages/about-tea 6 | -------------------------------------------------------------------------------- /thethaovanhoa.vn.txt: -------------------------------------------------------------------------------- 1 | strip:/html/body/form/div[2]/div[3]/div/div/div/div/div/div/div/div/div/div[2]/div[3]/div[2]/div/p[2] 2 | test_url: http://thethaovanhoa.vn/151N20110519085606745T129/levante-quyet-giu-caicedo.htm -------------------------------------------------------------------------------- /thewirecutter.com.txt: 
-------------------------------------------------------------------------------- 1 | body: //main/div/article 2 | 3 | strip: //header 4 | strip: //aside 5 | 6 | author: //p[@data-scp="author_name"] 7 | date: //time/@datetime 8 | 9 | test_url: https://thewirecutter.com/money/credit-cards/ 10 | -------------------------------------------------------------------------------- /thingiverse.com.txt: -------------------------------------------------------------------------------- 1 | tidy: yes 2 | autodetect_on_failure: yes 3 | prune: yes 4 | body: /html/head/title 5 | 6 | test_url: https://www.thingiverse.com/thing:3868321 7 | test_contains: Panther Origami -------------------------------------------------------------------------------- /thinkspot.com.txt: -------------------------------------------------------------------------------- 1 | # This only appears after JS is processed 2 | body: //div[contains(@class, 'desc_div')] 3 | 4 | insert_detected_image: no 5 | 6 | prune: no 7 | 8 | test_url: https://www.thinkspot.com/discourse/OJumEP/post/spencer-t-folmar/telling-stories-that-liberate/9YtZ6zl 9 | -------------------------------------------------------------------------------- /thisamericanlife.org.txt: -------------------------------------------------------------------------------- 1 | body: //div[@id='content'] 2 | 3 | test_url: https://www.thisamericanlife.org/282/transcript 4 | test_contains: I was part of sending an innocent man to jail 5 | -------------------------------------------------------------------------------- /tidbits.com.txt: -------------------------------------------------------------------------------- 1 | author: //span[@class='fn'] 2 | date: substring-before(substring-after(//*[@id='center_ajax_sub']/div/div[3],'|'),'|') 3 | test_url: http://tidbits.com/article/12651 -------------------------------------------------------------------------------- /tijd.be.txt: -------------------------------------------------------------------------------- 1 | 
strip: //div[@class="ac_paragraph-hidden"] 2 | 3 | test_url: https://www.tijd.be/politiek-economie/internationaal/algemeen/ik-ben-vooral-bezorgd-dat-corona-uitbreekt-in-afrika/10204834.html 4 | test_contains: U klinkt gealarmeerder 5 | -------------------------------------------------------------------------------- /timeshighereducation.co.uk.txt: -------------------------------------------------------------------------------- 1 | title: //h1 2 | body: //div[@class="storytext"] 3 | strip: //div[@id="thelogin"] 4 | strip: //*[@class="hide"] 5 | strip: //div[@id="anchored"] 6 | test_url: http://www.timeshighereducation.co.uk/story.asp?sectioncode=26&storycode=416124&c=1 -------------------------------------------------------------------------------- /timeshighereducation.com.txt: -------------------------------------------------------------------------------- 1 | body: //div[@class="col-md-12 radix-layouts-contentheader panel-panel"] 2 | strip: //div[@class="htmlContent subscribe_box"] 3 | test_url: https://www.timeshighereducation.com/blog/jeremy-corbyn-serious-about-free-higher-education 4 | -------------------------------------------------------------------------------- /tldp.org.txt: -------------------------------------------------------------------------------- 1 | title: //title 2 | body: //h2 | //p | //ul 3 | prune: no 4 | tidy: no 5 | 6 | test_url: http://www.tldp.org/HOWTO/Plug-and-Play-HOWTO-7.html -------------------------------------------------------------------------------- /tofugu.com.txt: -------------------------------------------------------------------------------- 1 | body://div[@class='entry-content'] 2 | 3 | test_url: http://www.tofugu.com/2015/07/20/interview-with-toriena-japanese-chiptune/ 4 | -------------------------------------------------------------------------------- /toolinux.com.txt: -------------------------------------------------------------------------------- 1 | title: //h2[contains(@class,'news')] 2 | body: 
//div[contains(@class,'articleContent')] 3 | date: substring-after(//div[@class = 'SupaDate']/text(), 'le') 4 | 5 | test_url: http://www.toolinux.com/Wi-Fi-Linksys-WRT-la-legende-de 6 | -------------------------------------------------------------------------------- /toolsandtoys.net.txt: -------------------------------------------------------------------------------- 1 | body: //div[@class='post'] 2 | 3 | strip: //div[@class='social'] 4 | strip: //span[@class='next'] 5 | strip: //span[@class='previous'] 6 | test_url: http://toolsandtoys.net/noble-tonic-02/ -------------------------------------------------------------------------------- /touilleur-express.fr.txt: -------------------------------------------------------------------------------- 1 | body: //div[contains(concat(' ',normalize-space(@class),' '), ' post_ctn ')] 2 | 3 | strip_id_or_class: yarpp-related 4 | 5 | test_url: https://www.touilleur-express.fr/2022/03/08/le-chiffrement-de-bout-en-bout-et-la-signature-denveloppe/ -------------------------------------------------------------------------------- /trailer.web-view.net.txt: -------------------------------------------------------------------------------- 1 | title: concat(substring-before(//title,':'),': ',//div[@class='Date2']) 2 | test_url: http://trailer.web-view.net/Show/0XC4EFE5D648B716BA2E134BC7CE61B9CC001E04F11E9434438186735DBD637488.htm -------------------------------------------------------------------------------- /triplebyte.com.txt: -------------------------------------------------------------------------------- 1 | body: //article[contains(concat(' ',normalize-space(@class), ' '), ' blog-post ')] 2 | 3 | test_url: https://triplebyte.com/blog/marissa-mayer-interview 4 | -------------------------------------------------------------------------------- /tthfanfic.org.txt: -------------------------------------------------------------------------------- 1 | title: //h2 2 | author: //a[starts-with(@href, '/AuthorStories')] 3 | body: 
//div[@id='storyinnerbody'] 4 | test_url: http://www.tthfanfic.org/Story-6512/Kudra+Journeys.htm -------------------------------------------------------------------------------- /tuaw.com.txt: -------------------------------------------------------------------------------- 1 | title: //h1[@class='posttitle'] 2 | author: //span[@class='author']/a 3 | date: //span[@class='timestamp'] 4 | body: //div[@class='body'] 5 | 6 | test_url: http://www.tuaw.com/2011/10/19/apple-posts-fans-memories-of-steve-jobs/ -------------------------------------------------------------------------------- /turnoff.us.txt: -------------------------------------------------------------------------------- 1 | title: //h1[@class='post-title'] 2 | body: //article[@class='post-content'] 3 | test_url: https://turnoff.us/geek/the-depressed-developer-13/ 4 | -------------------------------------------------------------------------------- /tvtropes.org.txt: -------------------------------------------------------------------------------- 1 | #The examples are useful - keep 2 | #strip: //div[contains(concat(' ',normalize-space(@class),' '),' folder ')] 3 | #strip: //div[contains(concat(' ',normalize-space(@class),' '),' folderlabel ')] 4 | 5 | test_url: https://tvtropes.org/pmwiki/pmwiki.php/Main/Masquerade 6 | -------------------------------------------------------------------------------- /urbandictionary.com.txt: -------------------------------------------------------------------------------- 1 | title: //title 2 | body: //table[@id='entries'] 3 | test_url: http://www.urbandictionary.com/define.php?term=Grown-Ass 4 | -------------------------------------------------------------------------------- /useit.com.txt: -------------------------------------------------------------------------------- 1 | title: //h1 2 | 3 | date: substring-after(//p[@class='overline']/strong, ',') 4 | body: //div[@class="maintext"] 5 | strip: //p[@class='overline'] 6 | strip: //h1 7 | tidy: no 8 | test_url: 
http://www.useit.com/alertbox/mobile-startup-screen.html -------------------------------------------------------------------------------- /utdailybeacon.com.txt: -------------------------------------------------------------------------------- 1 | body: //div[@id='blox-story-text'] 2 | test_url: http://www.utdailybeacon.com/news/article_ccf6d024-0f15-11e5-ae29-9f63598deb81.html 3 | -------------------------------------------------------------------------------- /utiliser-lightroom.com.txt: -------------------------------------------------------------------------------- 1 | title: //div[@class="titrearticle"] 2 | body: //div[@class="article"] 3 | 4 | test_url: http://www.utiliser-lightroom.com/blog/2019/04/23/skylum-flex-et-airmagic-pour-les-utilisateurs-de-lightroom/ 5 | -------------------------------------------------------------------------------- /ux.artu.tv.txt: -------------------------------------------------------------------------------- 1 | author: ("Arturo Toledo") 2 | title: //div[@class="post"]/h2 3 | body: //div[@class="entry"] 4 | 5 | # Remove Twitter button 6 | strip: //div[@class="entry"]/p[2]/a/img 7 | test_url: http://ux.artu.tv/?p=192 -------------------------------------------------------------------------------- /vakarm.net.txt: -------------------------------------------------------------------------------- 1 | body: //div[@class="block_news_main_content_preview"] 2 | 3 | test_url: https://www.vakarm.net/news/read/Choual-History-X-tout-un-cinema/10270/2 4 | -------------------------------------------------------------------------------- /valdaiclub.com.txt: -------------------------------------------------------------------------------- 1 | body: //div[contains(@class, 'dk-entry__body')] 2 | author: //meta[@property="author"]/@content 3 | title: //meta[@property="og:title"]/@content 4 | 5 | prune: no 6 | 7 | test_url: https://valdaiclub.com/a/highlights/do-empires-have-allies/ 8 | 
-------------------------------------------------------------------------------- /varsity.co.uk.txt: -------------------------------------------------------------------------------- 1 | # FB comments are inside an h2. Weird. Without this, the line 'Comments' is preserved by the text parser 2 | 3 | strip: //h2 4 | test_url: http://www.varsity.co.uk/reviews/2662 -------------------------------------------------------------------------------- /vc.ru.txt: -------------------------------------------------------------------------------- 1 | body: //div[contains(concat(' ',normalize-space(@class),' '),' l-entry ')] 2 | 3 | strip_id_or_class: l-hidden 4 | strip_id_or_class: l-entry__banner 5 | 6 | test_url: https://vc.ru/finance/128687-60-poleznyh-saytov-dlya-poiska-investiciy-v-startap 7 | -------------------------------------------------------------------------------- /vedonlyonti.com.txt: -------------------------------------------------------------------------------- 1 | strip: //style 2 | 3 | test_url: https://vedonlyonti.com/veikkausvihjeet/pitkavetovihjeet/nba-boston-celtics-cleveland-cavaliers-8-5-2024 4 | -------------------------------------------------------------------------------- /venturebeat.com.txt: -------------------------------------------------------------------------------- 1 | title: //h1[@class="entry-title"] 2 | author: //div[@class="author-name"] 3 | date: //span[@class="the-time"] 4 | body: //div[@class="entry-content"] 5 | strip: //div[@class="vb-gallery"] 6 | test_url: http://venturebeat.com/2012/07/17/marissa-mayer-yahoo/#s:mayer-1 -------------------------------------------------------------------------------- /vg.no.txt: -------------------------------------------------------------------------------- 1 | body: //div[@id='artikkelspalte'] 2 | strip_id_or_class: 'breadcrumb' 3 | test_url: http://www.vg.no/spill/artikkel.php?artid=10003628 -------------------------------------------------------------------------------- /viget.com.txt: 
-------------------------------------------------------------------------------- 1 | body: (//article)[1] 2 | 3 | strip_id_or_class: sharer 4 | 5 | prune: no 6 | 7 | test_url: https://www.viget.com/articles/understanding-futures-in-rust-part-1/ 8 | -------------------------------------------------------------------------------- /visualcapitalist.com.txt: -------------------------------------------------------------------------------- 1 | title: //h1 2 | body: //div[@id='mvp-content-main'] | //article//header 3 | 4 | strip_id_or_class: mvp-post-cat 5 | 6 | test_url: https://www.visualcapitalist.com/from-greek-to-latin-visualizing-the-evolution-of-the-alphabet/ 7 | -------------------------------------------------------------------------------- /vitispr.com.txt: -------------------------------------------------------------------------------- 1 | strip: //*[(@id = "ja-search")] 2 | body: //*[(@id = "ja-mainbody")] 3 | body: //*[(@id = "content-mass-bottom")] 4 | strip://h3[contains(span,'Related Posts')] 5 | strip://img 6 | test_url: http://vitispr.com/blog/coventry-is-a-technology-hotspot -------------------------------------------------------------------------------- /vivirmexico.com.txt: -------------------------------------------------------------------------------- 1 | body: //*[(@class = "historia")] 2 | test_url: http://vivirmexico.com/2011/09/en-veracruz-arrojan-35-cuerpos-a-plena-luz-del-dia-esta-si-es-una-alarma-social -------------------------------------------------------------------------------- /vk.com.txt: -------------------------------------------------------------------------------- 1 | # use this to avoid meta redirect to badbrowser.php 2 | # user agent will cause a redirect to m.vk.com (mobile version) instead 3 | http_header(user-agent): PHP/7.2 4 | 5 | test_url: https://vk.com/noamchomskyvk?w=wall433994637_327 6 | -------------------------------------------------------------------------------- /voltairenet.org.txt: 
-------------------------------------------------------------------------------- 1 | title: //h1[contains(concat(' ',normalize-space(@class),' '),' titre_serif_1 ')] 2 | body: //div[contains(concat(' ',normalize-space(@class),' '),' texte_sans ')] 3 | 4 | test_url: http://www.voltairenet.org/article195149.html -------------------------------------------------------------------------------- /vot-tak.tv.txt: -------------------------------------------------------------------------------- 1 | # prevent duplicated images 2 | strip: //img[@fallback] 3 | 4 | test_url: https://vot-tak.tv/novosti/16-08-2021-nevzlin-intervyu/ 5 | -------------------------------------------------------------------------------- /vozpopuli.com.txt: -------------------------------------------------------------------------------- 1 | title: //h1 2 | body: //div[@class='mce-body'] 3 | 4 | strip: //aside 5 | 6 | test_url: https://www.vozpopuli.com/opinion/pandemia-racismo-iglesias_0_1365163963.html 7 | test_contains: Ande yo caliente y muérase la gente 8 | -------------------------------------------------------------------------------- /w3.org.txt: -------------------------------------------------------------------------------- 1 | date: //time[@class="entry-date"]/@datetime 2 | 3 | test_url: https://www.w3.org/blog/2019/05/w3c-and-whatwg-to-work-together-to-advance-the-open-web-platform/ 4 | -------------------------------------------------------------------------------- /wallabag.org.txt: -------------------------------------------------------------------------------- 1 | date: //meta[@name="date"]/@content 2 | 3 | test_url: https://wallabag.org/news/20241103-new-release-wallabag-2610/ -------------------------------------------------------------------------------- /warnerbros.fr.txt: -------------------------------------------------------------------------------- 1 | body: //div[@class="article-body"] 2 | test_url: https://www.warnerbros.fr/articles/magic-mike-xxl-adam-rodriguez-portrait 3 | 
-------------------------------------------------------------------------------- /warriordudimanche.net.txt: -------------------------------------------------------------------------------- 1 | title: //article[contains(concat(' ',normalize-space(@class),' '),' article ')]//header//h1 2 | body: //article[contains(concat(' ',normalize-space(@class),' '),' article ')]//section 3 | 4 | test_url: http://warriordudimanche.net/article458/589065212a599 -------------------------------------------------------------------------------- /watoday.com.au.txt: -------------------------------------------------------------------------------- 1 | # strip the breadcrumb 2 | strip: //div//ul 3 | strip: //aside 4 | strip_id_or_class: adWrapper 5 | strip_id_or_class: noPrint 6 | 7 | test_url: https://www.watoday.com.au/business/the-economy/no-one-died-behind-the-typo-on-the-new-50-note-20190618-p51yqg.html 8 | -------------------------------------------------------------------------------- /web-libre.org.txt: -------------------------------------------------------------------------------- 1 | body: //div[@id='template_article'] 2 | 3 | strip_id_or_class: article_more 4 | strip: //hr 5 | 6 | test_url: http://www.web-libre.org/dossiers/jacuzzi-gonflable,8493.html -------------------------------------------------------------------------------- /web.dev.txt: -------------------------------------------------------------------------------- 1 | body: //div[contains(@class, "w-post-content")] 2 | author: //a[@class="w-author__name-link"] 3 | date: //header//time 4 | 5 | strip: //div[@class="w-post-breadcrumbs"] 6 | strip: //div[@class="w-chips"] 7 | 8 | test_url: https://web.dev/content-visibility/ 9 | -------------------------------------------------------------------------------- /wenow.com.txt: -------------------------------------------------------------------------------- 1 | title: //article//h1 2 | 3 | strip: //a[@class="post-previous"] 4 | strip: //aside 5 | 6 | test_url: 
https://www.wenow.com/2021/06/07/empreinte-carbone-de-la-viande/ 7 | -------------------------------------------------------------------------------- /what-if.xkcd.com.txt: -------------------------------------------------------------------------------- 1 | autodetect_next_page: no 2 | test_url: http://what-if.xkcd.com/1/ -------------------------------------------------------------------------------- /whatever.scalzi.com.txt: -------------------------------------------------------------------------------- 1 | strip: //div[@class="navigation"] 2 | strip: //div[@id="sidebar"] 3 | strip: //div[@id="post-extra-content"] 4 | strip: //div[@id="footer"] 5 | strip: //div[contains(@class, "sharing")] 6 | 7 | test_url: http://whatever.scalzi.com/2011/01/09/quick-giffords-follow-up/ -------------------------------------------------------------------------------- /wiki.guildwars.com.txt: -------------------------------------------------------------------------------- 1 | title: //h1 2 | body: //div[@id='content'] 3 | strip_id_or_class: editsection 4 | strip_id_or_class: toc 5 | strip: //div[@id='siteNotice'] 6 | strip: //div[@id='content']//table[last()] 7 | prune: no 8 | test_url: http://wiki.guildwars.com/wiki/Monk -------------------------------------------------------------------------------- /wiki.guildwars2.com.txt: -------------------------------------------------------------------------------- 1 | title: //h1 2 | body: //div[@id='content'] 3 | strip_id_or_class: editsection 4 | strip_id_or_class: toc 5 | strip: //div[@id='siteNotice'] 6 | strip: //div[@id='content']//table[last()] 7 | prune: no 8 | test_url: http://wiki.guildwars2.com/wiki/Guardian -------------------------------------------------------------------------------- /wikiwand.com.txt: -------------------------------------------------------------------------------- 1 | body: //div[@id="fullContent"] 2 | 3 | strip: //div[@data-aaad] 4 | 5 | prune: no 6 | 7 | test_url: 
https://www.wikiwand.com/en/Maslow%27s_hierarchy_of_needs 8 | test_contains: Personal security 9 | -------------------------------------------------------------------------------- /will-self.com.txt: -------------------------------------------------------------------------------- 1 | strip: //div[@class="widget-area"] 2 | title: //*[@class="entry-title"] 3 | date: //time[@class="entry-date"] 4 | test_url: http://will-self.com/2012/02/01/real-meals-dominos-pizza/ -------------------------------------------------------------------------------- /wmpoweruser.com.txt: -------------------------------------------------------------------------------- 1 | date://*[@class="entry-date"] 2 | author://*[@class="author vcard"] 3 | strip://*[@style="position:relative;left:72px;top:2px;"]|//*[@id="authorbox"] 4 | test_url: http://wmpoweruser.com/breaking-nokia-announces-nfc-support-in-lumia-610-windows-phone-device/ -------------------------------------------------------------------------------- /wochenanzeiger.de.txt: -------------------------------------------------------------------------------- 1 | strip_id_or_class: kleinertext 2 | strip: //h3[text() = 'Weiterlesen'] 3 | strip: //div[starts-with(@class, 'box') and contains(@class, '_simple')] 4 | 5 | test_url: https://www.wochenanzeiger.de/article/238700.html 6 | 7 | -------------------------------------------------------------------------------- /wordpress.org.txt: -------------------------------------------------------------------------------- 1 | author: //div[@class="meta"]/a[1] 2 | 3 | strip: //div[@class="meta"] 4 | strip: //div[@id="likes-other-gravatars"] 5 | strip: //noscript 6 | 7 | test_url: https://wordpress.org/news/2018/07/update-on-gutenberg/ 8 | -------------------------------------------------------------------------------- /worldwidewords.org.txt: -------------------------------------------------------------------------------- 1 | title: //p[@id='content'] 2 | 3 | body: //div[@class='contentblock'] 4 | 
test_url: http://www.worldwidewords.org/weirdwords/ww-gro1.htm -------------------------------------------------------------------------------- /wpbeginner.com.txt: -------------------------------------------------------------------------------- 1 | # Required to load the feed properly 2 | http_header(user-agent): Mozilla/5.0 (Windows NT 10.0; Win64; x64; rv:98.0) Gecko/20100101 Firefox/98.0 3 | 4 | test_url: https://www.wpbeginner.com/feed/ 5 | -------------------------------------------------------------------------------- /wphive.com.txt: -------------------------------------------------------------------------------- 1 | # Required to load the feed properly 2 | http_header(user-agent): Mozilla/5.0 (Windows NT 10.0; Win64; x64; rv:98.0) Gecko/20100101 Firefox/98.0 3 | 4 | test_url: https://www.wphive.com/feed/ 5 | -------------------------------------------------------------------------------- /wpmayor.com.txt: -------------------------------------------------------------------------------- 1 | body: //div[@id='nrelate_flyout_placeholder'] 2 | 3 | strip_id_or_class: share 4 | 5 | prune: no 6 | 7 | test_url: http://www.wpmayor.com/themes/wordpress-portfolio-resume-themes/ 8 | test_url: http://www.wpmayor.com/feed/ -------------------------------------------------------------------------------- /writerunboxed.com.txt: -------------------------------------------------------------------------------- 1 | http_header(User-agent): Mozilla/5.0 (Windows NT 10.0; Win64; x64; rv:109.0) Gecko/20100101 Firefox/115.0 2 | 3 | test_url: https://writerunboxed.com/2021/09/23/writerslife-the-411-on-writing-retreats/ 4 | -------------------------------------------------------------------------------- /www.seriouseats.com.txt: -------------------------------------------------------------------------------- 1 | body: //div[contains(@class, 'recipe-wrapper')] 2 | 3 | test_url: https://www.seriouseats.com/recipes/2014/02/braised-short-ribs-from-daniel.html 4 | 
-------------------------------------------------------------------------------- /www2.cnrs.fr.txt: -------------------------------------------------------------------------------- 1 | # Site configuration for CNRS press releases 2 | 3 | body: //div[@id="contenu"]//h2[@id="chapeau"] | //div[@id="contenu"]/div[@id="textContenu"] 4 | 5 | test_url: http://www2.cnrs.fr/presse/communique/5327.htm 6 | -------------------------------------------------------------------------------- /wz-newsline.de.txt: -------------------------------------------------------------------------------- 1 | title://h1 2 | 3 | date://p[@class='articleDate'] 4 | body://div[@class='articleBody wzStandardArticle'] 5 | test_url: http://www.wz-newsline.de/home/sport/tennis/federer-zum-vierten-mal-sieger-in-indian-wells-1.938050 -------------------------------------------------------------------------------- /xlsemanal.com.txt: -------------------------------------------------------------------------------- 1 | body: //section[contains(concat(' ',normalize-space(@class),' '),' post-content ')] 2 | 3 | test_url: http://www.xlsemanal.com/firmas/20171126/perez-reverte-el-hombre-que-si-estaba-alli.html 4 | -------------------------------------------------------------------------------- /yosoy.red.txt: -------------------------------------------------------------------------------- 1 | prune: no 2 | 3 | test_url: https://yosoy.red/2021/01/22/politica/ 4 | test_contains: es fundamental entender que los sistemas son creados por humanos 5 | -------------------------------------------------------------------------------- /yostivanich.com.txt: -------------------------------------------------------------------------------- 1 | title://div[@class='entry-title'] 2 | body://div[@class='entry-content'] 3 | strip_comments:yes 4 | convert_double_br_tags:yes 5 | test_url: http://www.yostivanich.com/2010/07/11/wired-com-with-world-watching-wikileaks-falls-into-disrepair/ 
-------------------------------------------------------------------------------- /yourerie.com.txt: -------------------------------------------------------------------------------- 1 | body: //div[@itemprop="articleBody"] 2 | test_url: http://www.yourerie.com/news/news-article/d/story/cd-release-party-at-pi-downs/22898/G_gFL3mSQkWH_DW2wLuMOA 3 | -------------------------------------------------------------------------------- /zaknrw.de.txt: -------------------------------------------------------------------------------- 1 | body: //div[contains(concat(' ',normalize-space(@class),' '),' single-content ')] 2 | 3 | test_url: http://www.zaknrw.de/medium/audience-development-und-diversitaet 4 | -------------------------------------------------------------------------------- /zataz.com.txt: -------------------------------------------------------------------------------- 1 | title: //h1[@class="blog-title"] 2 | 3 | test_url: https://www.zataz.com/bientot-noel-securisons-le-prochain-pc-de-la-famille/ 4 | -------------------------------------------------------------------------------- /zerokspot.com.txt: -------------------------------------------------------------------------------- 1 | title: //h1 2 | body: //div[@id="primarycontent"] 3 | test_url: http://zerokspot.com/weblog/2011/06/26/europython2011/ -------------------------------------------------------------------------------- /zoomit.ir.txt: -------------------------------------------------------------------------------- 1 | body: //div[@itemprop="image" or @itemprop="description" or @itemprop="articleBody"] 2 | 3 | test_url: http://www.zoomit.ir/2017/2/25/152960/tiny-engine-turns-natural-gas-into-hydrogen/ 4 | --------------------------------------------------------------------------------