├── .gitignore ├── _config.yml ├── vendor ├── composer │ ├── installed.json │ ├── autoload_psr4.php │ ├── autoload_classmap.php │ └── autoload_namespaces.php └── autoload.php ├── Procfile ├── site_config ├── standard │ ├── version.txt │ ├── getpocket.com.txt │ ├── feeds.feedblitz.com.txt │ ├── ganglia.info.txt │ ├── autocrypt.org.txt │ ├── index.php │ ├── what-if.xkcd.com.txt │ ├── lukew.com.txt │ ├── soundcity.tv.txt │ ├── crimemagazine.com.txt │ ├── ht.ly.txt │ ├── the-magazine.org.txt │ ├── pxlnv.com.txt │ ├── alex.mullr.net.txt │ ├── chareidi.org.txt │ ├── opensource.org.txt │ ├── snip.ly.txt │ ├── techmeme.com.txt │ ├── blog.fefe.de.txt │ ├── axesslab.com.txt │ ├── bitelia.com.txt │ ├── blog.spu.edu.txt │ ├── ecetia.com.txt │ ├── extracine.com.txt │ ├── help.fivefilters.org.txt │ ├── jjahnke.net.txt │ ├── kumailplus.com.txt │ ├── luxuo.com.txt │ ├── t3n.de.txt │ ├── unherd.com.txt │ ├── zhuanlan.zhihu.com.txt │ ├── facta.co.jp.txt │ ├── mattcutts.com.txt │ ├── meowni.ca.txt │ ├── motorfull.com.txt │ ├── roy.gbiv.com.txt │ ├── 512pixels.net.txt │ ├── apple.news.txt │ ├── elance.com.txt │ ├── getnews.jp.txt │ ├── jamesclear.com.txt │ ├── lostgarden.com.txt │ ├── mbl.is.txt │ ├── n.survol.fr.txt │ ├── acidcow.com.txt │ ├── alseraj.net.txt │ ├── blogs.gnome.org.txt │ ├── kachestvo.ru.txt │ ├── monkeyzen.com.txt │ ├── news.ycombinator.com.txt │ ├── paquier.xyz.txt │ ├── allafrica.com.txt │ ├── carlchenet.com.txt │ ├── doc.wallabag.org.txt │ ├── eternabuenosaires.com.txt │ ├── fakirpresse.info.txt │ ├── fivefilters.org.txt │ ├── fok.nl.txt │ ├── gist.github.com.txt │ ├── gsmarena.com.txt │ ├── indehekken.net.txt │ ├── macdrifter.com.txt │ ├── marksdailyapple.com.txt │ ├── osmand.net.txt │ ├── summitroute.com.txt │ ├── zerokspot.com.txt │ ├── blog.imirhil.fr.txt │ ├── dagogtid.no.txt │ ├── dailydot.com.txt │ ├── drdobbs.com.txt │ ├── flyingmachinestudios.com.txt │ ├── gizmovil.com.txt │ ├── goodfil.ms.txt │ ├── je-suis-papa.com.txt │ ├── staltz.com.txt │ ├── 
stjv.fr.txt │ ├── appleweblog.com.txt │ ├── dropbox.com.txt │ ├── gihyo.jp.txt │ ├── hiperpop.com.txt │ ├── jungle-world.com.txt │ ├── krone.at.txt │ ├── panic.com.txt │ ├── tofugu.com.txt │ ├── urbandictionary.com.txt │ ├── vg.no.txt │ ├── warnerbros.fr.txt │ ├── zataz.com.txt │ ├── LICENSE.txt │ ├── altfoto.com.txt │ ├── blogs.forbes.com.txt │ ├── brucelawson.co.uk.txt │ ├── cucharasonica.com.txt │ ├── dansdata.com.txt │ ├── hipertextual.com.txt │ ├── interviewmagazine.com.txt │ ├── jvt.me.txt │ ├── phototrend.fr.txt │ ├── portertech.ca.txt │ ├── renenekuda.cz.txt │ ├── usccb.org.txt │ ├── crn.de.txt │ ├── eff.org.txt │ ├── finexpert.e15.cz.txt │ ├── marigold.cz.txt │ ├── news.rub.de.txt │ ├── news.techmeme.com.txt │ ├── pentaxforums.com.txt │ ├── pieria.co.uk.txt │ ├── tldp.org.txt │ ├── gizmologia.com.txt │ ├── happyassassin.net.txt │ ├── iansommerville.com.txt │ ├── iplaysoft.com.txt │ ├── lefilrouge.media.txt │ ├── lupa.cz.txt │ ├── matt.might.net.txt │ ├── monkeyuser.com.txt │ ├── radionz.co.nz.txt │ ├── sivers.org.txt │ ├── thenews.coop.txt │ ├── turnoff.us.txt │ ├── utdailybeacon.com.txt │ ├── worldwidewords.org.txt │ ├── betabeat.com.txt │ ├── cashless.pl.txt │ ├── davidwalsh.name.txt │ ├── democracynow.org.txt │ ├── explosm.net.txt │ ├── freelancer.com.txt │ ├── gauchiste.fr.txt │ ├── hs.fi.txt │ ├── izismile.com.txt │ ├── jobbank.gc.ca.txt │ ├── mein-mmo.de.txt │ ├── mytotalretail.com.txt │ ├── nplusonemag.com.txt │ ├── signal.org.txt │ ├── stumbleupon.com.txt │ ├── www3.imperial.ac.uk.txt │ ├── cooper.com.txt │ ├── hackertarget.com.txt │ ├── juliareda.eu.txt │ ├── kresus.org.txt │ ├── letraslibres.com.txt │ ├── longform.org.txt │ ├── oschina.net.txt │ ├── php.net.txt │ ├── alexduner.com.txt │ ├── archdaily.com.txt │ ├── berlingske.dk.txt │ ├── codeproject.com.txt │ ├── doughellmann.com.txt │ ├── esglobal.org.txt │ ├── fokus.se.txt │ ├── geenstijl.nl.txt │ ├── gold.ac.uk.txt │ ├── ianlewis.org.txt │ ├── nextcloud.com.txt │ ├── sme.sk.txt │ ├── 
sourcebooks.com.txt │ ├── sprengsatz.de.txt │ ├── thefilmexperience.net.txt │ ├── triplebyte.com.txt │ ├── vivirmexico.com.txt │ ├── w3.org.txt │ ├── www.seriouseats.com.txt │ ├── a11ywithlindsey.com.txt │ ├── blog.eng.xogrp.com.txt │ ├── blog.nightly.mozilla.org.txt │ ├── caffereggio.net.txt │ ├── economie.gouv.fr.txt │ ├── elblogsalmon.com.txt │ ├── lvsl.fr.txt │ ├── marriedtothesea.com.txt │ ├── pastepad.fivefilters.org.txt │ ├── pixellibre.net.txt │ ├── pmf.silvrback.com.txt │ ├── pogue.blogs.nytimes.com.txt │ ├── queerty.com.txt │ ├── theses.enc.sorbonne.fr.txt │ ├── tidbits.com.txt │ ├── viget.com.txt │ ├── yourerie.com.txt │ ├── 9to5mac.com.txt │ ├── cn.engadget.com.txt │ ├── dictionary.reference.com.txt │ ├── ericsuh.com.txt │ ├── f-droid.org.txt │ ├── github.blog.txt │ ├── grumpygamer.com.txt │ ├── hmercer.com.txt │ ├── laughingsquid.com.txt │ ├── lawfareblog.com.txt │ ├── osmc.tv.txt │ ├── radar.oreilly.com.txt │ ├── shahrsakhtafzar.com.txt │ ├── theoaklandpress.com.txt │ ├── thisamericanlife.org.txt │ ├── zaknrw.de.txt │ ├── blogs.reuters.com.txt │ ├── crimethinc.com.txt │ ├── good.is.txt │ ├── highscalability.com.txt │ ├── marketresearchdirect.com.txt │ ├── prolost.com.txt │ ├── redalemeden.com.txt │ ├── techno-science.net.txt │ ├── tthfanfic.org.txt │ ├── web-libre.org.txt │ ├── americanthinker.com.txt │ ├── autoactu.com.txt │ ├── bobbyromeo.com.txt │ ├── code.google.com.txt │ ├── historic-uk.com.txt │ ├── mebedo.de.txt │ ├── mises.org.txt │ ├── pymotw.com.txt │ ├── saltyworld.net.txt │ ├── sfweekly.com.txt │ ├── share.ez.no.txt │ ├── sqlite.org.txt │ ├── varsity.co.uk.txt │ ├── brandingstrategyinsider.com.txt │ ├── brettterpstra.com.txt │ ├── fair.org.txt │ ├── ft.com.txt │ ├── iphonetweak.fr.txt │ ├── m.theregister.co.uk.txt │ ├── motorcyclistonline.com.txt │ ├── publications.parliament.uk.txt │ ├── robertsspaceindustries.com.txt │ ├── scottohara.me.txt │ ├── spectrum.ieee.org.txt │ ├── splitsider.com.txt │ ├── theintercept.com.txt │ ├── 
therumpus.net.txt │ ├── will-self.com.txt │ ├── 5by5.tv.txt │ ├── bez.es.txt │ ├── catb.org.txt │ ├── hanselman.com.txt │ ├── houstonchronicle.com.txt │ ├── indiehackers.com.txt │ ├── instagr.am.txt │ ├── kathimerini.gr.txt │ ├── labs.mwrinfosecurity.com.txt │ ├── luminous-landscape.com.txt │ ├── mobilenet.cz.txt │ ├── muycomputerpro.com.txt │ ├── okfn.de.txt │ ├── scnsrc.me.txt │ ├── singularityhub.com.txt │ ├── smarthomebeginner.com.txt │ ├── tabletmag.com.txt │ ├── vedomosti.ru.txt │ ├── zoomit.ir.txt │ ├── 43folders.com.txt │ ├── bernama.com.txt │ ├── brooksreview.net.txt │ ├── chomsky.info.txt │ ├── ciperchile.cl.txt │ ├── dcurt.is.txt │ ├── developers.facebook.com.txt │ ├── elmalpensante.com.txt │ ├── indiatimes.com.txt │ ├── openthemagazine.com.txt │ ├── plzkthxbai.com.txt │ ├── scinfolex.com.txt │ ├── toolsandtoys.net.txt │ ├── book.douban.com.txt │ ├── delong.typepad.com.txt │ ├── gameswirtschaft.de.txt │ ├── groups.drupal.org.txt │ ├── informationclearinghouse.info.txt │ ├── itavisen.no.txt │ ├── keyboardmag.com.txt │ ├── kingarthurflour.com.txt │ ├── lifehack.org.txt │ ├── m.xkcd.com.txt │ ├── nj.com.txt │ ├── onlinewelten.com.txt │ ├── parliament.uk.txt │ ├── pinterest.com.txt │ ├── pittsburghpanthers.com.txt │ ├── spin.com.txt │ ├── thethaovanhoa.vn.txt │ ├── trailer.web-view.net.txt │ ├── xlsemanal.com.txt │ ├── amptoons.com.txt │ ├── dadall.info.txt │ ├── linuxnix.com.txt │ ├── mactechnews.de.txt │ ├── marcvidal.net.txt │ ├── moo.nac.uci.edu.txt │ ├── pjmedia.com.txt │ ├── real.gr.txt │ ├── steamcommunity.com.txt │ ├── thenetworkgarden.blogs.com.txt │ ├── thepointmag.com.txt │ ├── ux.artu.tv.txt │ ├── arduino-tutorial.de.txt │ ├── ascarter.net.txt │ ├── buquad.com.txt │ ├── hazlitt.net.txt │ ├── health.com.txt │ ├── histoire-filante.fr.txt │ ├── mesec.cz.txt │ ├── pandodaily.com.txt │ ├── philstar.com.txt │ ├── racjonalista.pl.txt │ ├── rom-game.fr.txt │ ├── tbray.org.txt │ ├── 24a11y.com.txt │ ├── deia.com.txt │ ├── halo.bungie.org.txt │ ├── 
jandan.net.txt │ ├── singaporeanstocksinvestor.blogspot.com.txt │ ├── slog.thestranger.com.txt │ ├── utiliser-lightroom.com.txt │ ├── www2.cnrs.fr.txt │ ├── cars.com.txt │ ├── gocomics.com.txt │ ├── gurusblog.com.txt │ ├── isource.com.txt │ ├── maitre-eolas.fr.txt │ ├── protonmail.com.txt │ ├── roughtype.com.txt │ ├── ruhlman.com.txt │ ├── wordpress.org.txt │ ├── wz-newsline.de.txt │ ├── 37signals.com.txt │ ├── 7newsbelize.com.txt │ ├── bjango.com.txt │ ├── blog.chriszacharias.com.txt │ ├── blog.twitter.com.txt │ ├── blog.wells.ee.txt │ ├── borderhouseblog.com.txt │ ├── business2community.com.txt │ ├── communities-dominate.blogs.com.txt │ ├── hespress.com.txt │ ├── hometheaterreview.com.txt │ ├── jacobinmag.com.txt │ ├── linux-magazin.de.txt │ ├── manga-news.com.txt │ ├── maxim.com.txt │ ├── nosalty.hu.txt │ ├── palmbeachpost.com.txt │ ├── propakistani.pk.txt │ ├── retractionwatch.com.txt │ ├── shifteleven.com.txt │ ├── techpinions.com.txt │ ├── thewirecutter.com.txt │ ├── tuaw.com.txt │ ├── wpmayor.com.txt │ ├── alsacreations.com.txt │ ├── ciaosamin.com.txt │ ├── cjr.org.txt │ ├── filamentgroup.com.txt │ ├── geeksofdoom.com.txt │ ├── higcapital.com.txt │ ├── mforum.cari.com.my.txt │ ├── mikeash.com.txt │ ├── neunetz.com.txt │ ├── omicrono.elespanol.com.txt │ ├── pharmazeutische-zeitung.de.txt │ ├── readability.com.txt │ ├── robots.thoughtbot.com.txt │ ├── seattletransitblog.com.txt │ ├── thinkprogress.org.txt │ ├── voltairenet.org.txt │ ├── basicthinking.de.txt │ ├── blog.eleven-labs.com.txt │ ├── diagonalperiodico.net.txt │ ├── ecranlarge.com.txt │ ├── heise-online.mobi.txt │ ├── humantransit.org.txt │ ├── inhabitat.com.txt │ ├── inquirer.com.txt │ ├── menshealth.com.sg.txt │ ├── rasgolatente.es.txt │ ├── sayidaty.net.txt │ ├── squashed.tumblr.com.txt │ ├── theage.com.au.txt │ ├── tijd.be.txt │ ├── toolinux.com.txt │ ├── adslzone.net.txt │ ├── blog.pinboard.in.txt │ ├── boundlessline.org.txt │ ├── engineering.tumblr.com.txt │ ├── gurumed.org.txt │ ├── hvg.hu.txt 
│ ├── papodehomem.com.br.txt │ ├── quantamagazine.org.txt │ ├── rachelandrew.co.uk.txt │ ├── rezeptwelt.de.txt │ ├── techcommunity.microsoft.com.txt │ ├── devlinsangle.blogspot.co.at.txt │ ├── glazman.org.txt │ ├── gnppn.fr.txt │ ├── hiphopleeft.nl.txt │ ├── icannabis.tumblr.com.txt │ ├── ilyabirman.ru.txt │ ├── itmedia.co.jp.txt │ ├── lehollandaisvolant.net.txt │ ├── nojesguiden.se.txt │ ├── rpgsite.net.txt │ ├── useit.com.txt │ ├── vitispr.com.txt │ ├── yostivanich.com.txt │ ├── 24.ae.txt │ ├── acroswing.fr.txt │ ├── gawker.com.txt │ ├── huffingtonpost.fr.txt │ ├── inessential.com.txt │ ├── omiliya.org.txt │ ├── popehat.com.txt │ ├── timeshighereducation.com.txt │ ├── accesstoinsight.org.txt │ ├── addendum.org.txt │ ├── americandrink.net.txt │ ├── blog.dropbox.com.txt │ ├── da.feedsportal.com.txt │ ├── ebay.com.txt │ ├── elmundo.es.txt │ ├── firstthings.com.txt │ ├── grafikart.fr.txt │ ├── itwire.com.txt │ ├── lezephyrmag.com.txt │ ├── libcom.org.txt │ ├── mintpressnews.com.txt │ ├── msdn.microsoft.com.txt │ ├── n0where.net.txt │ ├── pcmag.com.txt │ ├── politifact.com.txt │ ├── searchenginejournal.com.txt │ ├── telerama.fr.txt │ ├── thedrive.com.txt │ ├── timeshighereducation.co.uk.txt │ ├── wiki.guildwars.com.txt │ ├── 36kr.com.txt │ ├── annouchka.fr.txt │ ├── folklore.org.txt │ ├── gizmodo.uol.com.br.txt │ ├── haberler.com.txt │ ├── linuxjournal.com.txt │ ├── marco.org.txt │ ├── medialens.org.txt │ ├── nakedsecurity.sophos.com.txt │ ├── pastebin.com.txt │ ├── resume.se.txt │ ├── splinternews.com.txt │ ├── thesimpledollar.com.txt │ ├── wmpoweruser.com.txt │ ├── albayan.ae.txt │ ├── amandala.com.bz.txt │ ├── annatravelling.wordpress.com.txt │ ├── blog.kaelig.fr.txt │ ├── econlog.econlib.org.txt │ ├── ekultura.hu.txt │ ├── franceculture.fr.txt │ ├── gizmodo.co.uk.txt │ ├── gofugyourself.com.txt │ ├── healthletter.mayoclinic.com.txt │ ├── kottke.org.txt │ ├── netzpolitik.org.txt │ ├── phoronix.com.txt │ ├── usfirst.org.txt │ ├── warriordudimanche.net.txt │ ├── 
wiki.guildwars2.com.txt │ ├── aclu.org.txt │ ├── actualitte.com.txt │ ├── blog.mozilla.org.txt │ ├── coffeecircle.com.txt │ ├── csswizardry.com.txt │ ├── digital-photography-school.com.txt │ ├── enikos.gr.txt │ ├── fictionpress.com.txt │ ├── framablog.org.txt │ ├── generation-nt.com.txt │ ├── information.dk.txt │ ├── itsfoss.com.txt │ ├── kickstarter.com.txt │ ├── linux.com.txt │ ├── marmiton.org.txt │ ├── mentalfloss.com.txt │ ├── mirrorfootball.co.uk.txt │ ├── n-tv.de.txt │ ├── outsideonline.com.txt │ ├── parislemon.com.txt │ ├── venturebeat.com.txt │ ├── watoday.com.au.txt │ ├── alternet.org.txt │ ├── android-developers.googleblog.com.txt │ ├── autoblog.com.txt │ ├── gizmodo.com.txt │ ├── globalgrind.com.txt │ ├── hacks.mozilla.org.txt │ ├── jalopnik.com.txt │ ├── kotaku.com.txt │ ├── mlssoccer.com.txt │ ├── news.rambler.ru.txt │ ├── theinventory.com.txt │ ├── tvtropes.org.txt │ ├── whatever.scalzi.com.txt │ ├── aftenposten.no.txt │ ├── andy-bell.design.txt │ ├── asymco.com.txt │ ├── chrisltd.com.txt │ ├── christies.com.txt │ ├── css-tricks.com.txt │ ├── deadspin.com.txt │ ├── dev.to.txt │ ├── fivethirtyeight.com.txt │ ├── globalresearch.ca.txt │ ├── lifestyle.inquirer.net.txt │ ├── thetakeout.com.txt │ ├── blog.naver.com.txt │ ├── blogs.hbr.org.txt │ ├── computerworld.dk.txt │ ├── core77.com.txt │ ├── jezebel.com.txt │ ├── juppy.org.txt │ ├── mobile.lemondeinformatique.fr.txt │ ├── netzoekonom.de.txt │ ├── ontologicalgeek.com.txt │ ├── preparedfoods.com.txt │ ├── sydsvenskan.se.txt │ ├── techstage.de.txt │ ├── theonion.com.txt │ ├── wow.joystiq.com.txt │ ├── boagworld.com.txt │ ├── eleconomista.es.txt │ ├── idlewords.com.txt │ ├── mactalk.com.au.txt │ ├── newrepublic.com.txt │ ├── pathawks.com.txt │ ├── recode.net.txt │ ├── straightdope.com.txt │ ├── thrillist.com.txt │ ├── tomshardware.com.txt │ ├── trailerzone.de.txt │ ├── uefa.com.txt │ ├── washingtoninstitute.org.txt │ ├── worldpoultry.net.txt │ ├── xatakaciencia.com.txt │ ├── 
americastestkitchenfeed.com.txt │ ├── antirez.com.txt │ ├── blog.instagram.com.txt │ ├── blog.pchome.net.txt │ ├── daringfireball.net.txt │ ├── estadao.com.br.txt │ ├── gatopardo.com.txt │ ├── hackmake.org.txt │ ├── hurriyet.com.tr.txt │ ├── martinfowler.com.txt │ ├── nbnnews.com.au.txt │ ├── net-security.org.txt │ ├── rodrigo.sharpcube.com.txt │ ├── thegreatdiscontent.com.txt │ ├── theroot.com.txt │ ├── tomdispatch.com.txt │ ├── brainpickings.org.txt │ ├── champeau.info.txt │ ├── fanfiction.net.txt │ ├── iphonehacks.com.txt │ ├── news.com.au.txt │ ├── nrc.nl.txt │ ├── ntoskrnl.org.txt │ ├── planetvita.de.txt │ ├── puri.sm.txt │ ├── winfuture.de.txt │ ├── 24ways.org.txt │ ├── abc.es.txt │ ├── aws.amazon.com.txt │ ├── pittsburghmagazine.com.txt │ ├── privacyinternational.org.txt │ ├── prog21.dadgum.com.txt │ ├── scotusblog.com.txt │ ├── smbc-comics.com.txt │ ├── songshuhui.net.txt │ ├── trailers.apple.com.txt │ ├── cmswire.com.txt │ ├── habrahabr.ru.txt │ ├── hosted.ap.org.txt │ ├── ipadclub.nl.txt │ └── kenrockwell.com.txt ├── index.php ├── custom │ └── index.php └── README.txt ├── cache ├── index.php ├── rss │ └── index.php ├── rss-with-key │ └── index.php └── urls │ └── index.php ├── robots.txt ├── images └── agplv3.png ├── libraries ├── DisableSimplePieSanitize.php └── html5php │ └── HTML5 │ ├── Exception.php │ └── Parser │ └── ParseError.php └── app.json /.gitignore: -------------------------------------------------------------------------------- 1 | custom_config.php -------------------------------------------------------------------------------- /_config.yml: -------------------------------------------------------------------------------- 1 | theme: jekyll-theme-cayman -------------------------------------------------------------------------------- /vendor/composer/installed.json: -------------------------------------------------------------------------------- 1 | [] 2 | -------------------------------------------------------------------------------- 
/Procfile: -------------------------------------------------------------------------------- 1 | web: vendor/bin/heroku-php-nginx 2 | -------------------------------------------------------------------------------- /site_config/standard/version.txt: -------------------------------------------------------------------------------- 1 | 2014-05-05T08:36:15Z -------------------------------------------------------------------------------- /site_config/standard/getpocket.com.txt: -------------------------------------------------------------------------------- 1 | http_header(user-agent): PHP/5.3 -------------------------------------------------------------------------------- /cache/index.php: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /site_config/custom/index.php: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /site_config/standard/what-if.xkcd.com.txt: -------------------------------------------------------------------------------- 1 | autodetect_next_page: no 2 | test_url: http://what-if.xkcd.com/1/ -------------------------------------------------------------------------------- /site_config/standard/lukew.com.txt: -------------------------------------------------------------------------------- 1 | title: //h1 2 | 3 | test_url: https://www.lukew.com/ff/entry.asp?1995 4 | -------------------------------------------------------------------------------- /site_config/standard/soundcity.tv.txt: -------------------------------------------------------------------------------- 1 | strip_id_or_class: sharing 2 | 3 | test_url: http://soundcity.tv/feed/ 4 | -------------------------------------------------------------------------------- /site_config/standard/crimemagazine.com.txt: 
-------------------------------------------------------------------------------- 1 | autodetect_next_page: no 2 | test_url: http://www.crimemagazine.com/son-sam -------------------------------------------------------------------------------- /site_config/standard/ht.ly.txt: -------------------------------------------------------------------------------- 1 | single_page_link: //iframe[@id='hootFrame']/@src 2 | 3 | test_url: http://ht.ly/bOiZV -------------------------------------------------------------------------------- /site_config/standard/the-magazine.org.txt: -------------------------------------------------------------------------------- 1 | tidy: no 2 | 3 | test_url: http://the-magazine.org/1/alone-together-again -------------------------------------------------------------------------------- /site_config/standard/pxlnv.com.txt: -------------------------------------------------------------------------------- 1 | date: //main//time/@datetime 2 | 3 | test_url: https://pxlnv.com/blog/bullshit-web/ 4 | -------------------------------------------------------------------------------- /site_config/standard/alex.mullr.net.txt: -------------------------------------------------------------------------------- 1 | body: //div[@class="entry"] 2 | test_url: http://alex.mullr.net/blog/2011/05/on-spotify/ -------------------------------------------------------------------------------- /site_config/standard/chareidi.org.txt: -------------------------------------------------------------------------------- 1 | title: //h1 2 | test_url: http://www.chareidi.org/archives5772/tetzaveh/TZV72adraft.htm -------------------------------------------------------------------------------- /site_config/standard/opensource.org.txt: -------------------------------------------------------------------------------- 1 | body: //div[@class='content clear-block'] 2 | test_url: http://opensource.org/node/537 -------------------------------------------------------------------------------- 
/site_config/standard/snip.ly.txt: -------------------------------------------------------------------------------- 1 | single_page_link: //meta[@property="og:url"]/@content 2 | 3 | test_url: http://snip.ly/qa1R -------------------------------------------------------------------------------- /site_config/standard/techmeme.com.txt: -------------------------------------------------------------------------------- 1 | single_page_link_in_feed: //b/a 2 | 3 | test_url: http://www.techmeme.com/feed.xml 4 | -------------------------------------------------------------------------------- /site_config/standard/blog.fefe.de.txt: -------------------------------------------------------------------------------- 1 | title: //h2 2 | date: //h3 3 | body: //ul 4 | 5 | test_url: http://blog.fefe.de/?ts=b063bf55 -------------------------------------------------------------------------------- /site_config/standard/axesslab.com.txt: -------------------------------------------------------------------------------- 1 | title: //h1[@id="main-content"] 2 | 3 | test_url: https://axesslab.com/disabled-buttons-suck/ 4 | -------------------------------------------------------------------------------- /site_config/standard/bitelia.com.txt: -------------------------------------------------------------------------------- 1 | body: //*[(@class = "historia")] 2 | test_url: http://bitelia.com/2011/09/klout-midiendo-influencia -------------------------------------------------------------------------------- /site_config/standard/blog.spu.edu.txt: -------------------------------------------------------------------------------- 1 | body://div[@class='post'] 2 | test_url: http://blog.spu.edu/lectio/from-the-frying-pan-into-the-fire/ -------------------------------------------------------------------------------- /site_config/standard/ecetia.com.txt: -------------------------------------------------------------------------------- 1 | body: //*[(@class = "historia")] 2 | test_url: 
http://ecetia.com/2011/09/vida-de-jugon-vii-las-tres-es -------------------------------------------------------------------------------- /site_config/standard/extracine.com.txt: -------------------------------------------------------------------------------- 1 | body: //*[(@class = "historia")] 2 | test_url: http://extracine.com/2011/09/straw-dogs-la-original -------------------------------------------------------------------------------- /site_config/standard/help.fivefilters.org.txt: -------------------------------------------------------------------------------- 1 | title: //div[@class="title"]/h3 2 | date: substring-after(//div[@class="meta"], ": ") 3 | -------------------------------------------------------------------------------- /site_config/standard/jjahnke.net.txt: -------------------------------------------------------------------------------- 1 | body: //div[@class='entry'] 2 | prune: no 3 | 4 | test_url: http://www.jjahnke.net/rundbr87.html#2514 -------------------------------------------------------------------------------- /site_config/standard/kumailplus.com.txt: -------------------------------------------------------------------------------- 1 | body: //div[@class = "entry-full"] 2 | 3 | test_url: http://www.kumailplus.com/2011/12/02/24308 -------------------------------------------------------------------------------- /site_config/standard/luxuo.com.txt: -------------------------------------------------------------------------------- 1 | body: //div[@class='post-content'] 2 | prune: no 3 | 4 | test_url: http://www.luxuo.com/watches/feed -------------------------------------------------------------------------------- /site_config/standard/t3n.de.txt: -------------------------------------------------------------------------------- 1 | next_page_link: //link[@rel='next'] 2 | 3 | test_url: http://t3n.de/news/zukunftstag-2017-t3n-818436/ 4 | -------------------------------------------------------------------------------- 
/site_config/standard/unherd.com.txt: -------------------------------------------------------------------------------- 1 | strip_id_or_class: ref-ar 2 | 3 | test_url: https://unherd.com/2019/09/labours-brexit-shambles/ 4 | -------------------------------------------------------------------------------- /site_config/standard/zhuanlan.zhihu.com.txt: -------------------------------------------------------------------------------- 1 | http_header(user-agent): PHP/7.2 2 | 3 | test_url: https://zhuanlan.zhihu.com/p/67184988 4 | -------------------------------------------------------------------------------- /site_config/standard/facta.co.jp.txt: -------------------------------------------------------------------------------- 1 | body: //div[@class='content'] 2 | 3 | test_url: http://facta.co.jp/blog/archives/20111026001026.html 4 | -------------------------------------------------------------------------------- /site_config/standard/mattcutts.com.txt: -------------------------------------------------------------------------------- 1 | date: //*[@class = 'published'] 2 | test_url: http://www.mattcutts.com/blog/internet-censorship-sopa/ -------------------------------------------------------------------------------- /site_config/standard/meowni.ca.txt: -------------------------------------------------------------------------------- 1 | author: //meta[@name="author"]/@content 2 | 3 | test_url: https://meowni.ca/posts/2017-puppeteer-tests/ 4 | -------------------------------------------------------------------------------- /site_config/standard/motorfull.com.txt: -------------------------------------------------------------------------------- 1 | body: //*[(@class = "historia")] 2 | test_url: http://motorfull.com/2011/09/aparca-valeo-park4u-remote -------------------------------------------------------------------------------- /site_config/standard/roy.gbiv.com.txt: -------------------------------------------------------------------------------- 1 | strip_comments: no 2 | 
test_url: http://roy.gbiv.com/untangled/2008/rest-apis-must-be-hypertext-driven -------------------------------------------------------------------------------- /site_config/standard/512pixels.net.txt: -------------------------------------------------------------------------------- 1 | title: //meta[@property='og:title']/@content 2 | test_url: http://www.512pixels.net/blog/2014/10/the-move 3 | -------------------------------------------------------------------------------- /site_config/standard/apple.news.txt: -------------------------------------------------------------------------------- 1 | single_page_link: //p//a[contains(., 'Click here')] 2 | test_url: https://apple.news/AHQREjzH0Ts6iikKhNe6o8w 3 | -------------------------------------------------------------------------------- /site_config/standard/elance.com.txt: -------------------------------------------------------------------------------- 1 | body: //div[@id='jobDesc-bd']/p 2 | 3 | test_url: http://www.elance.com/j/xml-technical-intergration/23687172/ -------------------------------------------------------------------------------- /site_config/standard/getnews.jp.txt: -------------------------------------------------------------------------------- 1 | body: //div[@class='post'] 2 | strip: //ul[@id='bookmark_single'] 3 | test_url: http://getnews.jp/archives/117312 -------------------------------------------------------------------------------- /site_config/standard/jamesclear.com.txt: -------------------------------------------------------------------------------- 1 | body: //div[contains(@class, 'entry-content')] 2 | 3 | test_url: https://jamesclear.com/procrastination 4 | -------------------------------------------------------------------------------- /site_config/standard/lostgarden.com.txt: -------------------------------------------------------------------------------- 1 | prune: no 2 | convert_double_br_tags: yes 3 | test_url: http://www.lostgarden.com/2012/04/loops-and-arcs.html 
-------------------------------------------------------------------------------- /site_config/standard/mbl.is.txt: -------------------------------------------------------------------------------- 1 | body: //div[@class="frett-main"] 2 | test_url: http://mbl.is/frettir/innlent/2012/02/21/litill_munur_a_fargjaldaverdi/ -------------------------------------------------------------------------------- /site_config/standard/n.survol.fr.txt: -------------------------------------------------------------------------------- 1 | title: //h1 2 | date: //header//time/@datetime 3 | 4 | test_url: https://n.survol.fr/n/gerer-son-potager 5 | -------------------------------------------------------------------------------- /site_config/standard/acidcow.com.txt: -------------------------------------------------------------------------------- 1 | body: //div[starts-with(@id, 'news-id-')] 2 | 3 | test_url: http://acidcow.com/fun/20933-acid-picdump-83-pics.html -------------------------------------------------------------------------------- /site_config/standard/alseraj.net.txt: -------------------------------------------------------------------------------- 1 | title: //*[@id='normalfontyellow'] 2 | test_url: http://www.alseraj.net/cgi-bin/pros/av/LeqaTextDisplay.cgi?display&2 -------------------------------------------------------------------------------- /site_config/standard/blogs.gnome.org.txt: -------------------------------------------------------------------------------- 1 | http_header(user-agent): PHP/7.2 2 | 3 | test_url: https://blogs.gnome.org/aday/2017/08/08/the-gnome-way/ 4 | -------------------------------------------------------------------------------- /site_config/standard/kachestvo.ru.txt: -------------------------------------------------------------------------------- 1 | body: //div[contains(@class, 'inner_content')] 2 | 3 | test_url: http://kachestvo.ru/promtovar/odezhda/denim.html -------------------------------------------------------------------------------- 
/site_config/standard/monkeyzen.com.txt: -------------------------------------------------------------------------------- 1 | body: //*[(@class = "historia")] 2 | test_url: http://monkeyzen.com/2011/09/siluetas-de-clasicos-a-modo-de-vinilos -------------------------------------------------------------------------------- /site_config/standard/news.ycombinator.com.txt: -------------------------------------------------------------------------------- 1 | strip_comments: no 2 | strip: //a[. = 'reply'] 3 | test_url: http://news.ycombinator.com/item?id=1516461 -------------------------------------------------------------------------------- /site_config/standard/paquier.xyz.txt: -------------------------------------------------------------------------------- 1 | body: //div[@class='post'] 2 | 3 | test_url: http://paquier.xyz/postgresql-2/postgres-10-incompatible-changes/ 4 | -------------------------------------------------------------------------------- /site_config/standard/allafrica.com.txt: -------------------------------------------------------------------------------- 1 | http_header(user-agent): PHP/7.0 2 | 3 | test_url: http://allafrica.com/tools/headlines/rdf/latest/headlines.rdf 4 | -------------------------------------------------------------------------------- /site_config/standard/carlchenet.com.txt: -------------------------------------------------------------------------------- 1 | date: //time/@datetime 2 | 3 | test_url: https://carlchenet.com/foss-passive-consumerism-kills-our-community/ 4 | -------------------------------------------------------------------------------- /site_config/standard/doc.wallabag.org.txt: -------------------------------------------------------------------------------- 1 | body: //section[contains(@class, 'normal')] 2 | 3 | test_url: https://doc.wallabag.org/en/user/filters.html 4 | -------------------------------------------------------------------------------- /site_config/standard/eternabuenosaires.com.txt: 
-------------------------------------------------------------------------------- 1 | body: //*[(@class = "historia")] 2 | test_url: http://eternabuenosaires.com/2011/09/calle-adolfo-bioy-casares -------------------------------------------------------------------------------- /site_config/standard/fakirpresse.info.txt: -------------------------------------------------------------------------------- 1 | author: //a[@class="url fn spip_in"] 2 | 3 | test_url: https://www.fakirpresse.info/les-patrons-ca-osent-tout 4 | -------------------------------------------------------------------------------- /site_config/standard/fivefilters.org.txt: -------------------------------------------------------------------------------- 1 | body: //section[contains(@class, 'container')] 2 | prune: no 3 | 4 | test_url: http://fivefilters.org/kindle-it/ 5 | -------------------------------------------------------------------------------- /site_config/standard/fok.nl.txt: -------------------------------------------------------------------------------- 1 | # skip cookie warning 2 | single_page_link: concat(//form/@action, '?allowcookies=yes') 3 | 4 | test_url: http://fok.nl/687116 -------------------------------------------------------------------------------- /site_config/standard/gist.github.com.txt: -------------------------------------------------------------------------------- 1 | body: //div[@class="highlight"]/pre 2 | 3 | prune: no 4 | tidy: no 5 | 6 | test_url: https://gist.github.com/1258908 -------------------------------------------------------------------------------- /site_config/standard/gsmarena.com.txt: -------------------------------------------------------------------------------- 1 | next_page_link: //a[@class='pages-next'] 2 | 3 | test_url: http://www.gsmarena.com/samsung_galaxy_j2-review-1348.php -------------------------------------------------------------------------------- /site_config/standard/indehekken.net.txt: 
-------------------------------------------------------------------------------- 1 | body: //div[@class='post-entry']/p 2 | 3 | test_url: http://www.indehekken.net/you-only-sing-when-youre-rowing/ 4 | -------------------------------------------------------------------------------- /site_config/standard/macdrifter.com.txt: -------------------------------------------------------------------------------- 1 | title: substring-before(//title,' « Macdrifter') 2 | test_url: http://www.macdrifter.com/2012/03/instacast-on-my-mac/ -------------------------------------------------------------------------------- /site_config/standard/marksdailyapple.com.txt: -------------------------------------------------------------------------------- 1 | strip_id_or_class: wwsgd 2 | test_url: http://www.marksdailyapple.com/are-detoxes-and-cleanses-safe-and-effective/ -------------------------------------------------------------------------------- /site_config/standard/osmand.net.txt: -------------------------------------------------------------------------------- 1 | title: //div[@class="article"]//h2 2 | date: //meta/@pubdate 3 | 4 | test_url: https://osmand.net/blog/guideline-pt 5 | -------------------------------------------------------------------------------- /site_config/standard/summitroute.com.txt: -------------------------------------------------------------------------------- 1 | prune: no 2 | 3 | test_url: https://summitroute.com/blog/2015/12/24/instagram_bounty_case_study_for_defense/ 4 | -------------------------------------------------------------------------------- /site_config/standard/zerokspot.com.txt: -------------------------------------------------------------------------------- 1 | title: //h1 2 | body: //div[@id="primarycontent"] 3 | test_url: http://zerokspot.com/weblog/2011/06/26/europython2011/ -------------------------------------------------------------------------------- /site_config/standard/blog.imirhil.fr.txt: 
-------------------------------------------------------------------------------- 1 | date: //section[@id="post"]//h1//time 2 | 3 | test_url: https://blog.imirhil.fr/2019/11/13/first-party-tracker.html 4 | -------------------------------------------------------------------------------- /site_config/standard/dagogtid.no.txt: -------------------------------------------------------------------------------- 1 | title: //span[@class = 'overskriftEkstrastor'] 2 | author: //em/a 3 | 4 | test_url: http://dagogtid.no/nyhet.cfm?nyhetid=2414 -------------------------------------------------------------------------------- /site_config/standard/dailydot.com.txt: -------------------------------------------------------------------------------- 1 | tidy: no 2 | body: //article 3 | 4 | test_url: http://www.dailydot.com/entertainment/tumblr-christopher-price-topherchris/ -------------------------------------------------------------------------------- /site_config/standard/drdobbs.com.txt: -------------------------------------------------------------------------------- 1 | single_page_link: //a[contains(@href, '/article/print')] 2 | test_url: http://www.drdobbs.com/architecture-and-design/240001128 -------------------------------------------------------------------------------- /site_config/standard/flyingmachinestudios.com.txt: -------------------------------------------------------------------------------- 1 | strip_id_or_class: linenos 2 | test_url: http://www.flyingmachinestudios.com/programming/whoops-dci-refactoring/ -------------------------------------------------------------------------------- /site_config/standard/gizmovil.com.txt: -------------------------------------------------------------------------------- 1 | body: //*[(@class = "historia")] 2 | test_url: http://gizmovil.com/2011/09/hipertextual-labs-receptor-bluetooth-nokia-bh-214 -------------------------------------------------------------------------------- /site_config/standard/goodfil.ms.txt: 
-------------------------------------------------------------------------------- 1 | strip_id_or_class: gutter 2 | test_url: http://goodfil.ms/blog/posts/2012/08/13/angularjs-and-the-goodfilms-mobile-site-part-1/ -------------------------------------------------------------------------------- /site_config/standard/je-suis-papa.com.txt: -------------------------------------------------------------------------------- 1 | strip: //noscript 2 | 3 | test_url: http://www.je-suis-papa.com/pandacraft-kit-educatif-creatif-abonnement-12-ans/ 4 | -------------------------------------------------------------------------------- /site_config/standard/staltz.com.txt: -------------------------------------------------------------------------------- 1 | author: //h2[@class="name-title"] 2 | 3 | test_url: https://staltz.com/a-plan-to-rescue-the-web-from-the-internet.html 4 | -------------------------------------------------------------------------------- /site_config/standard/stjv.fr.txt: -------------------------------------------------------------------------------- 1 | date: //time[contains(@class, 'published')]/@datetime 2 | 3 | test_url: https://www.stjv.fr/2018/01/au-sujet-quantic-dream/ 4 | -------------------------------------------------------------------------------- /site_config/standard/appleweblog.com.txt: -------------------------------------------------------------------------------- 1 | body: //*[(@class = "historia")] 2 | test_url: http://appleweblog.com/2011/09/encontrada-vulnerabilidad-grave-en-skype-para-ios -------------------------------------------------------------------------------- /site_config/standard/dropbox.com.txt: -------------------------------------------------------------------------------- 1 | single_page_link: //a[@id='download_button_link'] 2 | 3 | test_url: https://www.dropbox.com/s/qmocfrco2t0d28o/Fluffbeast.docx 4 | -------------------------------------------------------------------------------- /site_config/standard/gihyo.jp.txt: 
-------------------------------------------------------------------------------- 1 | single_page_link: //p[@id='skip']//a[contains(@href, 'skip')] 2 | 3 | test_url: http://gihyo.jp/dev/serial/01/machine-learning/0010 -------------------------------------------------------------------------------- /site_config/standard/hiperpop.com.txt: -------------------------------------------------------------------------------- 1 | body: //*[(@class = "historia")] 2 | test_url: http://hiperpop.com/2011/09/marc-anthony-celebra-su-cumpleanos-con-jennifer-lopez -------------------------------------------------------------------------------- /site_config/standard/jungle-world.com.txt: -------------------------------------------------------------------------------- 1 | title: //h1 2 | body: //div[contains(@class,'story')] 3 | test_url: http://jungle-world.com/artikel/2015/02/51207.html 4 | -------------------------------------------------------------------------------- /site_config/standard/krone.at.txt: -------------------------------------------------------------------------------- 1 | body: //div[contains(concat(' ',normalize-space(@class),' '),' kmm-article-box ')] 2 | 3 | test_url: https://www.krone.at/1941895 4 | -------------------------------------------------------------------------------- /site_config/standard/panic.com.txt: -------------------------------------------------------------------------------- 1 | body: //div[@class='entry'] 2 | date: //h3[@class='postDate'] 3 | test_url: http://www.panic.com/blog/2011/07/panic-is-ready-for-lion/ -------------------------------------------------------------------------------- /site_config/standard/tofugu.com.txt: -------------------------------------------------------------------------------- 1 | body://div[@class='entry-content'] 2 | 3 | test_url: http://www.tofugu.com/2015/07/20/interview-with-toriena-japanese-chiptune/ 4 | -------------------------------------------------------------------------------- 
/site_config/standard/urbandictionary.com.txt: -------------------------------------------------------------------------------- 1 | title: //title 2 | body: //table[@id='entries'] 3 | test_url: http://www.urbandictionary.com/define.php?term=Grown-Ass 4 | -------------------------------------------------------------------------------- /site_config/standard/vg.no.txt: -------------------------------------------------------------------------------- 1 | body: //div[@id='artikkelspalte'] 2 | strip_id_or_class: 'breadcrumb' 3 | test_url: http://www.vg.no/spill/artikkel.php?artid=10003628 -------------------------------------------------------------------------------- /site_config/standard/warnerbros.fr.txt: -------------------------------------------------------------------------------- 1 | body: //div[@class="article-body"] 2 | test_url: https://www.warnerbros.fr/articles/magic-mike-xxl-adam-rodriguez-portrait 3 | -------------------------------------------------------------------------------- /site_config/standard/zataz.com.txt: -------------------------------------------------------------------------------- 1 | title: //h1[@class="blog-title"] 2 | 3 | test_url: https://www.zataz.com/bientot-noel-securisons-le-prochain-pc-de-la-famille/ 4 | -------------------------------------------------------------------------------- /site_config/standard/LICENSE.txt: -------------------------------------------------------------------------------- 1 | These files are released to the public domain. 2 | 3 | See https://creativecommons.org/publicdomain/zero/1.0/ for more information. 
4 | -------------------------------------------------------------------------------- /site_config/standard/altfoto.com.txt: -------------------------------------------------------------------------------- 1 | body: //*[(@class = "historia")] 2 | test_url: http://altfoto.com/2011/09/nikon-presenta-su-nuevo-sistema-nikon-1-y-dos-nuevas-camaras -------------------------------------------------------------------------------- /site_config/standard/blogs.forbes.com.txt: -------------------------------------------------------------------------------- 1 | body: //div[@class='entry'] 2 | test_url: http://blogs.forbes.com/adamhartung/2011/04/08/apple-is-better-managed-than-microsoft/ -------------------------------------------------------------------------------- /site_config/standard/brucelawson.co.uk.txt: -------------------------------------------------------------------------------- 1 | title: //h2[@itemprop="title"] 2 | 3 | test_url: https://www.brucelawson.co.uk/2018/the-practical-value-of-semantic-html/ 4 | -------------------------------------------------------------------------------- /site_config/standard/cucharasonica.com.txt: -------------------------------------------------------------------------------- 1 | body: //*[(@class = "historia")] 2 | test_url: http://cucharasonica.com/2011/09/queen-busca-candidatos-para-su-propia-banda-tributo -------------------------------------------------------------------------------- /site_config/standard/dansdata.com.txt: -------------------------------------------------------------------------------- 1 | autodetect_next_page: no 2 | tidy: no 3 | prune: no 4 | body: //div[@class='NoOverflow'] 5 | test_url: http://www.dansdata.com/gz129.htm -------------------------------------------------------------------------------- /site_config/standard/hipertextual.com.txt: -------------------------------------------------------------------------------- 1 | body: //*[(@class = "historia")] 2 | test_url: 
http://hipertextual.com/2011/09/banda-ancha-en-america-latina-insignificante 3 | -------------------------------------------------------------------------------- /site_config/standard/interviewmagazine.com.txt: -------------------------------------------------------------------------------- 1 | title: //title 2 | body: //div[contains(@class, 'block')] 3 | 4 | test_url: http://www.interviewmagazine.com/film/spike-jonze -------------------------------------------------------------------------------- /site_config/standard/jvt.me.txt: -------------------------------------------------------------------------------- 1 | author: //div[@class="post-details"]//a[contains(@class, "p-name")] 2 | 3 | test_url: https://www.jvt.me/posts/2019/10/20/indieweb-talk/ 4 | -------------------------------------------------------------------------------- /site_config/standard/phototrend.fr.txt: -------------------------------------------------------------------------------- 1 | author: //div[contains(@class, "vcard")] 2 | 3 | test_url: https://phototrend.fr/2019/04/mise-a-jour-luminar-3-1-0-accent-ai-2-0/ 4 | -------------------------------------------------------------------------------- /site_config/standard/portertech.ca.txt: -------------------------------------------------------------------------------- 1 | author: //*[(@class = "author")] 2 | date: //*[(@class = "date")] 3 | test_url: http://portertech.ca/2012/12/10/iac-morning-market/ -------------------------------------------------------------------------------- /site_config/standard/renenekuda.cz.txt: -------------------------------------------------------------------------------- 1 | title: //*[@class='entry-title'] 2 | body: //div[@class='entry-content'] 3 | test_url: http://www.renenekuda.cz/recept-na-produktivitu/ -------------------------------------------------------------------------------- /site_config/standard/usccb.org.txt: -------------------------------------------------------------------------------- 1 | body: 
//div[@id='CS_Element_maincontent'] 2 | 3 | tidy: no 4 | prune: no 5 | 6 | test_url: http://www.usccb.org/bible/readings/072412.cfm -------------------------------------------------------------------------------- /site_config/standard/crn.de.txt: -------------------------------------------------------------------------------- 1 | author: //p[contains(@class,'author')]/a 2 | date: //div[contains(@class,'date')] 3 | test_url: http://www.crn.de/netzwerke-tk/artikel-93103.html -------------------------------------------------------------------------------- /site_config/standard/eff.org.txt: -------------------------------------------------------------------------------- 1 | author: //meta[@name="author"]/@content 2 | 3 | test_url: https://www.eff.org/deeplinks/2018/02/john-perry-barlow-internet-pioneer-1947-2018 4 | -------------------------------------------------------------------------------- /site_config/standard/finexpert.e15.cz.txt: -------------------------------------------------------------------------------- 1 | strip_id_or_class: article-linktoanother 2 | 3 | test_url: http://finexpert.e15.cz/budiz-teplo-eu-stedre-zadotuje-nejen-plynovy-kotel -------------------------------------------------------------------------------- /site_config/standard/marigold.cz.txt: -------------------------------------------------------------------------------- 1 | http_header(accept): */* 2 | 3 | test_url: https://www.marigold.cz/item/projektovy-manazer-je-v-cesku-sproste-slovo-ke-skode-projektu 4 | -------------------------------------------------------------------------------- /site_config/standard/news.rub.de.txt: -------------------------------------------------------------------------------- 1 | body: //div[contains(concat(' ',normalize-space(@class),' '),' content-inner-inner-wrapper ')] 2 | 3 | http_header(Cookie): has_js=1 4 | -------------------------------------------------------------------------------- /site_config/standard/news.techmeme.com.txt: 
-------------------------------------------------------------------------------- 1 | body: //div[@class='main']/div[@class='item'] 2 | strip: //div[@class='right'] 3 | 4 | test_url: http://news.techmeme.com/110516/fh-rip -------------------------------------------------------------------------------- /site_config/standard/pentaxforums.com.txt: -------------------------------------------------------------------------------- 1 | next_page_link: //a[contains(., 'Next:')] 2 | test_url: http://www.pentaxforums.com/reviews/long-exposure-handhelds/introduction.html -------------------------------------------------------------------------------- /site_config/standard/pieria.co.uk.txt: -------------------------------------------------------------------------------- 1 | body: //div[@id='article'] 2 | 3 | test_url: http://www.pieria.co.uk/articles/need_a_fiscal_rule_george__try_get_the_economy_growing 4 | -------------------------------------------------------------------------------- /site_config/standard/tldp.org.txt: -------------------------------------------------------------------------------- 1 | title: //title 2 | body: //h2 | //p | //ul 3 | prune: no 4 | tidy: no 5 | 6 | test_url: http://www.tldp.org/HOWTO/Plug-and-Play-HOWTO-7.html -------------------------------------------------------------------------------- /site_config/standard/gizmologia.com.txt: -------------------------------------------------------------------------------- 1 | body: //*[(@class = "historia")] 2 | test_url: http://gizmologia.com/2011/09/amd-trinity-el-sucesor-de-llano-en-una-demostracion-muy-interesante -------------------------------------------------------------------------------- /site_config/standard/happyassassin.net.txt: -------------------------------------------------------------------------------- 1 | http_header(user-agent): PHP/7.2 2 | 3 | test_url: https://www.happyassassin.net/2014/01/25/uefi-boot-how-does-that-actually-work-then/ 4 | 
-------------------------------------------------------------------------------- /site_config/standard/iansommerville.com.txt: -------------------------------------------------------------------------------- 1 | http_header(user-agent): PHP/5.3 2 | 3 | test_url: http://iansommerville.com/blog/a-guide-to-scottish-delicacies-for-tgo-challengers/ 4 | -------------------------------------------------------------------------------- /site_config/standard/iplaysoft.com.txt: -------------------------------------------------------------------------------- 1 | body: //div[@id='content']//div[@class='entry-banner' or @class='entry-content'] 2 | test_url: http://www.iplaysoft.com/webbrowserpassview.html -------------------------------------------------------------------------------- /site_config/standard/lefilrouge.media.txt: -------------------------------------------------------------------------------- 1 | 2 | strip_id_or_class: the_champ_sharing_container 3 | 4 | test_url: https://lefilrouge.media/etats-unis-nevada-burning-man-festival/ 5 | -------------------------------------------------------------------------------- /site_config/standard/lupa.cz.txt: -------------------------------------------------------------------------------- 1 | strip_id_or_class: promo-in-article 2 | 3 | test_url: http://www.lupa.cz/clanky/michal-zamec-parfums-za-dva-roky-presahneme-obrat-6-miliard-korun/ -------------------------------------------------------------------------------- /site_config/standard/matt.might.net.txt: -------------------------------------------------------------------------------- 1 | title: //h1 2 | author: string("Matt Might") 3 | strip: //h1/following-sibling::div 4 | 5 | test_url: http://matt.might.net/articles/oo-cesk/ -------------------------------------------------------------------------------- /site_config/standard/monkeyuser.com.txt: -------------------------------------------------------------------------------- 1 | body: //div[contains(concat(' ', 
normalize-space(@class), ' '), ' content ')] 2 | 3 | test_url: https://www.monkeyuser.com/2019/v-201/ 4 | -------------------------------------------------------------------------------- /site_config/standard/radionz.co.nz.txt: -------------------------------------------------------------------------------- 1 | body: //div[@class='body'] 2 | title: //div[@class='newsstory']/h2 3 | test_url: http://www.radionz.co.nz/news/stories/2010/07/18/12481029a86d -------------------------------------------------------------------------------- /site_config/standard/sivers.org.txt: -------------------------------------------------------------------------------- 1 | body: //div[@id='content']//article 2 | 3 | strip: //header 4 | strip: //footer 5 | 6 | prune: no 7 | 8 | test_url: https://sivers.org/exex 9 | -------------------------------------------------------------------------------- /site_config/standard/thenews.coop.txt: -------------------------------------------------------------------------------- 1 | body: //div[@itemprop='articleBody'] 2 | 3 | test_url: http://www.thenews.coop/98221/news/co-operatives/jeremy-corbyn-needs-co-op-movement/ 4 | -------------------------------------------------------------------------------- /site_config/standard/turnoff.us.txt: -------------------------------------------------------------------------------- 1 | title: //h1[@class='post-title'] 2 | body: //article[@class='post-content'] 3 | test_url: https://turnoff.us/geek/the-depressed-developer-13/ 4 | -------------------------------------------------------------------------------- /site_config/standard/utdailybeacon.com.txt: -------------------------------------------------------------------------------- 1 | body: //div[@id='blox-story-text'] 2 | test_url: http://www.utdailybeacon.com/news/article_ccf6d024-0f15-11e5-ae29-9f63598deb81.html 3 | -------------------------------------------------------------------------------- /site_config/standard/worldwidewords.org.txt: 
-------------------------------------------------------------------------------- 1 | title: //p[@id='content'] 2 | 3 | body: //div[@class='contentblock'] 4 | test_url: http://www.worldwidewords.org/weirdwords/ww-gro1.htm -------------------------------------------------------------------------------- /site_config/standard/betabeat.com.txt: -------------------------------------------------------------------------------- 1 | body: //div[@class="entry-content"] 2 | test_url: http://www.betabeat.com/2011/07/04/sheryl-sandberg-breaks-through-silicon-valleys-boys-club-sort-of/ -------------------------------------------------------------------------------- /site_config/standard/cashless.pl.txt: -------------------------------------------------------------------------------- 1 | body: //div[contains(concat(' ',normalize-space(@class),' '),' post-page-content ')] 2 | 3 | test_url: https://www.cashless.pl/5465-revolut-kryzys 4 | -------------------------------------------------------------------------------- /site_config/standard/davidwalsh.name.txt: -------------------------------------------------------------------------------- 1 | author: //article//span[@itemprop="name"] 2 | strip: //div[@class="article-block"] 3 | 4 | test_url: https://davidwalsh.name/optional-chaining 5 | -------------------------------------------------------------------------------- /site_config/standard/democracynow.org.txt: -------------------------------------------------------------------------------- 1 | body: //div[contains(@class, 'blog_body')] 2 | 3 | prune: no 4 | 5 | test_url: http://www.democracynow.org/blog/2014/1/9/the_fbi_the_nsa_and_a -------------------------------------------------------------------------------- /site_config/standard/explosm.net.txt: -------------------------------------------------------------------------------- 1 | body: //img[@id='main-comic'] 2 | author: substring(//small[@class="author-credit-name"], 4) 3 | 4 | test_url: http://explosm.net/comics/3954/ 5 | 
-------------------------------------------------------------------------------- /site_config/standard/freelancer.com.txt: -------------------------------------------------------------------------------- 1 | body: //div[@id="projectDetailsContent"]//td 2 | 3 | test_url: http://www.freelancer.com/projects/PHP-Website-Design/debug-Forum-website-code.html -------------------------------------------------------------------------------- /site_config/standard/gauchiste.fr.txt: -------------------------------------------------------------------------------- 1 | date: //meta[@name="date"]/@content 2 | 3 | test_url: https://gauchiste.fr/post/2019/11/08/Un-catadioptre-vous-sauvera-(peut-%C3%AAtre)-la-vie 4 | -------------------------------------------------------------------------------- /site_config/standard/hs.fi.txt: -------------------------------------------------------------------------------- 1 | prune: yes 2 | tidy: yes 3 | test_url: http://www.hs.fi/kotimaa/Teollisuushallin%20palo%20levitt%C3%A4%C3%A4%20vaarallista%20savua%20Tuusulassa/a1305571582405 -------------------------------------------------------------------------------- /site_config/standard/izismile.com.txt: -------------------------------------------------------------------------------- 1 | body: //div[starts-with(@id, 'news-id-')] 2 | prune: no 3 | 4 | test_url: http://izismile.com/2011/06/13/uncanny_factoid_fashion_or_creepy_2_pics.html -------------------------------------------------------------------------------- /site_config/standard/jobbank.gc.ca.txt: -------------------------------------------------------------------------------- 1 | body: //div[@id='formatCont_en'] 2 | 3 | prune: no 4 | 5 | test_url: http://www.jobbank.gc.ca/detail-eng.aspx?Source=JobPosting&OrderNum=6397922 -------------------------------------------------------------------------------- /site_config/standard/mein-mmo.de.txt: -------------------------------------------------------------------------------- 1 | body: 
//div[@class='gp-entry-text'] 2 | strip: //aside 3 | 4 | test_url: http://mein-mmo.de/pokemon-go-15-staerksten-pokemon-der-2-generation/ 5 | -------------------------------------------------------------------------------- /site_config/standard/mytotalretail.com.txt: -------------------------------------------------------------------------------- 1 | title: //h1 2 | body: //div[@itemprop="content"] 3 | 4 | test_url: https://www.mytotalretail.com/article/how-site-search-could-kill-amazon/ 5 | -------------------------------------------------------------------------------- /site_config/standard/nplusonemag.com.txt: -------------------------------------------------------------------------------- 1 | title: /html/body/div[3]/div/div/h1 2 | 3 | body: //*[@id="article-body"] 4 | 5 | 6 | test_url: http://nplusonemag.com/the-outskirts-of-progress -------------------------------------------------------------------------------- /site_config/standard/signal.org.txt: -------------------------------------------------------------------------------- 1 | title: //h2[@class="post-title"] 2 | author: //h3[@class="post-subtitle"]//a 3 | 4 | test_url: https://signal.org/blog/signal-private-group-system/ 5 | -------------------------------------------------------------------------------- /site_config/standard/stumbleupon.com.txt: -------------------------------------------------------------------------------- 1 | single_page_link: //iframe[@id='tb-stumble-frame']/@src 2 | 3 | test_url: http://www.stumbleupon.com/su/35V0wB/zouchmagazine.com/poetry-violet/ -------------------------------------------------------------------------------- /site_config/standard/www3.imperial.ac.uk.txt: -------------------------------------------------------------------------------- 1 | strip_id_or_class: hidelabel 2 | test_url: http://www3.imperial.ac.uk/newsandeventspggrp/imperialcollege/newssummary/news_14-7-2010-15-53-18 -------------------------------------------------------------------------------- 
/libraries/DisableSimplePieSanitize.php: -------------------------------------------------------------------------------- 1 | ):