├── .DS_Store ├── .gitignore ├── app.yaml ├── bs4 ├── __init__.py ├── builder │ ├── __init__.py │ ├── _html5lib.py │ ├── _htmlparser.py │ └── _lxml.py ├── dammit.py ├── diagnose.py ├── element.py ├── testing.py └── tests │ ├── __init__.py │ ├── test_builder_registry.py │ ├── test_docs.py │ ├── test_html5lib.py │ ├── test_htmlparser.py │ ├── test_lxml.py │ ├── test_soup.py │ └── test_tree.py ├── cassis.py ├── dateutil ├── __init__.py ├── easter.py ├── parser.py ├── relativedelta.py ├── rrule.py ├── tz.py ├── tzwin.py └── zoneinfo │ ├── __init__.py │ └── zoneinfo-2010g.tar.gz ├── favicon.ico ├── feedparser.py ├── hfeed.html ├── hfeedello.html ├── hfeedmasto.html ├── hovercard.html ├── hovercard2.html ├── hovertest.html ├── html5lib ├── .DS_Store ├── __init__.py ├── constants.py ├── filters │ ├── __init__.py │ ├── _base.py │ ├── alphabeticalattributes.py │ ├── inject_meta_charset.py │ ├── lint.py │ ├── optionaltags.py │ ├── sanitizer.py │ └── whitespace.py ├── html5parser.py ├── ihatexml.py ├── inputstream.py ├── sanitizer.py ├── serializer │ ├── __init__.py │ └── htmlserializer.py ├── tokenizer.py ├── treeadapters │ ├── __init__.py │ └── sax.py ├── treebuilders │ ├── __init__.py │ ├── _base.py │ ├── dom.py │ ├── etree.py │ └── etree_lxml.py ├── treewalkers │ ├── __init__.py │ ├── _base.py │ ├── dom.py │ ├── etree.py │ ├── genshistream.py │ ├── lxmletree.py │ └── pulldom.py ├── trie │ ├── __init__.py │ ├── _base.py │ ├── datrie.py │ └── py.py └── utils.py ├── humanize ├── __init__.py ├── compat.py ├── filesize.py ├── i18n.py ├── locale │ ├── fr_FR │ │ └── LC_MESSAGES │ │ │ └── humanize.po │ ├── ko_KR │ │ └── LC_MESSAGES │ │ │ └── humanize.po │ └── ru_RU │ │ └── LC_MESSAGES │ │ └── humanize.po ├── number.py └── time.py ├── index.html ├── indiecard.html ├── instancelist.html ├── instances.json ├── joyline.svg ├── markedup.html ├── mf2py ├── .DS_Store ├── __init__.py ├── backcompat-rules │ ├── adr.json │ ├── geo.json │ ├── hentry.json │ ├── hfeed.json │ ├── hproduct.json 
│ ├── hrecipe.json │ ├── hresume.json │ ├── hreview-aggregate.json │ ├── hreview.json │ ├── recipe-main-info.json │ ├── vcard.json │ └── vevent.json ├── backcompat.py ├── datetime_helpers.py ├── dom_helpers.py ├── implied_properties.py ├── mf2_classes.py ├── mf_helpers.py ├── parse_property.py ├── parser.py ├── temp_fixes.py ├── value_class_pattern.py └── version.py ├── mf2tojf2.py ├── oembedcard.html ├── openanything.py ├── queue.yaml ├── requests ├── .DS_Store ├── __init__.py ├── adapters.py ├── api.py ├── auth.py ├── cacert.pem ├── certs.py ├── compat.py ├── cookies.py ├── exceptions.py ├── hooks.py ├── models.py ├── packages │ ├── __init__.py │ ├── chardet │ │ ├── __init__.py │ │ ├── big5freq.py │ │ ├── big5prober.py │ │ ├── chardetect.py │ │ ├── chardistribution.py │ │ ├── charsetgroupprober.py │ │ ├── charsetprober.py │ │ ├── codingstatemachine.py │ │ ├── compat.py │ │ ├── constants.py │ │ ├── cp949prober.py │ │ ├── escprober.py │ │ ├── escsm.py │ │ ├── eucjpprober.py │ │ ├── euckrfreq.py │ │ ├── euckrprober.py │ │ ├── euctwfreq.py │ │ ├── euctwprober.py │ │ ├── gb2312freq.py │ │ ├── gb2312prober.py │ │ ├── hebrewprober.py │ │ ├── jisfreq.py │ │ ├── jpcntx.py │ │ ├── langbulgarianmodel.py │ │ ├── langcyrillicmodel.py │ │ ├── langgreekmodel.py │ │ ├── langhebrewmodel.py │ │ ├── langhungarianmodel.py │ │ ├── langthaimodel.py │ │ ├── latin1prober.py │ │ ├── mbcharsetprober.py │ │ ├── mbcsgroupprober.py │ │ ├── mbcssm.py │ │ ├── sbcharsetprober.py │ │ ├── sbcsgroupprober.py │ │ ├── sjisprober.py │ │ ├── universaldetector.py │ │ └── utf8prober.py │ └── urllib3 │ │ ├── __init__.py │ │ ├── _collections.py │ │ ├── connection.py │ │ ├── connectionpool.py │ │ ├── contrib │ │ ├── __init__.py │ │ ├── ntlmpool.py │ │ └── pyopenssl.py │ │ ├── exceptions.py │ │ ├── fields.py │ │ ├── filepost.py │ │ ├── packages │ │ ├── __init__.py │ │ ├── ordered_dict.py │ │ ├── six.py │ │ └── ssl_match_hostname │ │ │ ├── __init__.py │ │ │ └── _implementation.py │ │ ├── poolmanager.py │ │ 
├── request.py │ │ ├── response.py │ │ └── util │ │ ├── __init__.py │ │ ├── connection.py │ │ ├── request.py │ │ ├── response.py │ │ ├── retry.py │ │ ├── ssl_.py │ │ ├── timeout.py │ │ └── url.py ├── sessions.py ├── status_codes.py ├── structures.py └── utils.py ├── shrunkeninline.html ├── shrunkensite.html ├── six.py ├── sparkline.html ├── static ├── awesomplete.min.js ├── fragmention.js ├── index.html ├── landscape.jpg └── landscape2.jpg ├── storycard.html ├── styles ├── awesomplete.css ├── hfeed.css ├── hovercard.css ├── hovercard2.css ├── indiecard.css ├── mastoview.css └── storycard.css ├── unmung.py ├── vrcard.html ├── xoxo.py └── xoxopodcast.xml /.DS_Store: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kevinmarks/unmung/5b8539971a8e1a64694e65643670936512fc987d/.DS_Store -------------------------------------------------------------------------------- /.gitignore: -------------------------------------------------------------------------------- 1 | *.pyc -------------------------------------------------------------------------------- /app.yaml: -------------------------------------------------------------------------------- 1 | application: unmung2 2 | version: 2 3 | runtime: python27 4 | api_version: 1 5 | threadsafe: true 6 | 7 | handlers: 8 | - url: /styles 9 | static_dir: styles 10 | - url: /images 11 | static_dir: images 12 | - url: /static 13 | static_dir: static 14 | - url: /.* 15 | script: unmung.application 16 | 17 | # [START libraries] 18 | libraries: 19 | - name: webapp2 20 | version: latest 21 | - name: jinja2 22 | version: latest 23 | - name: ssl 24 | version: latest 25 | - name: lxml 26 | version: latest 27 | # [END libraries] -------------------------------------------------------------------------------- /bs4/tests/__init__.py: -------------------------------------------------------------------------------- 1 | "The beautifulsoup tests." 
2 | -------------------------------------------------------------------------------- /bs4/tests/test_docs.py: -------------------------------------------------------------------------------- 1 | "Test harness for doctests." 2 | 3 | # pylint: disable-msg=E0611,W0142 4 | 5 | __metaclass__ = type 6 | __all__ = [ 7 | 'additional_tests', 8 | ] 9 | 10 | import atexit 11 | import doctest 12 | import os 13 | #from pkg_resources import ( 14 | # resource_filename, resource_exists, resource_listdir, cleanup_resources) 15 | import unittest 16 | 17 | DOCTEST_FLAGS = ( 18 | doctest.ELLIPSIS | 19 | doctest.NORMALIZE_WHITESPACE | 20 | doctest.REPORT_NDIFF) 21 | 22 | 23 | # def additional_tests(): 24 | # "Run the doc tests (README.txt and docs/*, if any exist)" 25 | # doctest_files = [ 26 | # os.path.abspath(resource_filename('bs4', 'README.txt'))] 27 | # if resource_exists('bs4', 'docs'): 28 | # for name in resource_listdir('bs4', 'docs'): 29 | # if name.endswith('.txt'): 30 | # doctest_files.append( 31 | # os.path.abspath( 32 | # resource_filename('bs4', 'docs/%s' % name))) 33 | # kwargs = dict(module_relative=False, optionflags=DOCTEST_FLAGS) 34 | # atexit.register(cleanup_resources) 35 | # return unittest.TestSuite(( 36 | # doctest.DocFileSuite(*doctest_files, **kwargs))) 37 | -------------------------------------------------------------------------------- /bs4/tests/test_htmlparser.py: -------------------------------------------------------------------------------- 1 | """Tests to ensure that the html.parser tree builder generates good 2 | trees.""" 3 | 4 | from pdb import set_trace 5 | import pickle 6 | from bs4.testing import SoupTest, HTMLTreeBuilderSmokeTest 7 | from bs4.builder import HTMLParserTreeBuilder 8 | from bs4.builder._htmlparser import BeautifulSoupHTMLParser 9 | 10 | class HTMLParserTreeBuilderSmokeTest(SoupTest, HTMLTreeBuilderSmokeTest): 11 | 12 | @property 13 | def default_builder(self): 14 | return HTMLParserTreeBuilder() 15 | 16 | def 
test_namespaced_system_doctype(self): 17 | # html.parser can't handle namespaced doctypes, so skip this one. 18 | pass 19 | 20 | def test_namespaced_public_doctype(self): 21 | # html.parser can't handle namespaced doctypes, so skip this one. 22 | pass 23 | 24 | def test_builder_is_pickled(self): 25 | """Unlike most tree builders, HTMLParserTreeBuilder and will 26 | be restored after pickling. 27 | """ 28 | tree = self.soup("foo") 29 | dumped = pickle.dumps(tree, 2) 30 | loaded = pickle.loads(dumped) 31 | self.assertTrue(isinstance(loaded.builder, type(tree.builder))) 32 | 33 | def test_redundant_empty_element_closing_tags(self): 34 | self.assertSoupEquals('





', "


") 35 | self.assertSoupEquals('


', "") 36 | 37 | def test_empty_element(self): 38 | # This verifies that any buffered data present when the parser 39 | # finishes working is handled. 40 | self.assertSoupEquals("foo &# bar", "foo &# bar") 41 | 42 | 43 | class TestHTMLParserSubclass(SoupTest): 44 | def test_error(self): 45 | """Verify that our HTMLParser subclass implements error() in a way 46 | that doesn't cause a crash. 47 | """ 48 | parser = BeautifulSoupHTMLParser() 49 | parser.error("don't crash") 50 | -------------------------------------------------------------------------------- /bs4/tests/test_lxml.py: -------------------------------------------------------------------------------- 1 | """Tests to ensure that the lxml tree builder generates good trees.""" 2 | 3 | import re 4 | import warnings 5 | 6 | try: 7 | import lxml.etree 8 | LXML_PRESENT = True 9 | LXML_VERSION = lxml.etree.LXML_VERSION 10 | except ImportError, e: 11 | LXML_PRESENT = False 12 | LXML_VERSION = (0,) 13 | 14 | if LXML_PRESENT: 15 | from bs4.builder import LXMLTreeBuilder, LXMLTreeBuilderForXML 16 | 17 | from bs4 import ( 18 | BeautifulSoup, 19 | BeautifulStoneSoup, 20 | ) 21 | from bs4.element import Comment, Doctype, SoupStrainer 22 | from bs4.testing import skipIf 23 | from bs4.tests import test_htmlparser 24 | from bs4.testing import ( 25 | HTMLTreeBuilderSmokeTest, 26 | XMLTreeBuilderSmokeTest, 27 | SoupTest, 28 | skipIf, 29 | ) 30 | 31 | @skipIf( 32 | not LXML_PRESENT, 33 | "lxml seems not to be present, not testing its tree builder.") 34 | class LXMLTreeBuilderSmokeTest(SoupTest, HTMLTreeBuilderSmokeTest): 35 | """See ``HTMLTreeBuilderSmokeTest``.""" 36 | 37 | @property 38 | def default_builder(self): 39 | return LXMLTreeBuilder() 40 | 41 | def test_out_of_range_entity(self): 42 | self.assertSoupEquals( 43 | "

foo�bar

", "

foobar

") 44 | self.assertSoupEquals( 45 | "

foo�bar

", "

foobar

") 46 | self.assertSoupEquals( 47 | "

foo�bar

", "

foobar

") 48 | 49 | def test_entities_in_foreign_document_encoding(self): 50 | # We can't implement this case correctly because by the time we 51 | # hear about markup like "“", it's been (incorrectly) converted into 52 | # a string like u'\x93' 53 | pass 54 | 55 | # In lxml < 2.3.5, an empty doctype causes a segfault. Skip this 56 | # test if an old version of lxml is installed. 57 | 58 | @skipIf( 59 | not LXML_PRESENT or LXML_VERSION < (2,3,5,0), 60 | "Skipping doctype test for old version of lxml to avoid segfault.") 61 | def test_empty_doctype(self): 62 | soup = self.soup("") 63 | doctype = soup.contents[0] 64 | self.assertEqual("", doctype.strip()) 65 | 66 | def test_beautifulstonesoup_is_xml_parser(self): 67 | # Make sure that the deprecated BSS class uses an xml builder 68 | # if one is installed. 69 | with warnings.catch_warnings(record=True) as w: 70 | soup = BeautifulStoneSoup("") 71 | self.assertEqual(u"", unicode(soup.b)) 72 | self.assertTrue("BeautifulStoneSoup class is deprecated" in str(w[0].message)) 73 | 74 | @skipIf( 75 | not LXML_PRESENT, 76 | "lxml seems not to be present, not testing its XML tree builder.") 77 | class LXMLXMLTreeBuilderSmokeTest(SoupTest, XMLTreeBuilderSmokeTest): 78 | """See ``HTMLTreeBuilderSmokeTest``.""" 79 | 80 | @property 81 | def default_builder(self): 82 | return LXMLTreeBuilderForXML() 83 | -------------------------------------------------------------------------------- /dateutil/__init__.py: -------------------------------------------------------------------------------- 1 | """ 2 | Copyright (c) 2003-2010 Gustavo Niemeyer 3 | 4 | This module offers extensions to the standard python 2.3+ 5 | datetime module. 
6 | """ 7 | __author__ = "Gustavo Niemeyer " 8 | __license__ = "PSF License" 9 | __version__ = "1.5" 10 | -------------------------------------------------------------------------------- /dateutil/easter.py: -------------------------------------------------------------------------------- 1 | """ 2 | Copyright (c) 2003-2007 Gustavo Niemeyer 3 | 4 | This module offers extensions to the standard python 2.3+ 5 | datetime module. 6 | """ 7 | __author__ = "Gustavo Niemeyer " 8 | __license__ = "PSF License" 9 | 10 | import datetime 11 | 12 | __all__ = ["easter", "EASTER_JULIAN", "EASTER_ORTHODOX", "EASTER_WESTERN"] 13 | 14 | EASTER_JULIAN = 1 15 | EASTER_ORTHODOX = 2 16 | EASTER_WESTERN = 3 17 | 18 | def easter(year, method=EASTER_WESTERN): 19 | """ 20 | This method was ported from the work done by GM Arts, 21 | on top of the algorithm by Claus Tondering, which was 22 | based in part on the algorithm of Ouding (1940), as 23 | quoted in "Explanatory Supplement to the Astronomical 24 | Almanac", P. Kenneth Seidelmann, editor. 25 | 26 | This algorithm implements three different easter 27 | calculation methods: 28 | 29 | 1 - Original calculation in Julian calendar, valid in 30 | dates after 326 AD 31 | 2 - Original method, with date converted to Gregorian 32 | calendar, valid in years 1583 to 4099 33 | 3 - Revised method, in Gregorian calendar, valid in 34 | years 1583 to 4099 as well 35 | 36 | These methods are represented by the constants: 37 | 38 | EASTER_JULIAN = 1 39 | EASTER_ORTHODOX = 2 40 | EASTER_WESTERN = 3 41 | 42 | The default method is method 3. 
43 | 44 | More about the algorithm may be found at: 45 | 46 | http://users.chariot.net.au/~gmarts/eastalg.htm 47 | 48 | and 49 | 50 | http://www.tondering.dk/claus/calendar.html 51 | 52 | """ 53 | 54 | if not (1 <= method <= 3): 55 | raise ValueError, "invalid method" 56 | 57 | # g - Golden year - 1 58 | # c - Century 59 | # h - (23 - Epact) mod 30 60 | # i - Number of days from March 21 to Paschal Full Moon 61 | # j - Weekday for PFM (0=Sunday, etc) 62 | # p - Number of days from March 21 to Sunday on or before PFM 63 | # (-6 to 28 methods 1 & 3, to 56 for method 2) 64 | # e - Extra days to add for method 2 (converting Julian 65 | # date to Gregorian date) 66 | 67 | y = year 68 | g = y % 19 69 | e = 0 70 | if method < 3: 71 | # Old method 72 | i = (19*g+15)%30 73 | j = (y+y//4+i)%7 74 | if method == 2: 75 | # Extra dates to convert Julian to Gregorian date 76 | e = 10 77 | if y > 1600: 78 | e = e+y//100-16-(y//100-16)//4 79 | else: 80 | # New method 81 | c = y//100 82 | h = (c-c//4-(8*c+13)//25+19*g+15)%30 83 | i = h-(h//28)*(1-(h//28)*(29//(h+1))*((21-g)//11)) 84 | j = (y+y//4+i+2-c+c//4)%7 85 | 86 | # p can be from -6 to 56 corresponding to dates 22 March to 23 May 87 | # (later dates apply to method 2, although 23 May never actually occurs) 88 | p = i-j+e 89 | d = 1+(p+27+(p+6)//40)%31 90 | m = 3+(p+26)//30 91 | return datetime.date(int(y),int(m),int(d)) 92 | 93 | -------------------------------------------------------------------------------- /dateutil/parser.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kevinmarks/unmung/5b8539971a8e1a64694e65643670936512fc987d/dateutil/parser.py -------------------------------------------------------------------------------- /dateutil/zoneinfo/__init__.py: -------------------------------------------------------------------------------- 1 | """ 2 | Copyright (c) 2003-2005 Gustavo Niemeyer 3 | 4 | This module offers extensions to the standard python 2.3+ 
5 | datetime module. 6 | """ 7 | from dateutil.tz import tzfile 8 | from tarfile import TarFile 9 | import os 10 | 11 | __author__ = "Gustavo Niemeyer " 12 | __license__ = "PSF License" 13 | 14 | __all__ = ["setcachesize", "gettz", "rebuild"] 15 | 16 | CACHE = [] 17 | CACHESIZE = 10 18 | 19 | class tzfile(tzfile): 20 | def __reduce__(self): 21 | return (gettz, (self._filename,)) 22 | 23 | def getzoneinfofile(): 24 | filenames = os.listdir(os.path.join(os.path.dirname(__file__))) 25 | filenames.sort() 26 | filenames.reverse() 27 | for entry in filenames: 28 | if entry.startswith("zoneinfo") and ".tar." in entry: 29 | return os.path.join(os.path.dirname(__file__), entry) 30 | return None 31 | 32 | ZONEINFOFILE = getzoneinfofile() 33 | 34 | del getzoneinfofile 35 | 36 | def setcachesize(size): 37 | global CACHESIZE, CACHE 38 | CACHESIZE = size 39 | del CACHE[size:] 40 | 41 | def gettz(name): 42 | tzinfo = None 43 | if ZONEINFOFILE: 44 | for cachedname, tzinfo in CACHE: 45 | if cachedname == name: 46 | break 47 | else: 48 | tf = TarFile.open(ZONEINFOFILE) 49 | try: 50 | zonefile = tf.extractfile(name) 51 | except KeyError: 52 | tzinfo = None 53 | else: 54 | tzinfo = tzfile(zonefile) 55 | tf.close() 56 | CACHE.insert(0, (name, tzinfo)) 57 | del CACHE[CACHESIZE:] 58 | return tzinfo 59 | 60 | def rebuild(filename, tag=None, format="gz"): 61 | import tempfile, shutil 62 | tmpdir = tempfile.mkdtemp() 63 | zonedir = os.path.join(tmpdir, "zoneinfo") 64 | moduledir = os.path.dirname(__file__) 65 | if tag: tag = "-"+tag 66 | targetname = "zoneinfo%s.tar.%s" % (tag, format) 67 | try: 68 | tf = TarFile.open(filename) 69 | for name in tf.getnames(): 70 | if not (name.endswith(".sh") or 71 | name.endswith(".tab") or 72 | name == "leapseconds"): 73 | tf.extract(name, tmpdir) 74 | filepath = os.path.join(tmpdir, name) 75 | os.system("zic -d %s %s" % (zonedir, filepath)) 76 | tf.close() 77 | target = os.path.join(moduledir, targetname) 78 | for entry in os.listdir(moduledir): 79 | if 
entry.startswith("zoneinfo") and ".tar." in entry: 80 | os.unlink(os.path.join(moduledir, entry)) 81 | tf = TarFile.open(target, "w:%s" % format) 82 | for entry in os.listdir(zonedir): 83 | entrypath = os.path.join(zonedir, entry) 84 | tf.add(entrypath, entry) 85 | tf.close() 86 | finally: 87 | shutil.rmtree(tmpdir) 88 | -------------------------------------------------------------------------------- /dateutil/zoneinfo/zoneinfo-2010g.tar.gz: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kevinmarks/unmung/5b8539971a8e1a64694e65643670936512fc987d/dateutil/zoneinfo/zoneinfo-2010g.tar.gz -------------------------------------------------------------------------------- /favicon.ico: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kevinmarks/unmung/5b8539971a8e1a64694e65643670936512fc987d/favicon.ico -------------------------------------------------------------------------------- /hfeed.html: -------------------------------------------------------------------------------- 1 | 2 | {{feed.title}} 3 | 4 | 5 | 6 | 7 | 8 | 9 |

{{feed.title}}

10 | {% if feed.subtitle_detail and feed.subtitle_detail.type=="text/plain" %}

{{feed.subtitle}}

11 | {% else %}

{% autoescape false %}{{feed.subtitle}}{% endautoescape %}

12 | {% endif %} 13 | {% if feed.author_detail %} 14 |

15 | {% if feed.image %} 16 | 17 | {% endif %} 18 | {% for link in feed.links %} 19 | {% if link.type.split('/')[0] == 'image' and link.rel=='avatar' %} 20 | 21 | {% endif %} 22 | {% endfor %} 23 | {{feed.author_detail.name}} 24 |

25 | {% endif %} 26 | {% for entry in entries %} 27 |
28 | {% autoescape false %}{{entry.title}}{% endautoescape %} 29 |
30 | {% if entry.summary and entry.content %} 31 | 32 | {% autoescape false %} 33 | {{entry.summary}} 34 | {% endautoescape %} 35 | {% if entry.content[0].value.startswith(entry.summary) %} 36 | {% autoescape false %} 37 | {{entry.content[0].value.split(entry.summary)[1] }} 38 | {% endautoescape %} 39 | {% else %} 40 | {% autoescape false %} 41 | {{entry.content[0].value}} 42 | {% endautoescape %} 43 | {% endif %} 44 | {% elif entry.content %} 45 | {% autoescape false %} 46 | {{entry.content[0].value}} 47 | {% endautoescape %} 48 | {% elif entry.summary %} 49 | 50 | {% autoescape false %} 51 | {{entry.summary}} 52 | {% endautoescape %} 53 | 54 | {% endif %} 55 | 56 | {% for link in entry.links %} 57 | {% if link.type == 'audio/mpeg' or link.type == 'audio/mp3' or (link.href and link.href.endswith(".mp3")) %} 58 |

59 | {% endif %} 60 | {% if link.type == 'video/x-m4v' or link.type == 'video/x-mp4' or link.type == 'video/mp4' %} 61 |

62 | {% endif %} 63 | {% if link.type and link.type.split('/')[0] == 'image' and link.rel not in ['avatar','header'] %} 64 |

65 | {% endif %} 66 | {% endfor %} 67 |

68 | {% if entry.published %} 69 |

70 | {% endif %} 71 | {% if entry.updated %} 72 |

73 | {% endif %} 74 | {% if entry.authors %} 75 |

    by 76 | {% for author in entry.authors %} 77 |
  • {{author.name}} 78 | {% endfor %} 79 |
80 | {% else %} 81 | {% if entry.author_detail %} 82 | {% if entry.author_detail.href %} 83 |

by 84 | {% for link in entry.links %} 85 | {% if link.type.split('/')[0] == 'image' and link.rel=='avatar' %} 86 | 87 | {% endif %} 88 | {% endfor %} 89 | {{entry.author_detail.name}} 90 | {% else %} 91 | {% autoescape false %} 92 | by {{entry.author_detail.name}} 93 | {% endautoescape %} 94 | {% endif %} 95 | {% endif %} 96 | {% endif %} 97 |

98 |
99 | {% endfor %} 100 | {% if raw == 'on' %} 101 | {{feeds}} 102 |

{{feed}} 103 |

104 | {{entries}} 105 | 106 | {% endif %} 107 | 108 | -------------------------------------------------------------------------------- /hfeedello.html: -------------------------------------------------------------------------------- 1 | 2 | unmunged ello for {{feed.name}} 3 | 4 | 5 | 6 | 7 | 8 | 9 |

{{feed.name}}

10 |

11 | 12 |

{{feed.name}}

13 |
    14 | {% for entry in feed %} 15 |
    16 | {% for bodypart in entry.body %} 17 | {% if bodypart.kind=="text" %} 18 |
    19 | {% autoescape false %} 20 | {{bodypart.data}} 21 | {% endautoescape %} 22 |
    23 | {% endif %} 24 | {% if bodypart.kind=="image" %} 25 |
    26 | {{bodypart.data.alt}} 27 |
    28 | {% endif %} 29 | {% endfor %} 30 | {% if entry.created_at %} 31 |

    32 | {% endif %} 33 |

    34 |
    35 | {% endfor %} 36 | {% if raw == 'on' %} 37 | {{feeds}} 38 |

    {{feed}} 39 |

    40 | {{entries}} 41 | 42 | {% endif %} 43 | 44 | -------------------------------------------------------------------------------- /hfeedmasto.html: -------------------------------------------------------------------------------- 1 | 2 | {{feed.title}} 3 | 4 | 5 | 6 | 7 | 8 | 9 | 10 | 11 |

    12 |
    13 | 14 | 15 | {% for instance in instances %} 16 | 17 | {% endfor %} 18 | 19 | 23 | 24 |
    25 | 26 |

    {{feed.name}}

    27 |
    28 |

    {{error}}

    29 |
    30 | {% for entry in entries %} 31 |
    32 |
    33 | 34 | {{entry.account.display_name or entry.account.username}} @{% autoescape false %}{{entry.account.acct}}{% endautoescape %} 35 |
    36 | {% if entry.spoiler_text!="" %} 37 |
    38 | {% autoescape false %}{{entry.spoiler_text}}{% endautoescape %} Show More 39 | {% endif %} 40 | 41 |
    42 | {% if entry.content %} 43 | {% autoescape false %} 44 | {{entry.content}} 45 | {% endautoescape %} 46 | {% endif %} 47 |
    48 | {% if entry.nsfw_hide_media and entry.media_attachments %} 49 |
    Show NSFW media 50 | {% endif %} 51 | {% for media in entry.media_attachments %} 52 |
    53 | {% endfor %} 54 | {% if entry.nsfw_hide_media %} 55 |
    56 | {% endif %} 57 | {% if entry.spoiler_text!="" %} 58 |
    59 | {% endif %} 60 | 61 |
    62 | {% endfor %} 63 |
    64 | 65 | -------------------------------------------------------------------------------- /hovercard.html: -------------------------------------------------------------------------------- 1 | 2 | {{" ".join(item.properties.name)}} 3 | 4 | 5 | 6 | 7 | 8 |
    9 |

    {% if item.properties.photo %} 10 | 11 | {% endif %} 12 | 13 | {{" ".join(item.properties.name)}} 14 |

    15 | {% if item.properties.summary %} 16 |

    {{" ".join(item.properties.summary)}}

    17 | {% elif item.properties.note %} 18 | {% if item.properties.note[0].html %} 19 | {% autoescape false %} 20 |

    {{item.properties.note[0].html}}

    21 | {% endautoescape %} 22 | {% else %} 23 |

    {{" ".join(item.properties.note)}}

    24 | {% endif %} 25 | {% endif %} 26 |
    27 | 28 | -------------------------------------------------------------------------------- /hovercard2.html: -------------------------------------------------------------------------------- 1 | 2 | {{name}} 3 | 4 | 5 | 6 | 7 | 8 |
    9 | {% if banner %} 10 | 13 | {% endif %} 14 |

    {% if photo %} 15 | 16 | {% endif %} 17 | 18 | {{name}} 19 |

    20 | {% if summary %} 21 | {% autoescape false %} 22 |

    {{summary}}

    23 | {% endautoescape %} 24 | {% endif %} 25 | {% if org %} 26 | {% autoescape false %} 27 |

    {{org}}

    28 | {% endautoescape %} 29 | {% endif %} 30 | 31 | {% if entries %} 32 |
    33 | {% for entry in entries %} 34 |

    {{entry.name}}

    35 | {% if entry.featured %} 36 | 39 | {% elif entry.photo %} 40 |
    41 | {% endif %} 42 |

    {{entry.summary}}

    43 |
    44 | {% endfor %} 45 |
    46 | {% endif %} 47 |
    48 | 49 | -------------------------------------------------------------------------------- /hovertest.html: -------------------------------------------------------------------------------- 1 | 2 | {% autoescape true %} 3 | 4 | hovercard test 5 | 6 | 7 | 8 | 9 | 10 | 13 | 14 | 15 | {% for url in urls %} 16 | 17 | {% endfor %} 18 | 19 | 20 | {% endautoescape %} -------------------------------------------------------------------------------- /html5lib/.DS_Store: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kevinmarks/unmung/5b8539971a8e1a64694e65643670936512fc987d/html5lib/.DS_Store -------------------------------------------------------------------------------- /html5lib/__init__.py: -------------------------------------------------------------------------------- 1 | """ 2 | HTML parsing library based on the WHATWG "HTML5" 3 | specification. The parser is designed to be compatible with existing 4 | HTML found in the wild and implements well-defined error recovery that 5 | is largely compatible with modern desktop web browsers. 
6 | 7 | Example usage: 8 | 9 | import html5lib 10 | f = open("my_document.html") 11 | tree = html5lib.parse(f) 12 | """ 13 | 14 | from __future__ import absolute_import, division, unicode_literals 15 | 16 | from .html5parser import HTMLParser, parse, parseFragment 17 | from .treebuilders import getTreeBuilder 18 | from .treewalkers import getTreeWalker 19 | from .serializer import serialize 20 | 21 | __all__ = ["HTMLParser", "parse", "parseFragment", "getTreeBuilder", 22 | "getTreeWalker", "serialize"] 23 | __version__ = "0.999999-dev" 24 | -------------------------------------------------------------------------------- /html5lib/filters/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kevinmarks/unmung/5b8539971a8e1a64694e65643670936512fc987d/html5lib/filters/__init__.py -------------------------------------------------------------------------------- /html5lib/filters/_base.py: -------------------------------------------------------------------------------- 1 | from __future__ import absolute_import, division, unicode_literals 2 | 3 | 4 | class Filter(object): 5 | def __init__(self, source): 6 | self.source = source 7 | 8 | def __iter__(self): 9 | return iter(self.source) 10 | 11 | def __getattr__(self, name): 12 | return getattr(self.source, name) 13 | -------------------------------------------------------------------------------- /html5lib/filters/alphabeticalattributes.py: -------------------------------------------------------------------------------- 1 | from __future__ import absolute_import, division, unicode_literals 2 | 3 | from . 
import _base 4 | 5 | try: 6 | from collections import OrderedDict 7 | except ImportError: 8 | from ordereddict import OrderedDict 9 | 10 | 11 | class Filter(_base.Filter): 12 | def __iter__(self): 13 | for token in _base.Filter.__iter__(self): 14 | if token["type"] in ("StartTag", "EmptyTag"): 15 | attrs = OrderedDict() 16 | for name, value in sorted(token["data"].items(), 17 | key=lambda x: x[0]): 18 | attrs[name] = value 19 | token["data"] = attrs 20 | yield token 21 | -------------------------------------------------------------------------------- /html5lib/filters/inject_meta_charset.py: -------------------------------------------------------------------------------- 1 | from __future__ import absolute_import, division, unicode_literals 2 | 3 | from . import _base 4 | 5 | 6 | class Filter(_base.Filter): 7 | def __init__(self, source, encoding): 8 | _base.Filter.__init__(self, source) 9 | self.encoding = encoding 10 | 11 | def __iter__(self): 12 | state = "pre_head" 13 | meta_found = (self.encoding is None) 14 | pending = [] 15 | 16 | for token in _base.Filter.__iter__(self): 17 | type = token["type"] 18 | if type == "StartTag": 19 | if token["name"].lower() == "head": 20 | state = "in_head" 21 | 22 | elif type == "EmptyTag": 23 | if token["name"].lower() == "meta": 24 | # replace charset with actual encoding 25 | has_http_equiv_content_type = False 26 | for (namespace, name), value in token["data"].items(): 27 | if namespace is not None: 28 | continue 29 | elif name.lower() == 'charset': 30 | token["data"][(namespace, name)] = self.encoding 31 | meta_found = True 32 | break 33 | elif name == 'http-equiv' and value.lower() == 'content-type': 34 | has_http_equiv_content_type = True 35 | else: 36 | if has_http_equiv_content_type and (None, "content") in token["data"]: 37 | token["data"][(None, "content")] = 'text/html; charset=%s' % self.encoding 38 | meta_found = True 39 | 40 | elif token["name"].lower() == "head" and not meta_found: 41 | # insert meta into empty 
head 42 | yield {"type": "StartTag", "name": "head", 43 | "data": token["data"]} 44 | yield {"type": "EmptyTag", "name": "meta", 45 | "data": {(None, "charset"): self.encoding}} 46 | yield {"type": "EndTag", "name": "head"} 47 | meta_found = True 48 | continue 49 | 50 | elif type == "EndTag": 51 | if token["name"].lower() == "head" and pending: 52 | # insert meta into head (if necessary) and flush pending queue 53 | yield pending.pop(0) 54 | if not meta_found: 55 | yield {"type": "EmptyTag", "name": "meta", 56 | "data": {(None, "charset"): self.encoding}} 57 | while pending: 58 | yield pending.pop(0) 59 | meta_found = True 60 | state = "post_head" 61 | 62 | if state == "in_head": 63 | pending.append(token) 64 | else: 65 | yield token 66 | -------------------------------------------------------------------------------- /html5lib/filters/lint.py: -------------------------------------------------------------------------------- 1 | from __future__ import absolute_import, division, unicode_literals 2 | 3 | from . 
class Filter(_base.Filter):
    """Lint filter: validates a treewalker token stream.

    Raises LintError on any malformed token and otherwise yields every
    token through unchanged.
    """

    def __iter__(self):
        open_elements = []            # stack of currently-open StartTag names
        contentModelFlag = "PCDATA"
        for token in _base.Filter.__iter__(self):
            token_type = token["type"]
            if token_type in ("StartTag", "EmptyTag"):
                name = token["name"]
                if contentModelFlag != "PCDATA":
                    raise LintError("StartTag not in PCDATA content model flag: %(tag)s" % {"tag": name})
                if not isinstance(name, str):
                    raise LintError("Tag name is not a string: %(tag)r" % {"tag": name})
                if not name:
                    raise LintError("Empty tag name")
                if token_type == "StartTag" and name in voidElements:
                    raise LintError("Void element reported as StartTag token: %(tag)s" % {"tag": name})
                elif token_type == "EmptyTag" and name not in voidElements:
                    raise LintError("Non-void element reported as EmptyTag token: %(tag)s" % {"tag": token["name"]})
                if token_type == "StartTag":
                    open_elements.append(name)
                # BUG FIX: treewalker tokens carry attributes as a dict keyed
                # by (namespace, localname) — see e.g. treewalkers/dom.py in
                # this package.  The old code iterated the dict directly
                # (keys only) and clobbered the tag `name` with the loop
                # variable, so the content-model check below tested the last
                # attribute name instead of the element name.
                for (attr_ns, attr_name), attr_value in token["data"].items():
                    if not isinstance(attr_name, str):
                        raise LintError("Attribute name is not a string: %(name)r" % {"name": attr_name})
                    if not attr_name:
                        raise LintError("Empty attribute name")
                    if not isinstance(attr_value, str):
                        raise LintError("Attribute value is not a string: %(value)r" % {"value": attr_value})
                if name in cdataElements:
                    contentModelFlag = "CDATA"
                elif name in rcdataElements:
                    contentModelFlag = "RCDATA"
                elif name == "plaintext":
                    contentModelFlag = "PLAINTEXT"

            elif token_type == "EndTag":
                name = token["name"]
                if not isinstance(name, str):
                    raise LintError("Tag name is not a string: %(tag)r" % {"tag": name})
                if not name:
                    raise LintError("Empty tag name")
                if name in voidElements:
                    raise LintError("Void element reported as EndTag token: %(tag)s" % {"tag": name})
                # BUG FIX: popping an empty stack raised IndexError; report
                # the unbalanced stream as a lint failure instead.
                if not open_elements:
                    raise LintError("EndTag (%(end)s) with no corresponding StartTag" % {"end": name})
                start_name = open_elements.pop()
                if start_name != name:
                    raise LintError("EndTag (%(end)s) does not match StartTag (%(start)s)" % {"end": name, "start": start_name})
                contentModelFlag = "PCDATA"

            elif token_type == "Comment":
                if contentModelFlag != "PCDATA":
                    raise LintError("Comment not in PCDATA content model flag")

            elif token_type in ("Characters", "SpaceCharacters"):
                data = token["data"]
                if not isinstance(data, str):
                    # BUG FIX: old message wrongly said "Attribute name".
                    raise LintError("Character data is not a string: %(data)r" % {"data": data})
                if not data:
                    raise LintError("%(type)s token with empty data" % {"type": token_type})
                if token_type == "SpaceCharacters":
                    data = data.strip(spaceCharacters)
                    if data:
                        raise LintError("Non-space character(s) found in SpaceCharacters token: %(token)r" % {"token": data})

            elif token_type == "Doctype":
                name = token["name"]
                if contentModelFlag != "PCDATA":
                    raise LintError("Doctype not in PCDATA content model flag: %(name)s" % {"name": name})
                if not isinstance(name, str):
                    raise LintError("Tag name is not a string: %(tag)r" % {"tag": name})
                # XXX: what to do with token["data"] ?

            elif token_type in ("ParseError", "SerializeError"):
                pass

            else:
                raise LintError("Unknown token type: %(type)s" % {"type": token_type})

            yield token
class Filter(_base.Filter):
    """Collapse runs of whitespace in the token stream to single spaces,
    except inside elements where whitespace is significant (pre, textarea
    and the RCDATA elements)."""

    spacePreserveElements = frozenset(["pre", "textarea"] + list(rcdataElements))

    def __iter__(self):
        depth = 0  # nesting depth within space-preserving elements
        for token in _base.Filter.__iter__(self):
            kind = token["type"]
            if kind == "StartTag" \
                    and (depth or token["name"] in self.spacePreserveElements):
                depth += 1

            elif kind == "EndTag" and depth:
                depth -= 1

            elif not depth and kind == "SpaceCharacters" and token["data"]:
                # The truthiness guard on token["data"] avoids introducing
                # a space where there was none.
                token["data"] = " "

            elif not depth and kind == "Characters":
                token["data"] = collapse_spaces(token["data"])

            yield token


def collapse_spaces(text):
    """Replace every run of whitespace characters with a single space."""
    return SPACES_REGEX.sub(' ', text)
# Map each foreign-attribute prefix to its namespace URI (only entries
# that actually carry a prefix).
prefix_mapping = {prefix: namespace
                  for prefix, localName, namespace in adjustForeignAttributes.values()
                  if prefix is not None}


def to_sax(walker, handler):
    """Call SAX-like content handler based on treewalker walker"""
    handler.startDocument()
    for prefix, namespace in prefix_mapping.items():
        handler.startPrefixMapping(prefix, namespace)

    for token in walker:
        kind = token["type"]
        if kind == "Doctype":
            # SAX ContentHandler has no doctype event; drop it.
            continue
        elif kind in ("StartTag", "EmptyTag"):
            qname = (token["namespace"], token["name"])
            attrs = AttributesNSImpl(token["data"],
                                     unadjustForeignAttributes)
            handler.startElementNS(qname, token["name"], attrs)
            if kind == "EmptyTag":
                # Void element: close it immediately.
                handler.endElementNS(qname, token["name"])
        elif kind == "EndTag":
            handler.endElementNS((token["namespace"], token["name"]),
                                 token["name"])
        elif kind in ("Characters", "SpaceCharacters"):
            handler.characters(token["data"])
        elif kind == "Comment":
            pass
        else:
            assert False, "Unknown token type"

    for prefix, namespace in prefix_mapping.items():
        handler.endPrefixMapping(prefix)
    handler.endDocument()
treeBuilderCache = {}


def getTreeBuilder(treeType, implementation=None, **kwargs):
    """Get a TreeBuilder class for various types of tree with built-in support

    treeType - the name of the tree type required (case-insensitive).
               Supported values are:

               "dom"   - A generic builder for DOM implementations,
                         defaulting to a xml.dom.minidom based implementation.
               "etree" - A generic builder for tree implementations exposing
                         an ElementTree-like interface, defaulting to
                         xml.etree.cElementTree if available and
                         xml.etree.ElementTree if not.
               "lxml"  - A etree-based builder for lxml.etree, handling
                         limitations of lxml's implementation.

    implementation - (Currently applies to the "etree" and "dom" tree
               types). A module implementing the tree type e.g.
               xml.etree.ElementTree or xml.etree.cElementTree.

    Raises ValueError for an unrecognised treeType.
    """
    treeType = treeType.lower()
    if treeType in treeBuilderCache:
        return treeBuilderCache[treeType]

    if treeType == "dom":
        from . import dom
        if implementation is None:
            # Come up with a sane default (pref. from the stdlib)
            from xml.dom import minidom
            implementation = minidom
        # NEVER cache here, caching is done in the dom submodule
        return dom.getDomModule(implementation, **kwargs).TreeBuilder
    elif treeType == "etree":
        from . import etree
        if implementation is None:
            implementation = default_etree
        # NEVER cache here, caching is done in the etree submodule
        return etree.getETreeModule(implementation, **kwargs).TreeBuilder
    elif treeType == "lxml":
        from . import etree_lxml
        treeBuilderCache[treeType] = etree_lxml.TreeBuilder
        return treeBuilderCache[treeType]
    else:
        raise ValueError("""Unrecognised treebuilder "%s" """ % treeType)
class TreeWalker(_base.NonRecursiveTreeWalker):
    """Non-recursive tree walker over xml.dom (minidom-style) node trees."""

    def getNodeDetails(self, node):
        """Classify *node* into a walker detail tuple by its DOM nodeType."""
        node_type = node.nodeType
        if node_type == Node.DOCUMENT_TYPE_NODE:
            return _base.DOCTYPE, node.name, node.publicId, node.systemId

        if node_type in (Node.TEXT_NODE, Node.CDATA_SECTION_NODE):
            return _base.TEXT, node.nodeValue

        if node_type == Node.ELEMENT_NODE:
            # Build an attribute dict keyed by (namespaceURI, localName);
            # non-namespaced attributes use (None, name).
            attrs = {}
            for attr_name in list(node.attributes.keys()):
                attr = node.getAttributeNode(attr_name)
                if attr.namespaceURI:
                    attrs[(attr.namespaceURI, attr.localName)] = attr.value
                else:
                    attrs[(None, attr.name)] = attr.value
            return (_base.ELEMENT, node.namespaceURI, node.nodeName,
                    attrs, node.hasChildNodes())

        if node_type == Node.COMMENT_NODE:
            return _base.COMMENT, node.nodeValue

        if node_type in (Node.DOCUMENT_NODE, Node.DOCUMENT_FRAGMENT_NODE):
            return (_base.DOCUMENT,)

        return _base.UNKNOWN, node.nodeType

    def getFirstChild(self, node):
        return node.firstChild

    def getNextSibling(self, node):
        return node.nextSibling

    def getParentNode(self, node):
        return node.parentNode
import _base 8 | 9 | from ..constants import voidElements, namespaces 10 | 11 | 12 | class TreeWalker(_base.TreeWalker): 13 | def __iter__(self): 14 | # Buffer the events so we can pass in the following one 15 | previous = None 16 | for event in self.tree: 17 | if previous is not None: 18 | for token in self.tokens(previous, event): 19 | yield token 20 | previous = event 21 | 22 | # Don't forget the final event! 23 | if previous is not None: 24 | for token in self.tokens(previous, None): 25 | yield token 26 | 27 | def tokens(self, event, next): 28 | kind, data, pos = event 29 | if kind == START: 30 | tag, attribs = data 31 | name = tag.localname 32 | namespace = tag.namespace 33 | converted_attribs = {} 34 | for k, v in attribs: 35 | if isinstance(k, QName): 36 | converted_attribs[(k.namespace, k.localname)] = v 37 | else: 38 | converted_attribs[(None, k)] = v 39 | 40 | if namespace == namespaces["html"] and name in voidElements: 41 | for token in self.emptyTag(namespace, name, converted_attribs, 42 | not next or next[0] != END 43 | or next[1] != tag): 44 | yield token 45 | else: 46 | yield self.startTag(namespace, name, converted_attribs) 47 | 48 | elif kind == END: 49 | name = data.localname 50 | namespace = data.namespace 51 | if name not in voidElements: 52 | yield self.endTag(namespace, name) 53 | 54 | elif kind == COMMENT: 55 | yield self.comment(data) 56 | 57 | elif kind == TEXT: 58 | for token in self.text(data): 59 | yield token 60 | 61 | elif kind == DOCTYPE: 62 | yield self.doctype(*data) 63 | 64 | elif kind in (XML_NAMESPACE, DOCTYPE, START_NS, END_NS, 65 | START_CDATA, END_CDATA, PI): 66 | pass 67 | 68 | else: 69 | yield self.unknown(kind) 70 | -------------------------------------------------------------------------------- /html5lib/treewalkers/pulldom.py: -------------------------------------------------------------------------------- 1 | from __future__ import absolute_import, division, unicode_literals 2 | 3 | from xml.dom.pulldom import 
class TreeWalker(_base.TreeWalker):
    """Tree walker that converts an xml.dom.pulldom event stream into
    html5lib tokens, with one event of lookahead.

    `ignore_until` suppresses the (bogus) child events of an element that
    was emitted as an EmptyTag, until its matching END_ELEMENT is seen.
    """

    def __iter__(self):
        ignore_until = None
        previous = None
        for event in self.tree:
            # Emit tokens for the buffered event unless we are skipping
            # the interior of an already-emitted empty element.
            if previous is not None and \
               (ignore_until is None or previous[1] is ignore_until):
                if previous[1] is ignore_until:
                    # Reached the END_ELEMENT of the skipped element.
                    ignore_until = None
                for token in self.tokens(previous, event):
                    yield token
                    if token["type"] == "EmptyTag":
                        # Skip everything until this node's END_ELEMENT.
                        ignore_until = previous[1]
            previous = event
        if ignore_until is None or previous[1] is ignore_until:
            for token in self.tokens(previous, None):
                yield token
        elif ignore_until is not None:
            raise ValueError("Illformed DOM event stream: void element without END_ELEMENT")

    def tokens(self, event, next):
        # `event` is a pulldom (type, node) pair; `next` is the following
        # event (or None), used to detect childless void elements.
        type, node = event
        if type == START_ELEMENT:
            name = node.nodeName
            namespace = node.namespaceURI
            attrs = {}
            for attr in list(node.attributes.keys()):
                attr = node.getAttributeNode(attr)
                attrs[(attr.namespaceURI, attr.localName)] = attr.value
            if name in voidElements:
                # Flag indicates whether the void element wrongly has
                # content (next event is not its own END_ELEMENT).
                for token in self.emptyTag(namespace,
                                           name,
                                           attrs,
                                           not next or next[1] is not node):
                    yield token
            else:
                yield self.startTag(namespace, name, attrs)

        elif type == END_ELEMENT:
            name = node.nodeName
            namespace = node.namespaceURI
            # Void elements were already emitted as EmptyTag above.
            if name not in voidElements:
                yield self.endTag(namespace, name)

        elif type == COMMENT:
            yield self.comment(node.nodeValue)

        elif type in (IGNORABLE_WHITESPACE, CHARACTERS):
            for token in self.text(node.nodeValue):
                yield token

        else:
            yield self.unknown(type)
class Trie(Mapping):
    """Abstract base class for tries.

    Concrete subclasses provide the Mapping protocol (``__getitem__``,
    ``__iter__``, ``__len__``); the prefix helpers below are generic —
    if slow — default implementations layered on top of it.
    """

    def keys(self, prefix=None):
        """Return the set of keys, optionally restricted to a prefix."""
        all_keys = super().keys()
        if prefix is None:
            return set(all_keys)
        return {key for key in all_keys if key.startswith(prefix)}

    def has_keys_with_prefix(self, prefix):
        """Return True if any stored key starts with *prefix*."""
        return any(key.startswith(prefix) for key in self.keys())

    def longest_prefix(self, prefix):
        """Return the longest stored key that is a prefix of *prefix*.

        Raises KeyError when no stored key (including "") qualifies.
        """
        if prefix in self:
            return prefix
        # Try successively shorter slices, longest first, down to "".
        for end in range(len(prefix) - 1, -1, -1):
            candidate = prefix[:end]
            if candidate in self:
                return candidate
        raise KeyError(prefix)

    def longest_prefix_item(self, prefix):
        """Return (key, value) for the longest stored prefix of *prefix*."""
        longest = self.longest_prefix(prefix)
        return (longest, self[longest])
DATrie("".join(chars)) 19 | for key, value in data.items(): 20 | self._data[key] = value 21 | 22 | def __contains__(self, key): 23 | return key in self._data 24 | 25 | def __len__(self): 26 | return len(self._data) 27 | 28 | def __iter__(self): 29 | raise NotImplementedError() 30 | 31 | def __getitem__(self, key): 32 | return self._data[key] 33 | 34 | def keys(self, prefix=None): 35 | return self._data.keys(prefix) 36 | 37 | def has_keys_with_prefix(self, prefix): 38 | return self._data.has_keys_with_prefix(prefix) 39 | 40 | def longest_prefix(self, prefix): 41 | return self._data.longest_prefix(prefix) 42 | 43 | def longest_prefix_item(self, prefix): 44 | return self._data.longest_prefix_item(prefix) 45 | -------------------------------------------------------------------------------- /html5lib/trie/py.py: -------------------------------------------------------------------------------- 1 | from __future__ import absolute_import, division, unicode_literals 2 | from six import text_type 3 | 4 | from bisect import bisect_left 5 | 6 | from ._base import Trie as ABCTrie 7 | 8 | 9 | class Trie(ABCTrie): 10 | def __init__(self, data): 11 | if not all(isinstance(x, text_type) for x in data.keys()): 12 | raise TypeError("All keys must be strings") 13 | 14 | self._data = data 15 | self._keys = sorted(data.keys()) 16 | self._cachestr = "" 17 | self._cachepoints = (0, len(data)) 18 | 19 | def __contains__(self, key): 20 | return key in self._data 21 | 22 | def __len__(self): 23 | return len(self._data) 24 | 25 | def __iter__(self): 26 | return iter(self._data) 27 | 28 | def __getitem__(self, key): 29 | return self._data[key] 30 | 31 | def keys(self, prefix=None): 32 | if prefix is None or prefix == "" or not self._keys: 33 | return set(self._keys) 34 | 35 | if prefix.startswith(self._cachestr): 36 | lo, hi = self._cachepoints 37 | start = i = bisect_left(self._keys, prefix, lo, hi) 38 | else: 39 | start = i = bisect_left(self._keys, prefix) 40 | 41 | keys = set() 42 | if 
start == len(self._keys): 43 | return keys 44 | 45 | while self._keys[i].startswith(prefix): 46 | keys.add(self._keys[i]) 47 | i += 1 48 | 49 | self._cachestr = prefix 50 | self._cachepoints = (start, i) 51 | 52 | return keys 53 | 54 | def has_keys_with_prefix(self, prefix): 55 | if prefix in self._data: 56 | return True 57 | 58 | if prefix.startswith(self._cachestr): 59 | lo, hi = self._cachepoints 60 | i = bisect_left(self._keys, prefix, lo, hi) 61 | else: 62 | i = bisect_left(self._keys, prefix) 63 | 64 | if i == len(self._keys): 65 | return False 66 | 67 | return self._keys[i].startswith(prefix) 68 | -------------------------------------------------------------------------------- /html5lib/utils.py: -------------------------------------------------------------------------------- 1 | from __future__ import absolute_import, division, unicode_literals 2 | 3 | from types import ModuleType 4 | 5 | from six import text_type 6 | 7 | try: 8 | import xml.etree.cElementTree as default_etree 9 | except ImportError: 10 | import xml.etree.ElementTree as default_etree 11 | 12 | 13 | __all__ = ["default_etree", "MethodDispatcher", "isSurrogatePair", 14 | "surrogatePairToCodepoint", "moduleFactoryFactory", 15 | "supports_lone_surrogates"] 16 | 17 | 18 | # Platforms not supporting lone surrogates (\uD800-\uDFFF) should be 19 | # caught by the below test. In general this would be any platform 20 | # using UTF-16 as its encoding of unicode strings, such as 21 | # Jython. This is because UTF-16 itself is based on the use of such 22 | # surrogates, and there is no mechanism to further escape such 23 | # escapes. 
class MethodDispatcher(dict):
    """Dict with 2 special properties:

    On initiation, keys that are lists, sets or tuples are expanded into
    one entry per member, so looking up any member of the original
    list-like key returns the shared value:

        md = MethodDispatcher({("foo", "bar"):"baz"})
        md["foo"] == "baz"

    Missing keys fall back to the ``default`` attribute (None initially).
    """

    def __init__(self, items=()):
        # Build the flattened entry list first and hand it to
        # dict.__init__ in one call — measurably faster than assigning
        # keys one at a time.  Please benchmark before changing this.
        entries = []
        for key, value in items:
            if type(key) in (list, tuple, frozenset, set):
                entries.extend((member, value) for member in key)
            else:
                entries.append((key, value))
        dict.__init__(self, entries)
        self.default = None

    def __getitem__(self, key):
        # Missing keys return self.default instead of raising.
        return dict.get(self, key, self.default)


# Some utility functions to deal with weirdness around UCS2 vs UCS4
# python builds

def isSurrogatePair(data):
    """Return True if *data* is a high+low UTF-16 surrogate pair."""
    if len(data) != 2:
        return False
    high, low = ord(data[0]), ord(data[1])
    return 0xD800 <= high <= 0xDBFF and 0xDC00 <= low <= 0xDFFF


def surrogatePairToCodepoint(data):
    """Combine a UTF-16 surrogate pair into its astral codepoint."""
    high, low = ord(data[0]), ord(data[1])
    return 0x10000 + (high - 0xD800) * 0x400 + (low - 0xDC00)
def moduleFactoryFactory(factory):
    """Wrap *factory* so that the module it builds for a given base
    module is constructed once and cached.

    ``factory(baseModule, *args, **kwargs)`` must return a dict of names
    to inject into a synthetic module named after the base module.
    """
    moduleCache = {}

    def moduleFactory(baseModule, *args, **kwargs):
        # Module names are text on Python 3 and bytes on Python 2; the
        # isinstance probe picks the matching format string type.
        if isinstance(ModuleType.__name__, type("")):
            name = "_%s_factory" % baseModule.__name__
        else:
            name = b"_%s_factory" % baseModule.__name__

        try:
            return moduleCache[name]
        except KeyError:
            mod = ModuleType(name)
            mod.__dict__.update(factory(baseModule, *args, **kwargs))
            moduleCache[name] = mod
            return mod

    return moduleFactory
"""Format a number of byteslike a human readable filesize (eg. 10 kB). By 15 | default, decimal suffixes (kB, MB) are used. Passing binary=true will use 16 | binary suffixes (KiB, MiB) are used and the base will be 2**10 instead of 17 | 10**3. If ``gnu`` is True, the binary argument is ignored and GNU-style 18 | (ls -sh style) prefixes are used (K, M) with the 2**10 definition. 19 | Non-gnu modes are compatible with jinja2's ``filesizeformat`` filter.""" 20 | if gnu: suffix = suffixes['gnu'] 21 | elif binary: suffix = suffixes['binary'] 22 | else: suffix = suffixes['decimal'] 23 | 24 | base = 1024 if (gnu or binary) else 1000 25 | bytes = float(value) 26 | 27 | if bytes == 1 and not gnu: return '1 Byte' 28 | elif bytes < base and not gnu: return '%d Bytes' % bytes 29 | elif bytes < base and gnu: return '%dB' % bytes 30 | 31 | for i,s in enumerate(suffix): 32 | unit = base ** (i+2) 33 | if bytes < unit and not gnu: 34 | return (format + ' %s') % ((base * bytes / unit), s) 35 | elif bytes < unit and gnu: 36 | return (format + '%s') % ((base * bytes / unit), s) 37 | if gnu: 38 | return (format + '%s') % ((base * bytes / unit), s) 39 | return (format + ' %s') % ((base * bytes / unit), s) 40 | 41 | -------------------------------------------------------------------------------- /humanize/i18n.py: -------------------------------------------------------------------------------- 1 | # -*- coding: utf-8 -*- 2 | import gettext as gettext_module 3 | from threading import local 4 | import os.path 5 | 6 | __all__ = ['activate', 'deactivate', 'gettext', 'ngettext'] 7 | 8 | _TRANSLATIONS = {None: gettext_module.NullTranslations()} 9 | _CURRENT = local() 10 | 11 | _DEFAULT_LOCALE_PATH = os.path.join(os.path.dirname(__file__), 'locale') 12 | 13 | 14 | def get_translation(): 15 | try: 16 | return _TRANSLATIONS[_CURRENT.locale] 17 | except (AttributeError, KeyError): 18 | return _TRANSLATIONS[None] 19 | 20 | 21 | def activate(locale, path=None): 22 | """Set 'locale' as current 
def pgettext(msgctxt, message):
    """'Particular gettext' function (GNU gettext's ``pgettext``).

    Supports '.po' ``msgctxt`` modifiers, allowing the same msgid to
    carry different translations in different contexts.  Python 2's
    gettext module has no pgettext, so it is reimplemented here: GNU
    gettext stores context-qualified entries keyed as
    msgctxt + '\\x04' (EOT byte) + msgid, so we build that key and look
    it up directly.
    """
    key = msgctxt + '\x04' + message
    # gettext returns the key unchanged when the catalog has no entry;
    # in that case fall back to the untranslated message.
    translation = get_translation().gettext(key)
    return message if translation == key else translation
def intcomma(value):
    """Converts an integer to a string containing commas every three digits.

    For example, 3000 becomes '3,000' and 45000 becomes '45,000'.  To
    maintain some compatability with Django's intcomma, this function
    also accepts floats.  Values that cannot be coerced to a number are
    returned unchanged.
    """
    try:
        if isinstance(value, compat.string_types):
            float(value.replace(',', ''))
        else:
            float(value)
    except (TypeError, ValueError):
        return value
    orig = str(value)
    # Raw strings: "\d" / "\g" are invalid escape sequences in normal
    # string literals and warn on modern Python.  Insert one comma per
    # pass and recurse until no ungrouped run of four digits remains.
    new = re.sub(r"^(-?\d+)(\d{3})", r'\g<1>,\g<2>', orig)
    if orig == new:
        return new
    else:
        return intcomma(new)
def fractional(value):
    '''Return a human readable fractional representation of a number.

    There are cases where one might not want to show ugly decimal places
    for floats and decimals.  Pass in a string, int or float and this
    returns a string of a fraction, a whole number, or a mixed fraction:

        fractional(0.3)   returns '3/10'
        fractional(1.3)   returns '1 3/10'
        fractional(1/3)   returns '1/3'
        fractional(1)     returns '1'

    The fractional part is approximated with a denominator of at most
    1000.  Values that cannot be coerced to float are returned
    unchanged; otherwise the result is always a string.
    '''
    try:
        number = float(value)
    except (TypeError, ValueError):
        return value
    whole_number = int(number)
    frac = Fraction(number - whole_number).limit_denominator(1000)
    # Use the public Fraction API, not the private _numerator /
    # _denominator attributes.
    numerator = frac.numerator
    denominator = frac.denominator
    if whole_number and not numerator and denominator == 1:
        # An integer (or an integral float like 1.0000) was passed in.
        return '%.0f' % whole_number
    elif not whole_number:
        return '%.0f/%.0f' % (numerator, denominator)
    else:
        return '%.0f %.0f/%.0f' % (whole_number, numerator, denominator)

    A tool to turn feeds into h-feeds

    13 |
    14 |
    15 |
    16 |
    17 |
    18 |

    A tool to turn any webpage into mf2 json

    19 |
    20 |
    url:
    21 |
    22 |
    23 |
    24 |
    {{mfjson}}
    25 |
    26 |

    A tool to autolink and embed urls into html

    27 |
    28 |
    29 |
    30 |
    31 |
    32 | {% autoescape false %}
    {{ linkedhtml }}
    {% endautoescape %} 33 |
    34 |
    35 |

    A tool to show indiecards

    36 |
    37 |
    38 |
    39 |
    40 |

    A tool to show storycards

    41 |
    42 |
    43 |
    44 |
    45 |

    A tool to show json as html

    46 |
    47 |
    48 |
    49 |
    50 |

    A tool to extract json from html lists

    51 |
    52 |
    53 |
    54 |
    55 |
    56 |

    A tool to make jf2 from mf2

    57 |
    58 |
    59 |
    60 |
    61 |
    62 |

    mastodon preview

    63 |
    64 |
    65 |
    66 |
    67 |
    68 | 69 | 70 | {% endautoescape %} -------------------------------------------------------------------------------- /indiecard.html: -------------------------------------------------------------------------------- 1 | 2 | {% if item %}{{" ".join(item.properties.name)}}{% else %}Indiecard{% endif %} 3 | 4 | 5 | 6 | 7 | 8 | 9 | 10 |
    11 |
    12 | 13 | 14 |
    15 |
    16 |
    17 | {% for item in items %} 18 |
    19 |

    {% if item.properties.photo %} 20 | 21 | {% elif item.properties.featured %} 22 | 23 | {% endif %} 24 | {{" ".join(item.properties.name)}}

    25 | {% if item.properties.author %} 26 | {% if item.properties.author[0].properties %} 27 |

    {% if item.properties.author[0].properties.photo %}{% endif %}{% if item.properties.author[0].properties.url %}{{item.properties.author[0].properties.name[0]}}{% else %}{{item.properties.author[0].properties.name[0]}}{% endif %}

    28 | {% else %} 29 |

    {{item.properties.author[0]}}

    30 | {% endif %} 31 | {% endif %} 32 | {% if item.properties.summary %} 33 |

    {{" ".join(item.properties.summary)}}

    34 | {% endif %} 35 | {% if item.properties.content %} 36 |

    {{" ".join(item.properties.content.html)}}

    37 | {% endif %} 38 | {% if item.properties.ingredient %} 39 |

    Ingredients

    40 |
      41 | {% for food in item.properties.ingredient %}
    • {{food}}{% endfor %} 42 |
    43 | {% endif %} 44 | {% if item.properties.instructions %} 45 |

    Method

    46 | {% if item.properties.instructions|length ==1 %} 47 | {% autoescape false %} 48 |

    {{item.properties.instructions[0]["html"] or item.properties.instructions[0]}}

    49 | {% endautoescape %} 50 | {% else %} 51 |
      52 | {% autoescape false %} 53 | {% for stage in item.properties.instructions %}
    1. {{stage["html"] or stage}}{% endfor %} 54 | {% endautoescape %} 55 |
    56 | {% endif %} 57 | {% endif %} 58 | {% if item.properties.note %} 59 | {% if item.properties.note[0].html %} 60 | {% autoescape false %} 61 |

    {{item.properties.note[0].html}}

    62 | {% endautoescape %} 63 | {% else %} 64 |

    {{" ".join(item.properties.note)}}

    65 | {% endif %} 66 | {% endif %} 67 |
    68 | {% endfor %} 69 |
    70 |
    71 | {%if items %}
    raw{{items}}
    {% endif %} 72 |
    73 | 74 | -------------------------------------------------------------------------------- /instancelist.html: -------------------------------------------------------------------------------- 1 | 2 | 3 | 4 | 5 | 6 |
    7 | 8 | 9 | {% for instance in instances %} 10 | 11 | {% endfor %} 12 | 13 | 17 | 18 |
    19 | -------------------------------------------------------------------------------- /joyline.svg: -------------------------------------------------------------------------------- 1 | 2 | 3 | {% for line in lines %} 4 | 5 | {% endfor %} 6 | -------------------------------------------------------------------------------- /markedup.html: -------------------------------------------------------------------------------- 1 | 2 | {{name}} 3 | 4 | 5 | 16 | 17 | 18 |
    19 | <div class=h-card ><a class=u-url rel=me 20 |
    href={{url}} > 21 |
    22 |
    23 |

    <img class=u-photo src= 24 |
    />
    25 |
    {{name}}
    26 |
    27 |
    28 | </a></div> 29 |
30 | 31 | -------------------------------------------------------------------------------- /mf2py/.DS_Store: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/kevinmarks/unmung/5b8539971a8e1a64694e65643670936512fc987d/mf2py/.DS_Store -------------------------------------------------------------------------------- /mf2py/__init__.py: -------------------------------------------------------------------------------- 1 | """ 2 | Microformats2 is a general way to mark up any HTML document with 3 | classes and properties. This library parses structured data from 4 | a microformatted HTML document and returns a well-formed JSON 5 | dictionary. 6 | """ 7 | 8 | from .version import __version__ 9 | from .parser import Parser, parse 10 | from .mf_helpers import get_url 11 | 12 | 13 | __all__ = ['Parser', 'parse', 'get_url', '__version__'] 14 | -------------------------------------------------------------------------------- /mf2py/backcompat-rules/adr.json: -------------------------------------------------------------------------------- 1 | { 2 | "type": [ 3 | "h-adr" 4 | ], 5 | "properties": { 6 | "locality": [ 7 | "p-locality" 8 | ], 9 | "region": [ 10 | "p-region" 11 | ], 12 | "extended-address": [ 13 | "p-extended-address" 14 | ], 15 | "post-office-box": [ 16 | "p-post-office-box" 17 | ], 18 | "street-address": [ 19 | "p-street-address" 20 | ], 21 | "postal-code": [ 22 | "p-postal-code" 23 | ], 24 | "country-name": [ 25 | "p-country-name" 26 | ] 27 | } 28 | } -------------------------------------------------------------------------------- /mf2py/backcompat-rules/geo.json: -------------------------------------------------------------------------------- 1 | { 2 | "type": [ 3 | "h-geo" 4 | ], 5 | "properties": { 6 | "latitude": [ 7 | "p-latitude" 8 | ], 9 | "longitude": [ 10 | "p-longitude" 11 | ] 12 | } 13 | } --------------------------------------------------------------------------------
/mf2py/backcompat-rules/hentry.json: -------------------------------------------------------------------------------- 1 | { 2 | "type": [ 3 | "h-entry" 4 | ], 5 | "properties": { 6 | "category": [ 7 | "p-category" 8 | ], 9 | "entry-title": [ 10 | "p-name" 11 | ], 12 | "published": [ 13 | "dt-published" 14 | ], 15 | "latitude": [ 16 | "p-latitude" 17 | ], 18 | "entry-content": [ 19 | "e-content" 20 | ], 21 | "entry-summary": [ 22 | "p-summary" 23 | ], 24 | "author": [ 25 | "p-author", 26 | "h-card" 27 | ], 28 | "geo": [ 29 | "p-geo", 30 | "h-geo" 31 | ], 32 | "updated": [ 33 | "dt-updated" 34 | ], 35 | "longitude": [ 36 | "p-longitude" 37 | ] 38 | }, 39 | "rels": { 40 | "bookmark": [ 41 | "u-url" 42 | ], 43 | "tag": [ 44 | "p-category" 45 | ] 46 | } 47 | } 48 | -------------------------------------------------------------------------------- /mf2py/backcompat-rules/hfeed.json: -------------------------------------------------------------------------------- 1 | { 2 | "type": [ 3 | "h-feed" 4 | ], 5 | "properties": { 6 | "category": [ 7 | "p-category" 8 | ], 9 | "site-description": [ 10 | "p-summary" 11 | ], 12 | "description": [ 13 | "p-summary" 14 | ], 15 | "site-title": [ 16 | "p-name" 17 | ], 18 | "title": [ 19 | "p-name" 20 | ] 21 | }, 22 | "rels": { 23 | "tag": [ 24 | "p-category" 25 | ] 26 | } 27 | } 28 | -------------------------------------------------------------------------------- /mf2py/backcompat-rules/hproduct.json: -------------------------------------------------------------------------------- 1 | { 2 | "type": [ 3 | "h-product" 4 | ], 5 | "properties": { 6 | "category": [ 7 | "p-category" 8 | ], 9 | "price": [ 10 | "p-price" 11 | ], 12 | "description": [ 13 | "p-description" 14 | ], 15 | "url": [ 16 | "u-url" 17 | ], 18 | "photo": [ 19 | "u-photo" 20 | ], 21 | "brand": [ 22 | "p-brand" 23 | ], 24 | "identifier": [ 25 | "u-identifier" 26 | ], 27 | "review": [ 28 | "p-review", 29 | "h-review" 30 | ], 31 | "fn": [ 32 | "p-name" 33 | ] 34 | } 35 | } 36 | 
-------------------------------------------------------------------------------- /mf2py/backcompat-rules/hrecipe.json: -------------------------------------------------------------------------------- 1 | { 2 | "type": [ 3 | "h-recipe" 4 | ], 5 | "properties": { 6 | "nutrition": [ 7 | "p-nutrition" 8 | ], 9 | "yield": [ 10 | "p-yield" 11 | ], 12 | "author": [ 13 | "p-author", 14 | "h-card" 15 | ], 16 | "duration": [ 17 | "dt-duration" 18 | ], 19 | "photo": [ 20 | "u-photo" 21 | ], 22 | "instructions": [ 23 | "e-instructions" 24 | ], 25 | "summary": [ 26 | "p-summary" 27 | ], 28 | "fn": [ 29 | "p-name" 30 | ], 31 | "ingredient": [ 32 | "p-ingredient" 33 | ], 34 | "category": [ 35 | "p-category" 36 | ] 37 | }, 38 | "rels": { 39 | "tag": [ 40 | "p-category" 41 | ] 42 | } 43 | } 44 | -------------------------------------------------------------------------------- /mf2py/backcompat-rules/hresume.json: -------------------------------------------------------------------------------- 1 | { 2 | "type": [ 3 | "h-resume" 4 | ], 5 | "properties": { 6 | "experience": [ 7 | "h-event", 8 | "p-experience" 9 | ], 10 | "summary": [ 11 | "p-summary" 12 | ], 13 | "affiliation": [ 14 | "p-affiliation", 15 | "h-card" 16 | ], 17 | "contact": [ 18 | "h-card", 19 | "p-contact" 20 | ], 21 | "skill": [ 22 | "p-skill" 23 | ], 24 | "education": [ 25 | "h-event", 26 | "p-education" 27 | ] 28 | } 29 | } -------------------------------------------------------------------------------- /mf2py/backcompat-rules/hreview-aggregate.json: -------------------------------------------------------------------------------- 1 | { 2 | "type": [ 3 | "h-review-aggregate" 4 | ], 5 | "properties": { 6 | "rating": [ 7 | "p-rating" 8 | ], 9 | "description": [ 10 | "p-description" 11 | ], 12 | "photo": [ 13 | "u-photo" 14 | ], 15 | "worst": [ 16 | "p-worst" 17 | ], 18 | "reviewer": [ 19 | "p-reviewer", 20 | "p-author", 21 | "h-card" 22 | ], 23 | "best": [ 24 | "p-best" 25 | ], 26 | "count": [ 27 | "p-count" 28 | ], 29 
| "votes": [ 30 | "p-votes" 31 | ], 32 | "dtreviewed": [ 33 | "dt-reviewed" 34 | ], 35 | "url": [ 36 | "u-url" 37 | ], 38 | "summary": [ 39 | "p-name" 40 | ], 41 | "fn": [ 42 | "p-item", 43 | "h-item", 44 | "p-name" 45 | ] 46 | } 47 | } -------------------------------------------------------------------------------- /mf2py/backcompat-rules/hreview.json: -------------------------------------------------------------------------------- 1 | { 2 | "type": [ 3 | "h-review" 4 | ], 5 | "properties": { 6 | "rating": [ 7 | "p-rating" 8 | ], 9 | "worst": [ 10 | "p-worst" 11 | ], 12 | "dtreviewed": [ 13 | "dt-reviewed" 14 | ], 15 | "reviewer": [ 16 | "p-author", 17 | "h-card" 18 | ], 19 | "url": [ 20 | "p-item", 21 | "h-item", 22 | "u-url" 23 | ], 24 | "photo": [ 25 | "p-item", 26 | "h-item", 27 | "u-photo" 28 | ], 29 | "best": [ 30 | "p-best" 31 | ], 32 | "description": [ 33 | "p-description" 34 | ], 35 | "fn": [ 36 | "p-item", 37 | "h-item", 38 | "p-name" 39 | ], 40 | "summary": [ 41 | "p-name" 42 | ], 43 | "item vcard": [ 44 | "p-item", 45 | "vcard" 46 | ], 47 | "item vevent": [ 48 | "p-item", 49 | "vevent" 50 | ], 51 | "item hproduct": [ 52 | "p-item", 53 | "hproduct" 54 | ] 55 | }, 56 | "rels": { 57 | "self bookmark": [ 58 | "u-url" 59 | ], 60 | "tag": [ 61 | "p-category" 62 | ] 63 | } 64 | } 65 | -------------------------------------------------------------------------------- /mf2py/backcompat-rules/recipe-main-info.json: -------------------------------------------------------------------------------- 1 | { 2 | "type": [ 3 | "h-recipe" 4 | ], 5 | "properties": { 6 | "content-title__text": ["p-name"], 7 | "recipe-ingredients__list-item": ["p-ingredient"], 8 | "recipe-metadata__serving": ["p-yield"], 9 | "recipe-method-wrapper": ["e-instructions"], 10 | "recipe-metadata__prep-time": ["p-duration"], 11 | "nutrition": ["p-nutrition"], 12 | "recipe-media__image": ["u-photo"], 13 | "recipe-description__text": ["p-summary"], 14 | "recipe-ingredients__link":["p-category"], 15 | 
"chef": ["p-author", "h-card"], 16 | "chef__image": ["u-photo"], 17 | "chef__link": ["p-name"] 18 | } 19 | 20 | } 21 | -------------------------------------------------------------------------------- /mf2py/backcompat-rules/vcard.json: -------------------------------------------------------------------------------- 1 | { 2 | "type": [ 3 | "h-card" 4 | ], 5 | "properties": { 6 | "tel": [ 7 | "p-tel" 8 | ], 9 | "honorific-suffix": [ 10 | "p-honorific-suffix" 11 | ], 12 | "family-name": [ 13 | "p-family-name" 14 | ], 15 | "photo": [ 16 | "u-photo" 17 | ], 18 | "logo": [ 19 | "u-logo" 20 | ], 21 | "postal-code": [ 22 | "p-postal-code" 23 | ], 24 | "country-name": [ 25 | "p-country-name" 26 | ], 27 | "uid": [ 28 | "u-uid" 29 | ], 30 | "category": [ 31 | "p-category" 32 | ], 33 | "adr": [ 34 | "p-adr", 35 | "h-adr" 36 | ], 37 | "locality": [ 38 | "p-locality" 39 | ], 40 | "nickname": [ 41 | "p-nickname" 42 | ], 43 | "label": [ 44 | "p-label" 45 | ], 46 | "note": [ 47 | "p-note" 48 | ], 49 | "street-address": [ 50 | "p-street-address" 51 | ], 52 | "latitude": [ 53 | "p-latitude" 54 | ], 55 | "email": [ 56 | "u-email" 57 | ], 58 | "bday": [ 59 | "dt-bday" 60 | ], 61 | "extended-address": [ 62 | "p-extended-address" 63 | ], 64 | "additional-name": [ 65 | "p-additional-name" 66 | ], 67 | "organization-unit": [ 68 | "p-organization-unit" 69 | ], 70 | "given-name": [ 71 | "p-given-name" 72 | ], 73 | "key": [ 74 | "u-key" 75 | ], 76 | "org": [ 77 | "p-org" 78 | ], 79 | "honorific-prefix": [ 80 | "p-honorific-prefix" 81 | ], 82 | "geo": [ 83 | "p-geo", 84 | "h-geo" 85 | ], 86 | "fn": [ 87 | "p-name" 88 | ], 89 | "url": [ 90 | "u-url" 91 | ], 92 | "region": [ 93 | "p-region" 94 | ], 95 | "longitude": [ 96 | "p-longitude" 97 | ], 98 | "organization-name": [ 99 | "p-organization-name" 100 | ], 101 | "title": [ 102 | "p-job-title" 103 | ], 104 | "role": [ 105 | "p-role" 106 | ] 107 | } 108 | } 109 | -------------------------------------------------------------------------------- 
/mf2py/backcompat-rules/vevent.json: -------------------------------------------------------------------------------- 1 | { 2 | "type": [ 3 | "h-event" 4 | ], 5 | "properties": { 6 | "attendee": [ 7 | "p-attendee" 8 | ], 9 | "description": [ 10 | "p-description" 11 | ], 12 | "duration": [ 13 | "dt-duration" 14 | ], 15 | "dtend": [ 16 | "dt-end" 17 | ], 18 | "dtstart": [ 19 | "dt-start" 20 | ], 21 | "geo": [ 22 | "p-location h-geo" 23 | ], 24 | "organizer": [ 25 | "p-organizer" 26 | ], 27 | "category": [ 28 | "p-category" 29 | ], 30 | "url": [ 31 | "u-url" 32 | ], 33 | "summary": [ 34 | "p-name" 35 | ], 36 | "contact": [ 37 | "p-contact" 38 | ], 39 | "location": [ 40 | "p-location" 41 | ] 42 | } 43 | } -------------------------------------------------------------------------------- /mf2py/datetime_helpers.py: -------------------------------------------------------------------------------- 1 | '''helper functions to deal wit datetime strings''' 2 | from __future__ import unicode_literals, print_function 3 | 4 | import re 5 | from datetime import datetime 6 | 7 | # REGEX! 8 | 9 | DATE_RE = r'(\d{4}-\d{2}-\d{2})|(\d{4}-\d{3})' 10 | SEC_RE = r'(:(?P\d{2})(\.\d+)?)' 11 | RAWTIME_RE = r'(?P\d{1,2})(:(?P\d{2})%s?)?' % (SEC_RE) 12 | AMPM_RE = r'am|pm|a\.m\.|p\.m\.|AM|PM|A\.M\.|P\.M\.' 13 | TIMEZONE_RE = r'Z|[+-]\d{1,2}:?\d{2}?' 14 | TIME_RE = (r'(?P%s)( ?(?P%s))?( ?(?P%s))?' % 15 | (RAWTIME_RE, AMPM_RE, TIMEZONE_RE)) 16 | DATETIME_RE = (r'(?P%s)(?P[T ])(?P