├── .gitignore
├── .travis.yml
├── LICENSE.txt
├── MANIFEST
├── README.rst
├── extractcontent3
    ├── __init__.py
    └── extractcontent3.py
├── setup.py
└── tests
    ├── __init__.py
    ├── blog.html
    └── test_extractcontent3.py


/.gitignore:
--------------------------------------------------------------------------------
1 | *.pyc
2 | build/
3 | dist/
4 | 
5 | *.*~
6 | .python-version


--------------------------------------------------------------------------------
/.travis.yml:
--------------------------------------------------------------------------------
1 | language: python
2 | python:
3 |   - "3.6"
4 |   - "nightly"
5 | script:
6 |   - pytest
7 | 


--------------------------------------------------------------------------------
/LICENSE.txt:
--------------------------------------------------------------------------------
 1 | Copyright (c) 2007, Cybozu Labs Inc.
 2 | All rights reserved.
 3 | 
 4 | Redistribution and use in source and binary forms, with or without
 5 | modification, are permitted provided that the following conditions are met:
 6 | 
 7 | 1. Redistributions of source code must retain the above copyright notice,
 8 |    this list of conditions and the following disclaimer.
 9 | 2. Redistributions in binary form must reproduce the above copyright notice,
10 |    this list of conditions and the following disclaimer in the documentation
11 |    and/or other materials provided with the distribution.
12 | 
13 | THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" AND
14 | ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED
15 | WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
16 | DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE LIABLE FOR
17 | ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES
18 | (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES;
19 | LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND
20 | ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
21 | (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
22 | SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
23 | 
24 | The views and conclusions contained in the software and documentation are those
25 | of the authors and should not be interpreted as representing official policies,
26 | either expressed or implied, of the FreeBSD Project.
27 | 


--------------------------------------------------------------------------------
/MANIFEST:
--------------------------------------------------------------------------------
1 | include *.txt
2 | recursive-include extractcontent3 *.txt *.py
3 | 


--------------------------------------------------------------------------------
/README.rst:
--------------------------------------------------------------------------------
 1 | ExtractContent3
 2 | ===============
 3 | 
 4 | .. image:: https://img.shields.io/pypi/v/extractcontent3.svg
 5 |     :target: https://pypi.python.org/pypi/extractcontent3
 6 | 
 7 | .. image:: https://img.shields.io/pypi/l/extractcontent3.svg
 8 |     :target: https://pypi.python.org/pypi/extractcontent3
 9 | 
10 | .. image:: https://img.shields.io/pypi/pyversions/extractcontent3.svg
11 |     :target: https://pypi.python.org/pypi/extractcontent3
12 | 
13 | .. image:: https://travis-ci.org/kanjirz50/python-extractcontent3.svg?branch=master
14 |     :target: https://travis-ci.org/kanjirz50/python-extractcontent3
15 | 
16 | ExtractContent3はPython3で動作する、HTMLから本文を抽出するモジュールです。
 17 | このモジュールは、ExtractContent RubyモジュールをPython用に書き直したpython-extractcontentを改造したものです。
18 | 
19 | Usage
20 | ------------
21 | 
22 | .. code-block:: python
23 | 
24 |    from extractcontent3 import ExtractContent
25 |    extractor = ExtractContent()
26 | 
27 |    # オプション値を指定する
28 |    opt = {"threshold":50}
29 |    extractor.set_option(opt)
30 | 
31 |    html = open("index.html").read() # 解析対象HTML
32 |    extractor.analyse(html)
33 |    text, title = extractor.as_text()
 34 |    body_html, title = extractor.as_html()
35 |    title = extractor.extract_title(html)
36 | 
37 | Installation
38 | ------------
39 | 
40 | .. code-block:: bash
41 | 
42 |    # pypi
43 |    $ pip install extractcontent3
44 |    
45 |    # Githubからのインストール
46 |    $ pip install git+https://github.com/kanjirz50/python-extractcontent3
47 | 
48 | Option
49 | -------------
50 | 
51 | .. code-block:: python
52 | 
53 |    """
54 |    オプションの種類:
55 |    名称 / デフォルト値
56 |    
57 |    threshold / 100
58 |    本文と見なすスコアの閾値
59 | 
60 |    min_length / 80
61 |    評価を行うブロック長の最小値
62 | 
63 |    decay_factor / 0.73
64 |    減衰係数
65 |    小さいほど先頭に近いブロックのスコアが高くなります
66 | 
67 |    continuous_factor / 1.62
68 |    連続ブロック係数
69 |    大きいほどブロックを連続と判定しにくくなる
70 | 
71 |    punctuation_weight / 10
72 |    句読点に対するスコア　
73 |    大きいほど句読点が存在するブロックを本文と判定しやすくなる
74 | 
 75 |    punctuations / r"(?is)([\u3001\u3002\uff01\uff0c\uff0e\uff1f]|\.[^A-Za-z0-9]|,[^0-9]|!|\?)"
76 |    句読点を抽出する正規表現
77 |     
78 |    waste_expressions / r"(?i)Copyright|All Rights Reserved"
79 |    フッターに含まれる特徴的なキーワードを指定した正規表現
80 | 
81 |    debug / False
 82 |    Trueの場合、ブロック情報を出力
83 |    """
84 | 
85 | 謝辞
86 | ----
87 | 
88 | オリジナル版の作成者やForkで改良を加えた方々に感謝します。
89 | 
90 | - Copyright of the original implementation:: (c)2007/2008/2009 Nakatani Shuyo / Cybozu labs Inc. All rights reserved
91 |   - http://rubyforge.org/projects/extractcontent/
92 |   - http://labs.cybozu.co.jp/blog/nakatani/2007/09/web_1.html
93 | - https://github.com/petitviolet/python-extractcontent
94 | - https://github.com/yono/python-extractcontent
95 | 


--------------------------------------------------------------------------------
/extractcontent3/__init__.py:
--------------------------------------------------------------------------------
1 | from .extractcontent3 import ExtractContent
2 | 


--------------------------------------------------------------------------------
/extractcontent3/extractcontent3.py:
--------------------------------------------------------------------------------
  1 | #!/usr/bin/env python
  2 | 
  3 | import re
  4 | import unicodedata
  5 | from functools import reduce
  6 | 
  7 | 
  8 | class ExtractContent(object):
  9 | 
 10 |     # convert character to entity references
 11 |     CHARREF = {
 12 |         "nbsp": " ",
 13 |         "lt": "<",
 14 |         "gt": "<",
 15 |         "amp": "&",
 16 |         "laquo": "\x00\xab",
 17 |         "raquo": "\x00\xbb",
 18 |     }
 19 | 
 20 |     # Default option parameters.
 21 |     option = {
 22 |         "threshold": 100,
 23 |         # threshold for score of the text
 24 |         "min_length": 80,
 25 |         # minimum length of evaluated blocks
 26 |         "decay_factor": 0.73,
 27 |         # decay factor for block score
 28 |         "continuous_factor": 1.62,
 29 |         # continuous factor for block score
 30 |         # ( the larger, the harder to continue )
 31 |         "punctuation_weight": 10,
 32 |         # score weight for punctuations
 33 |         "punctuations": (r"(?is)([\u3001\u3002\uff01\uff0c\uff0e\uff1f]"
 34 |                          r"|\.[^A-Za-z0-9]|,[^0-9]|!|\?)"),
 35 |         # punctuation characters
 36 |         "waste_expressions": r"(?i)Copyright|All Rights Reserved",
 37 |         # characteristic keywords including footer
 38 |         "debug": False,
 39 |         # if true, output block information to stdout
 40 |     }
 41 | 
 42 |     def __init__(self, opt=None):
 43 |         if opt is not None:
 44 |             self.option.update(opt)
 45 |         self.title = ''
 46 |         self.body = ''
 47 | 
 48 |     def set_option(self, opt):
 49 |         """
 50 |         Sets option parameters to default.
 51 |         Parameter opt is given as Dictionary.
 52 |         """
 53 |         self.option.update(opt)
 54 | 
 55 |     def analyse(self, html, opt=None):
 56 |         """
 57 |         Analyses the given HTML text, extracts body and title.
 58 |         """
 59 |         # flameset or redirect
 60 |         if re.search((r"(?i)<\/frameset>|<meta\s+http-equiv\s*=\s*"
 61 |                       r"[\"']?refresh['\"]?[^>]*url"), html) is not None:
 62 |             return ["", self.extract_title(html)]
 63 | 
 64 |         # option parameters
 65 |         if opt:
 66 |             self.option.update(opt)
 67 | 
 68 |         # header & title
 69 |         header = re.match(r"(?s)</head\s*>", html)
 70 |         if header is not None:
 71 |             html = html[:header.end()]
 72 |             self.title = self.extract_title(html[0:header.start()])
 73 |         else:
 74 |             self.title = self.extract_title(html)
 75 | 
 76 |         # Google AdSense Section Target
 77 |         html = re.sub((r"(?is)<!--\s*google_ad_section_start\(weight="
 78 |                        r"ignore\)\s*-->.*?<!--\s*google_ad_section_end.*?-->"),
 79 |                       "", html)
 80 |         if re.search(r"(?is)<!--\s*google_ad_section_start[^>]*-->",
 81 |                      html) is not None:
 82 |             result = re.findall((r"(?is)<!--\s*google_ad_section_start"
 83 |                                  r"[^>]*-->.*?<!--\s*google_ad_section_end.*?-->"),
 84 |                                 html)
 85 |             html = "\n".join(result)
 86 | 
 87 |         # eliminate useless text
 88 |         html = self._eliminate_useless_tags(html)
 89 | 
 90 |         # heading tags including title
 91 |         # self.title = title
 92 |         html = re.sub(r"(?s)(<h\d\s*>\s*(.*?)\s*</h\d\s*>)",
 93 |                       self._estimate_title, html)
 94 | 
 95 |         # extract text blocks
 96 |         factor = 1.0
 97 |         continuous = 1.0
 98 |         body = ''
 99 |         score = 0
100 |         bodylist = []
101 |         block_list = self._split_to_blocks(html)
102 |         for block in block_list:
103 |             if self._has_only_tags(block):
104 |                 continue
105 | 
106 |             if len(body) > 0:
107 |                 continuous /= self.option["continuous_factor"]
108 | 
109 |             # ignore link list block
110 |             notlinked = self._eliminate_link(block)
111 |             if len(notlinked) < self.option["min_length"]:
112 |                 continue
113 | 
114 |             # calculate score of block
115 |             c = (len(notlinked) + self._count_pattern(notlinked, self.option["punctuations"]) * self.option["punctuation_weight"]) * factor
116 |             factor *= self.option["decay_factor"]
117 |             not_body_rate = self._count_pattern(block, self.option["waste_expressions"]) + self._count_pattern(block, r"amazon[a-z0-9\.\/\-\?&]+-22") / 2.0
118 |             if not_body_rate > 0:
119 |                 c *= (0.72 ** not_body_rate)
120 |             c1 = c * continuous
121 |             if self.option["debug"]:
122 |                 print("----- %f*%f=%f %d \n%s" % (c, continuous, c1, len(notlinked),
123 |                                                   self._strip_tags(block)[0:100]))
124 | 
125 |             # tread continuous blocks as cluster
126 |             if c1 > self.option["threshold"]:
127 |                 body += block + "\n"
128 |                 score += c1
129 |                 continuous = self.option["continuous_factor"]
130 |             elif c > self.option["threshold"]:  # continuous block end
131 |                 bodylist.append((body, score))
132 |                 body = block + "\n"
133 |                 score = c
134 |                 continuous = self.option["continuous_factor"]
135 | 
136 |         bodylist.append((body, score))
137 |         body = reduce(lambda x, y: x if x[1] >= y[1] else y, bodylist)
138 |         self.body = body[0]
139 |         return self.as_text()
140 | 
141 |     def as_html(self):
142 |         return (self.body, self.title)
143 | 
144 |     def as_text(self):
145 |         return (self._strip_tags(self.body), self.title)
146 | 
147 |     def extract_title(self, st):
148 |         result = re.search(r"(?s)<title[^>]*>\s*(.*?)\s*</title\s*>", st)
149 |         if result is not None:
150 |             return self._strip_tags(result.group(0))
151 |         else:
152 |             return ""
153 | 
154 |     def _split_to_blocks(self, html):
155 |         block_list = \
156 |             re.split((r"</?(?:div|center|td)[^>]*>|<p\s*[^>]*class\s*=\s*"
157 |                       r"[\"']?(?:posted|plugin-\w+)['\"]?[^>]*>"), html)
158 |         return block_list
159 | 
160 |     # Count a pattern from text.
161 |     def _count_pattern(self, text, pattern):
162 |         result = re.search(pattern, text)
163 |         if result is None:
164 |             return 0
165 |         else:
166 |             return len(result.span())
167 | 
168 |     def _estimate_title(self, match):
169 |         """
170 |         h? タグの記述がタイトルと同じかどうか調べる
171 |         """
172 |         striped = self._strip_tags(match.group(2))
173 |         if len(striped) >= 3 and self.title.find(striped) != -1:
174 |             return "<div>%s</div>" % (striped)
175 |         else:
176 |             return match.group(1)
177 | 
178 |     def _eliminate_useless_tags(self, html):
179 |         """
180 |         Eliminates useless tags
181 |         """
182 |         # Eliminate useless symbols
183 |         html = re.sub(r"[\u2018-\u201d\u2190-\u2193\u25a0-\u25bd\u25c6-\u25ef\u2605-\u2606]", "", html)
184 |         # Eliminate useless html tags
185 |         html = \
186 |             re.sub(r"(?is)<(script|style|select|noscript)[^>]*>.*?</\1\s*>",
187 |                    "", html)
188 |         html = re.sub(r"(?s)<!--.*?-->", "", html)
189 |         html = re.sub(r"<![A-Za-z].*?>/s", "", html)
190 |         html = re.sub((r"(?s)<div\s[^>]*class\s*=\s*['\"]?alpslab-slide"
191 |                        r"[\"']?[^>]*>.*?</div\s*>"), "", html)
192 |         html = re.sub((r"(?is)<div\s[^>]*(id|class)\s*=\s*['\"]"
193 |                        r"?\S*more\S*[\"']?[^>]*>"), "", html)
194 |         return html
195 | 
196 |     def _has_only_tags(self, st):
197 |         """
198 |         Checks if the given block has only tags without text.
199 |         """
200 |         st = re.sub(r"(?is)<[^>]*>", "", st)
201 |         st = re.sub(r"&nbsp;", "", st)
202 |         st = st.strip()
203 |         return len(st) == 0
204 | 
205 |     def _eliminate_link(self, html):
206 |         """
207 |         eliminate link tags
208 |         """
209 |         count = 0
210 |         notlinked, count = re.subn(r"(?is)<a\s[^>]*>.*?<\/a\s*>", "", html)
211 |         notlinked = re.sub(r"(?is)<form\s[^>]*>.*?</form\s*>", "", notlinked)
212 |         notlinked = self._strip_tags(notlinked)
213 |         # returns empty string when html contains many links or list of links
214 |         if (len(notlinked) < 20 * count) or (self._islinklist(html)):
215 |             return ""
216 |         return notlinked
217 | 
218 |     def _islinklist(self, st):
219 |         """
220 |         determines whether a block is link list or not
221 |         """
222 |         result = re.search(r"(?is)<(?:ul|dl|ol)(.+?)</(?:ul|dl|ol)>", st)
223 |         if result is not None:
224 |             listpart = result.group(1)
225 |             outside = re.sub(r"(?is)<(?:ul|dl)(.+?)</(?:ul|dl)>", "", st)
226 |             outside = re.sub(r"(?is)<.+?>", "", outside)
227 |             outside = re.sub(r"\s+", "", outside)
228 |             list = re.split(r"<li[^>]*>", listpart)
229 |             rate = self._evaluate_list(list)
230 |             return len(outside) <= len(st) / (45 / rate)
231 |         return False
232 | 
233 |     def _evaluate_list(self, list):
234 |         """
235 |         estimates how much degree of link list
236 |         """
237 |         if len(list) == 0:
238 |             return 1
239 |         hit = 0
240 |         href = re.compile("<a\s+href=(['\"]?)([^\"'\s]+)\1", re.I | re.S)
241 |         for line in list:
242 |             if href.search(line) is not None:
243 |                 hit += 1
244 |         return 9 * (1.0 * hit / len(list)) ** 2 + 1
245 | 
246 |     def _strip_tags(self, html):
247 |         """
248 |         Strips tags from html.
249 |         """
250 |         st = re.sub(r"(?s)<.+?>", "", html)
251 |         # Convert from wide character to ascii
252 |         if st and type(st) != str:
253 |             st = unicodedata.normalize("NFKC", st)
254 |         st = re.sub(r"[\u2500-\u253f\u2540-\u257f]", "", st)  # 罫線(keisen)
255 |         st = re.sub(r"&(.*?);", lambda x: self.CHARREF.get(x.group(1),
256 |                                                            x.group()), st)
257 |         st = re.sub(r"[ \t]+", " ", st)
258 |         st = re.sub(r"\n\s*", "\n", st)
259 |         return st
260 | 
261 | if __name__ == "__main__":
262 |     pass
263 | 


--------------------------------------------------------------------------------
/setup.py:
--------------------------------------------------------------------------------
 1 | from setuptools import setup, find_packages
 2 | from codecs import open
 3 | from os import path
 4 | 
 5 | here = path.abspath(path.dirname(__file__))
 6 | 
 7 | with open(path.join(here, "README.rst"), encoding="utf-8") as f:
 8 |     long_description = f.read()
 9 | 
10 | setup(
11 |     name="extractcontent3",
12 |     version="0.0.1",
13 |     description="",
14 |     long_description=long_description,
15 |     license="BSD 2-Clause",
16 |     url="https://github.com/kanjirz50/python-extractcontent3",
17 |     packages=find_packages(exclude=["contrib", "docs", "tests"]),
18 |     install_requires=[],
19 |     dependency_links=[],
20 |     python_requires='~=3.3',
21 | )
22 | 


--------------------------------------------------------------------------------
/tests/__init__.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/kanjirz50/python-extractcontent3/52c16984957c57f53d679f34b9d068cbefb5dd6a/tests/__init__.py


--------------------------------------------------------------------------------
/tests/blog.html:
--------------------------------------------------------------------------------
   1 | <!DOCTYPE html>
   2 | <!-- saved from url=(0049)http://kanji.hatenablog.jp/entry/python-xonsh-try -->
   3 | <html lang="ja" data-admin-domain="//blog.hatena.ne.jp" data-author="kanjirz50" data-avail-langs="ja en" data-blog="kanji.hatenablog.jp" data-blog-host="kanji.hatenablog.jp" data-blog-is-public="1" data-blog-name="かんちゃんの備忘録" data-blog-owner="kanjirz50" data-blog-uri="http://kanji.hatenablog.jp/" data-blog-uuid="10328749687186964311" data-blogs-uri-base="http://kanji.hatenablog.jp" data-brand="hatenablog" data-data-layer="{&quot;hatenablog&quot;:{&quot;admin&quot;:{},&quot;pro&quot;:&quot;free&quot;,&quot;page_id&quot;:&quot;entry&quot;,&quot;blog&quot;:{&quot;lang&quot;:&quot;ja&quot;,&quot;disable_ads&quot;:&quot;&quot;,&quot;enable_ads&quot;:&quot;true&quot;,&quot;name&quot;:&quot;\u304b\u3093\u3061\u3083\u3093\u306e\u5099\u5fd8\u9332&quot;,&quot;is_public&quot;:&quot;true&quot;,&quot;uri&quot;:&quot;http://kanji.hatenablog.jp/&quot;,&quot;is_sleeping&quot;:&quot;false&quot;,&quot;force_pc_view&quot;:&quot;false&quot;,&quot;entry_show_footer_related_entries&quot;:&quot;true&quot;,&quot;is_responsive_view&quot;:&quot;false&quot;,&quot;content_seems_japanese&quot;:&quot;true&quot;,&quot;enable_keyword_link&quot;:&quot;true&quot;,&quot;owner_name&quot;:&quot;kanjirz50&quot;},&quot;brand&quot;:&quot;hatenablog&quot;,&quot;analytics&quot;:{&quot;property_id&quot;:&quot;UA-84894610-3&quot;,&quot;non_sampling_property_id&quot;:&quot;&quot;,&quot;brand_property_id&quot;:&quot;&quot;,&quot;separated_property_id&quot;:&quot;UA-29716941-24&quot;},&quot;brand_tracking_category&quot;:&quot;hatenablog&quot;,&quot;permalink_entry&quot;:{&quot;hour&quot;:&quot;0&quot;,&quot;author_name&quot;:&quot;kanjirz50&quot;,&quot;date&quot;:&quot;2017-12-13&quot;,&quot;categories&quot;:&quot;&quot;,&quot;title&quot;:&quot;Xonsh\u3092\u4f7f\u3063\u3066\u307f\u305f&quot;,&quot;uri&quot;:&quot;http://kanji.hatenablog.jp/entry/python-xonsh-try&quot;},&quot;router_type&quot;:&quot;blogs&quot;}}" data-device="pc" data-dont-recommend-pro="false" data-globalheader-color="b" 
data-globalheader-type="pc" data-has-touch-view="1" data-page="entry" data-plus-available="" data-pro="false" data-router-type="blogs" data-static-domain="https://cdn.blog.st-hatena.com" data-version="b52004788defb2dcbf07a5cc7c17e1d8" itemscope="" itemtype="http://schema.org/Article" data-initial-state="{}"><head prefix="og: http://ogp.me/ns# fb: http://ogp.me/ns/fb# article: http://ogp.me/ns/article#"><meta http-equiv="Content-Type" content="text/html; charset=UTF-8"><script src="./blog_files/1733466696949178" async=""></script><script async="" src="./blog_files/fbevents.js.ダウンロード"></script><script async="" src="./blog_files/uwt.js.ダウンロード"></script><script type="text/javascript" async="" src="./blog_files/segmentation.js.ダウンロード"></script><script type="text/javascript" async="" src="./blog_files/pageviews"></script><script type="text/javascript" async="" src="./blog_files/segment"></script><script async="" src="./blog_files/tdim-0.11.2.js.ダウンロード"></script><script type="text/javascript" async="" src="./blog_files/conversion_async.js.ダウンロード"></script><script type="text/javascript" async="" src="./blog_files/conversion_async.js.ダウンロード"></script><script type="text/javascript" async="" src="./blog_files/conversion_async.js.ダウンロード"></script><script type="text/javascript" async="" src="./blog_files/conversion_async.js.ダウンロード"></script><script async="" src="./blog_files/gtm.js.ダウンロード"></script><script src="./blog_files/osd.js.ダウンロード"></script><script src="./blog_files/pubads_impl_rendering_177.js.ダウンロード"></script><script src="./blog_files/ads"></script><script type="text/javascript" src="./blog_files/us" async="" defer=""></script><script async="" type="text/javascript" src="./blog_files/dfp.config.json"></script><script type="text/javascript" async="" src="./blog_files/td.min.js.ダウンロード"></script><script type="text/javascript" async="" src="./blog_files/recaptcha__ja.js.ダウンロード"></script>
   4 |   
   5 |   <meta name="viewport" content="width=device-width, initial-scale=1.0">
   6 | 
   7 | 
   8 |   
   9 | 
  10 | 
  11 | 
  12 |   
  13 | 
  14 | 
  15 |   
  16 |   <meta http-equiv="X-UA-Compatible" content="IE=7; IE=9; IE=10; IE=11">
  17 |   <title>Xonshを使ってみた - かんちゃんの備忘録</title>
  18 | 
  19 |   
  20 |   <link rel="canonical" href="http://kanji.hatenablog.jp/entry/python-xonsh-try">
  21 | 
  22 | 
  23 | 
  24 |   
  25 |   
  26 | 
  27 | <meta itemprop="name" content="Xonshを使ってみた - かんちゃんの備忘録">
  28 | 
  29 |   <meta itemprop="image" content="https://cdn.blog.st-hatena.com/images/theme/og-image-1500.png">
  30 | 
  31 | 
  32 |   <meta property="og:title" content="Xonshを使ってみた - かんちゃんの備忘録">
  33 | <meta property="og:type" content="article">
  34 |   <meta property="og:url" content="http://kanji.hatenablog.jp/entry/python-xonsh-try">
  35 | 
  36 |   
  37 |   
  38 |   
  39 |   <meta property="og:image" content="https://cdn.blog.st-hatena.com/images/theme/og-image-1500.png">
  40 | 
  41 |     <meta property="og:description" content="【Xonsh Advent Calendar 2017の13日目の記事です。】 Xonshがいいという話を聞いて、これは使ってみないと！と思い使ってみました。 今良いんですよXonshが https://t.co/zSU1i0yxPo— ばんくし (@vaaaaanquish) 2017年11月24日 その備忘録です。">
  42 | <meta property="og:site_name" content="かんちゃんの備忘録">
  43 | 
  44 |   <meta property="article:published_time" content="1513090800">
  45 | 
  46 |       <meta name="twitter:card" content="summary">  <meta name="twitter:title" content="Xonshを使ってみた - かんちゃんの備忘録">    <meta name="twitter:description" content="【Xonsh Advent Calendar 2017の13日目の記事です。】 Xonshがいいという話を聞いて、これは使ってみないと！と思い使ってみました。 今良いんですよXonshが https://t.co/zSU1i0yxPo— ばんくし (@vaaaaanquish) 2017年11月24日 その備忘録です。">  <meta name="twitter:app:name:iphone" content="はてなブログアプリ">
  47 |   <meta name="twitter:app:id:iphone" content="583299321">
  48 |   <meta name="twitter:app:url:iphone" content="hatenablog:///open?uri=http%3A%2F%2Fkanji.hatenablog.jp%2Fentry%2Fpython-xonsh-try">  <meta name="twitter:site" content="@kanji250tr">
  49 |   
  50 |     <meta name="description" content="【Xonsh Advent Calendar 2017の13日目の記事です。】 Xonshがいいという話を聞いて、これは使ってみないと！と思い使ってみました。 今良いんですよXonshが https://t.co/zSU1i0yxPo— ばんくし (@vaaaaanquish) 2017年11月24日 その備忘録です。">
  51 | 
  52 |   
  53 | <script async="" type="text/javascript" src="./blog_files/us0"></script><script async="" type="text/javascript" src="./blog_files/td_htn_access.js.ダウンロード"></script><script async="" type="text/javascript" src="./blog_files/hatena_bigmining.js.ダウンロード"></script><script async="" type="text/javascript" src="./blog_files/user.segment.json"></script><script id="facebook-jssdk" src="./blog_files/sdk.js.ダウンロード"></script><script async="" type="text/javascript" src="./blog_files/gpt.js.ダウンロード"></script><script async="" type="text/javascript" src="./blog_files/audience"></script><script async="" src="./blog_files/apstag.js.ダウンロード"></script><script async="" type="text/javascript" src="./blog_files/jstag"></script><script type="text/javascript" async="" src="./blog_files/analytics.js.ダウンロード"></script><script async="" src="./blog_files/gtm.js(1).ダウンロード"></script><script id="embed-gtm-data-layer-loader" data-data-layer-page-specific="{&quot;hatenablog&quot;:{&quot;blogs_permalink&quot;:{&quot;is_blog_sleeping&quot;:&quot;false&quot;,&quot;blog_hide_afc_func&quot;:&quot;false&quot;,&quot;has_related_entries_with_elasticsearch&quot;:&quot;true&quot;,&quot;is_author_pro&quot;:&quot;false&quot;,&quot;blog_struct_hide_afc&quot;:&quot;false&quot;,&quot;blog_afc_issued&quot;:&quot;false&quot;,&quot;brand_hide_afc&quot;:&quot;false&quot;,&quot;entry_afc_issued&quot;:&quot;false&quot;,&quot;blog_hide_afc_field&quot;:&quot;false&quot;}}}">
  54 | (function() {
  55 |   function loadDataLayer(elem, attrName) {
  56 |     if (!elem) { return {}; }
  57 |     var json = elem.getAttribute(attrName);
  58 |     if (!json) { return {}; }
  59 |     return JSON.parse(json);
  60 |   }
  61 | 
  62 |   var globalVariables = loadDataLayer(
  63 |     document.documentElement,
  64 |     'data-data-layer'
  65 |   );
  66 |   var pageSpecificVariables = loadDataLayer(
  67 |     document.getElementById('embed-gtm-data-layer-loader'),
  68 |     'data-data-layer-page-specific'
  69 |   );
  70 | 
  71 |   var variables = [globalVariables, pageSpecificVariables];
  72 | 
  73 |   if (!window.dataLayer) {
  74 |     window.dataLayer = [];
  75 |   }
  76 | 
  77 |   for (var i = 0; i < variables.length; i++) {
  78 |     window.dataLayer.push(variables[i]);
  79 |   }
  80 | })();
  81 | </script>
  82 | <!-- Google Tag Manager -->
  83 | <script>(function(w,d,s,l,i){w[l]=w[l]||[];w[l].push({'gtm.start':
  84 | new Date().getTime(),event:'gtm.js'});var f=d.getElementsByTagName(s)[0],
  85 | j=d.createElement(s),dl=l!='dataLayer'?'&l='+l:'';j.async=true;j.src=
  86 | 'https://www.googletagmanager.com/gtm.js?id='+i+dl;f.parentNode.insertBefore(j,f);
  87 | })(window,document,'script','dataLayer','GTM-P4CXTW');</script>
  88 | <!-- End Google Tag Manager -->
  89 | 
  90 | 
  91 | 
  92 | 
  93 | 
  94 |   <link rel="shortcut icon" href="https://cdn.image.st-hatena.com/image/favicon/4f23891aec1d7abeaf50a63cf8ddbb362f3b72fc/version=1/https%3A%2F%2Fcdn.user.blog.st-hatena.com%2Fcustom_blog_icon%2F125871161%2F1514187551722936">
  95 | <link rel="icon" sizes="192x192" href="https://cdn.image.st-hatena.com/image/square/2e298f76002d94f9aca8ec019d02f87e89b32def/backend=imagemagick;height=192;version=1;width=192/https%3A%2F%2Fcdn.user.blog.st-hatena.com%2Fcustom_blog_icon%2F125871161%2F1514187551722936">
  96 | 
  97 |   
  98 | <link rel="alternate" type="application/atom+xml" title="Atom" href="http://kanji.hatenablog.jp/feed">
  99 | <link rel="alternate" type="application/rss+xml" title="RSS2.0" href="http://kanji.hatenablog.jp/rss">
 100 | <link rel="alternate" type="application/json+oembed" href="http://hatenablog.com/oembed?url=http%3A%2F%2Fkanji.hatenablog.jp%2Fentry%2Fpython-xonsh-try&amp;format=json" title="oEmbed Profile of Xonshを使ってみた">
 101 | <link rel="alternate" type="text/xml+oembed" href="http://hatenablog.com/oembed?url=http%3A%2F%2Fkanji.hatenablog.jp%2Fentry%2Fpython-xonsh-try&amp;format=xml" title="oEmbed Profile of Xonshを使ってみた">
 102 |   
 103 |   <link rel="author" href="http://www.hatena.ne.jp/kanjirz50/">
 104 | 
 105 | 
 106 |   
 107 |     <link rel="stylesheet" type="text/css" href="./blog_files/blog.css">
 108 | 
 109 |     
 110 |   <link rel="stylesheet" type="text/css" href="./blog_files/dc6b706a8274b06f4b0e52865bf98baa1d886e43">
 111 |   
 112 | 
 113 |   
 114 | 
 115 |   
 116 | <script> </script>
 117 | 
 118 |   
 119 | <style>
 120 |   div#google_afc_user,
 121 |   div.google-afc-user-container,
 122 |   div.google_afc_image,
 123 |   div.google_afc_blocklink {
 124 |       display: block !important;
 125 |   }
 126 | </style>
 127 | 
 128 | 
 129 |   
 130 | <script type="text/javascript" charset="utf-8" async="" src="./blog_files/button.df1da1fef194d8f8f3fd803a219a8177.js.ダウンロード"></script><script type="text/javascript" charset="utf-8" async="" src="./blog_files/tweet.05b3387999ca4bf3e9bd50ecbb81d2b3.js.ダウンロード"></script><link rel="preload" href="./blog_files/integrator.js.ダウンロード" as="script"><script type="text/javascript" src="./blog_files/integrator.js.ダウンロード"></script><link rel="preload" href="./blog_files/integrator.js(1).ダウンロード" as="script"><script type="text/javascript" src="./blog_files/integrator.js(1).ダウンロード"></script><script src="./blog_files/pubads_impl_177.js.ダウンロード" async=""></script><script src="./blog_files/entries.json" type="text/javascript"></script><style type="text/css">.fb_hidden{position:absolute;top:-10000px;z-index:10001}.fb_reposition{overflow:hidden;position:relative}.fb_invisible{display:none}.fb_reset{background:none;border:0;border-spacing:0;color:#000;cursor:auto;direction:ltr;font-family:"lucida grande", tahoma, verdana, arial, "hiragino kaku gothic pro",meiryo,"ms pgothic",sans-serif;font-size:11px;font-style:normal;font-variant:normal;font-weight:normal;letter-spacing:normal;line-height:1;margin:0;overflow:visible;padding:0;text-align:left;text-decoration:none;text-indent:0;text-shadow:none;text-transform:none;visibility:visible;white-space:normal;word-spacing:normal}.fb_reset>div{overflow:hidden}.fb_link img{border:none}@keyframes fb_transform{from{opacity:0;transform:scale(.95)}to{opacity:1;transform:scale(1)}}.fb_animate{animation:fb_transform .3s forwards}
 131 | .fb_dialog{background:rgba(82, 82, 82, .7);position:absolute;top:-10000px;z-index:10001}.fb_reset .fb_dialog_legacy{overflow:visible}.fb_dialog_advanced{padding:10px;-moz-border-radius:8px;-webkit-border-radius:8px;border-radius:8px}.fb_dialog_content{background:#fff;color:#333}.fb_dialog_close_icon{background:url(https://static.xx.fbcdn.net/rsrc.php/v3/yq/r/IE9JII6Z1Ys.png) no-repeat scroll 0 0 transparent;cursor:pointer;display:block;height:15px;position:absolute;right:18px;top:17px;width:15px}.fb_dialog_mobile .fb_dialog_close_icon{top:5px;left:5px;right:auto}.fb_dialog_padding{background-color:transparent;position:absolute;width:1px;z-index:-1}.fb_dialog_close_icon:hover{background:url(https://static.xx.fbcdn.net/rsrc.php/v3/yq/r/IE9JII6Z1Ys.png) no-repeat scroll 0 -15px transparent}.fb_dialog_close_icon:active{background:url(https://static.xx.fbcdn.net/rsrc.php/v3/yq/r/IE9JII6Z1Ys.png) no-repeat scroll 0 -30px transparent}.fb_dialog_loader{background-color:#f6f7f9;border:1px solid #606060;font-size:24px;padding:20px}.fb_dialog_top_left,.fb_dialog_top_right,.fb_dialog_bottom_left,.fb_dialog_bottom_right{height:10px;width:10px;overflow:hidden;position:absolute}.fb_dialog_top_left{background:url(https://static.xx.fbcdn.net/rsrc.php/v3/ye/r/8YeTNIlTZjm.png) no-repeat 0 0;left:-10px;top:-10px}.fb_dialog_top_right{background:url(https://static.xx.fbcdn.net/rsrc.php/v3/ye/r/8YeTNIlTZjm.png) no-repeat 0 -10px;right:-10px;top:-10px}.fb_dialog_bottom_left{background:url(https://static.xx.fbcdn.net/rsrc.php/v3/ye/r/8YeTNIlTZjm.png) no-repeat 0 -20px;bottom:-10px;left:-10px}.fb_dialog_bottom_right{background:url(https://static.xx.fbcdn.net/rsrc.php/v3/ye/r/8YeTNIlTZjm.png) no-repeat 0 
-30px;right:-10px;bottom:-10px}.fb_dialog_vert_left,.fb_dialog_vert_right,.fb_dialog_horiz_top,.fb_dialog_horiz_bottom{position:absolute;background:#525252;filter:alpha(opacity=70);opacity:.7}.fb_dialog_vert_left,.fb_dialog_vert_right{width:10px;height:100%}.fb_dialog_vert_left{margin-left:-10px}.fb_dialog_vert_right{right:0;margin-right:-10px}.fb_dialog_horiz_top,.fb_dialog_horiz_bottom{width:100%;height:10px}.fb_dialog_horiz_top{margin-top:-10px}.fb_dialog_horiz_bottom{bottom:0;margin-bottom:-10px}.fb_dialog_iframe{line-height:0}.fb_dialog_content .dialog_title{background:#6d84b4;border:1px solid #365899;color:#fff;font-size:14px;font-weight:bold;margin:0}.fb_dialog_content .dialog_title>span{background:url(https://static.xx.fbcdn.net/rsrc.php/v3/yd/r/Cou7n-nqK52.gif) no-repeat 5px 50%;float:left;padding:5px 0 7px 26px}body.fb_hidden{-webkit-transform:none;height:100%;margin:0;overflow:visible;position:absolute;top:-10000px;left:0;width:100%}.fb_dialog.fb_dialog_mobile.loading{background:url(https://static.xx.fbcdn.net/rsrc.php/v3/ya/r/3rhSv5V8j3o.gif) white no-repeat 50% 50%;min-height:100%;min-width:100%;overflow:hidden;position:absolute;top:0;z-index:10001}.fb_dialog.fb_dialog_mobile.loading.centered{width:auto;height:auto;min-height:initial;min-width:initial;background:none}.fb_dialog.fb_dialog_mobile.loading.centered #fb_dialog_loader_spinner{width:100%}.fb_dialog.fb_dialog_mobile.loading.centered .fb_dialog_content{background:none}.loading.centered #fb_dialog_loader_close{color:#fff;display:block;padding-top:20px;clear:both;font-size:18px}#fb-root #fb_dialog_ipad_overlay{background:rgba(0, 0, 0, .45);position:absolute;bottom:0;left:0;right:0;top:0;width:100%;min-height:100%;z-index:10000}#fb-root #fb_dialog_ipad_overlay.hidden{display:none}.fb_dialog.fb_dialog_mobile.loading iframe{visibility:hidden}.fb_dialog_content .dialog_header{-webkit-box-shadow:white 0 1px 1px -1px inset;background:-webkit-gradient(linear, 0% 0%, 0% 100%, from(#738ABA), 
to(#2C4987));border-bottom:1px solid;border-color:#1d4088;color:#fff;font:14px Helvetica, sans-serif;font-weight:bold;text-overflow:ellipsis;text-shadow:rgba(0, 30, 84, .296875) 0 -1px 0;vertical-align:middle;white-space:nowrap}.fb_dialog_content .dialog_header table{-webkit-font-smoothing:subpixel-antialiased;height:43px;width:100%}.fb_dialog_content .dialog_header td.header_left{font-size:12px;padding-left:5px;vertical-align:middle;width:60px}.fb_dialog_content .dialog_header td.header_right{font-size:12px;padding-right:5px;vertical-align:middle;width:60px}.fb_dialog_content .touchable_button{background:-webkit-gradient(linear, 0% 0%, 0% 100%, from(#4966A6), color-stop(.5, #355492), to(#2A4887));border:1px solid #29487d;-webkit-background-clip:padding-box;-webkit-border-radius:3px;-webkit-box-shadow:rgba(0, 0, 0, .117188) 0 1px 1px inset, rgba(255, 255, 255, .167969) 0 1px 0;display:inline-block;margin-top:3px;max-width:85px;line-height:18px;padding:4px 12px;position:relative}.fb_dialog_content .dialog_header .touchable_button input{border:none;background:none;color:#fff;font:12px Helvetica, sans-serif;font-weight:bold;margin:2px -12px;padding:2px 6px 3px 6px;text-shadow:rgba(0, 30, 84, .296875) 0 -1px 0}.fb_dialog_content .dialog_header .header_center{color:#fff;font-size:16px;font-weight:bold;line-height:18px;text-align:center;vertical-align:middle}.fb_dialog_content .dialog_content{background:url(https://static.xx.fbcdn.net/rsrc.php/v3/y9/r/jKEcVPZFk-2.gif) no-repeat 50% 50%;border:1px solid #555;border-bottom:0;border-top:0;height:150px}.fb_dialog_content .dialog_footer{background:#f6f7f9;border:1px solid #555;border-top-color:#ccc;height:40px}#fb_dialog_loader_close{float:left}.fb_dialog.fb_dialog_mobile .fb_dialog_close_button{text-shadow:rgba(0, 30, 84, .296875) 0 -1px 0}.fb_dialog.fb_dialog_mobile .fb_dialog_close_icon{visibility:hidden}#fb_dialog_loader_spinner{animation:rotateSpinner 1.2s linear 
infinite;background-color:transparent;background-image:url(https://static.xx.fbcdn.net/rsrc.php/v3/yD/r/t-wz8gw1xG1.png);background-repeat:no-repeat;background-position:50% 50%;height:24px;width:24px}@keyframes rotateSpinner{0%{transform:rotate(0deg)}100%{transform:rotate(360deg)}}
 132 | .fb_iframe_widget{display:inline-block;position:relative}.fb_iframe_widget span{display:inline-block;position:relative;text-align:justify}.fb_iframe_widget iframe{position:absolute}.fb_iframe_widget_fluid_desktop,.fb_iframe_widget_fluid_desktop span,.fb_iframe_widget_fluid_desktop iframe{max-width:100%}.fb_iframe_widget_fluid_desktop iframe{min-width:220px;position:relative}.fb_iframe_widget_lift{z-index:1}.fb_hide_iframes iframe{position:relative;left:-10000px}.fb_iframe_widget_loader{position:relative;display:inline-block}.fb_iframe_widget_fluid{display:inline}.fb_iframe_widget_fluid span{width:100%}.fb_iframe_widget_loader iframe{min-height:32px;z-index:2;zoom:1}.fb_iframe_widget_loader .FB_Loader{background:url(https://static.xx.fbcdn.net/rsrc.php/v3/y9/r/jKEcVPZFk-2.gif) no-repeat;height:32px;width:32px;margin-left:-16px;position:absolute;left:50%;z-index:4}
 133 | .fb_invisible_flow{display:inherit;height:0;overflow-x:hidden;width:0}.fb_mobile_overlay_active{height:100%;overflow:hidden;position:fixed;width:100%}.fb_shrink_active{opacity:1;transform:scale(1, 1);transition-duration:200ms;transition-timing-function:ease-out}.fb_shrink_active:active{opacity:.5;transform:scale(.75, .75)}</style><script src="./blog_files/saved_resource"></script><script src="./blog_files/saved_resource(1)"></script><script src="./blog_files/saved_resource(2)"></script><script src="./blog_files/saved_resource(3)"></script></head>
 134 | 
 135 |   <body class="page-entry">
 136 |     
 137 |     <div id="header-container">
 138 |      <div id="sp-suggest" style="display: none;"><a id="sp-suggest-link" href="http://kanji.hatenablog.jp/entry/python-xonsh-try#">スマートフォン用の表示で見る</a></div>
 139 |     </div>
 140 | 
 141 |     <div id="globalheader-container" data-brand="hatenablog">
 142 |   <iframe id="globalheader" height="37" frameborder="0" allowtransparency="true" src="./blog_files/saved_resource.html"></iframe>
 143 | </div>
 144 | 
 145 | 
 146 |     <div id="container">
 147 |       <div id="container-inner">
 148 |         <header id="blog-title" data-brand="hatenablog">
 149 |   <div id="blog-title-inner">
 150 |     <div id="blog-title-content">
 151 |       <h1 id="title"><a href="http://kanji.hatenablog.jp/">かんちゃんの備忘録</a></h1>
 152 |       
 153 |         <h2 id="blog-description">プログラミングや言語処理、ガジェットなど個人の備忘録です。（メモ書き＋α）</h2>
 154 |       
 155 |     </div>
 156 |   </div>
 157 | </header>
 158 | 
 159 |         
 160 | 
 161 |         
 162 |         
 163 | 
 164 | 
 165 | 
 166 | 
 167 | <div id="content" class="hfeed">
 168 |   <div id="content-inner">
 169 |     <div id="wrapper">
 170 |       <div id="main">
 171 |         <div id="main-inner">
 172 |           
 173 | 
 174 | 
 175 |           
 176 |   
 177 |   <!-- google_ad_section_start -->
 178 |   <!-- rakuten_ad_target_begin -->
 179 |   
 180 |   
 181 |   
 182 | 
 183 |   
 184 | 
 185 |   
 186 |     
 187 |       
 188 |         <article class="entry hentry js-entry-article date-first autopagerize_page_element chars-200 words-100 mode-markdown entry-odd" id="entry-8599973812321690844" data-keyword-campaign="" data-uuid="8599973812321690844" data-publication-type="entry">
 189 |   <div class="entry-inner">
 190 |     <header class="entry-header">
 191 |     <div class="date entry-date first">
 192 |     <a href="http://kanji.hatenablog.jp/archive/2017/12/13" rel="nofollow">
 193 |       <time pubdate="" datetime="2017-12-12T15:00:00Z" title="2017-12-12T15:00:00Z">
 194 |         <span class="date-year">2017</span><span class="hyphen">-</span><span class="date-month">12</span><span class="hyphen">-</span><span class="date-day">13</span>
 195 |       </time>
 196 |     </a>
 197 |   </div>
 198 |   <h1 class="entry-title">
 199 |   <a href="http://kanji.hatenablog.jp/entry/python-xonsh-try" class="entry-title-link bookmark">Xonshを使ってみた</a>
 200 | </h1>
 201 | 
 202 |   
 203 |   
 204 | 
 205 | 
 206 |   
 207 | 
 208 |   
 209 | 
 210 | <div class="entry-header-menu"><a href="javascript:void">編集</a></div></header>
 211 | 
 212 |     
 213 | 
 214 |     <div class="entry-content">
 215 |   
 216 |     <p><a href="https://qiita.com/advent-calendar/2017/xonsh">【Xonsh Advent Calendar 2017の13日目の記事です。】</a></p>
 217 | 
 218 | <p>Xonshがいいという話を聞いて、これは使ってみないと！と思い使ってみました。</p>
 219 | 
 220 | <twitterwidget class="twitter-tweet twitter-tweet-rendered" id="twitter-widget-2" style="position: static; visibility: visible; display: block; transform: rotate(0deg); max-width: 100%; width: 500px; min-width: 220px; margin-top: 10px; margin-bottom: 10px;" data-tweet-id="934045710348984323"></twitterwidget>
 221 | 
 222 | 
 223 | <script async="" src="./blog_files/widgets.js.ダウンロード" charset="utf-8"></script>
 224 | 
 225 | 
 226 | <p>その備忘録です。</p>
 227 | 
 228 | <ul class="table-of-contents">
 229 |     <li><a href="http://kanji.hatenablog.jp/entry/python-xonsh-try#Xonsh%E3%81%A8%E3%81%AF">Xonshとは</a></li>
 230 |     <li><a href="http://kanji.hatenablog.jp/entry/python-xonsh-try#%E5%B0%8E%E5%85%A5">導入</a></li>
 231 |     <li><a href="http://kanji.hatenablog.jp/entry/python-xonsh-try#%E4%BD%BF%E3%81%A3%E3%81%A6%E3%81%BF%E3%81%9F">使ってみた</a><ul>
 232 |             <li><a href="http://kanji.hatenablog.jp/entry/python-xonsh-try#%E7%92%B0%E5%A2%83%E5%A4%89%E6%95%B0">環境変数</a></li>
 233 |             <li><a href="http://kanji.hatenablog.jp/entry/python-xonsh-try#Python-mode%E3%81%A8Subprocess-mode">Python-modeとSubprocess-mode</a></li>
 234 |             <li><a href="http://kanji.hatenablog.jp/entry/python-xonsh-try#Subprocess%E3%81%A8%E3%81%97%E3%81%A6">Subprocessとして</a></li>
 235 |         </ul>
 236 |     </li>
 237 |     <li><a href="http://kanji.hatenablog.jp/entry/python-xonsh-try#%E3%83%97%E3%83%AD%E3%82%BB%E3%82%B9%E7%BD%AE%E6%8F%9B%E3%81%8C%E3%81%A7%E3%81%8D%E3%81%AA%E3%81%84">プロセス置換ができない？</a></li>
 238 |     <li><a href="http://kanji.hatenablog.jp/entry/python-xonsh-try#%E4%BD%BF%E3%81%A3%E3%81%A6%E3%81%BF%E3%81%A6%E6%84%9F%E6%83%B3">使ってみて感想</a></li>
 239 | </ul>
 240 | 
 241 | <h2 id="Xonshとは">Xonshとは</h2>
 242 | 
 243 | <blockquote><p>the xonsh shell</p>
 244 | 
 245 | <p>~ こちらトム少佐からXonsh地上管制へ ~</p>
 246 | 
 247 | <p>Xonshは<a class="keyword" href="http://d.hatena.ne.jp/keyword/Python">Python</a>により動作する、<a class="keyword" href="http://d.hatena.ne.jp/keyword/%A5%AF%A5%ED%A5%B9%A5%D7%A5%E9%A5%C3%A5%C8%A5%D5%A5%A9%A1%BC%A5%E0">クロスプラットフォーム</a>で<a class="keyword" href="http://d.hatena.ne.jp/keyword/Unix">Unix</a>のようなシェル言語である<a class="keyword" href="http://d.hatena.ne.jp/keyword/%A5%B3%A5%DE%A5%F3%A5%C9%A5%D7%A5%ED%A5%F3%A5%D7%A5%C8">コマンドプロンプト</a>です。
 248 | この言語は<a class="keyword" href="http://d.hatena.ne.jp/keyword/Python">Python</a> 3.4+の上位互換で、慣れ親しんだ<a class="keyword" href="http://d.hatena.ne.jp/keyword/Bash">Bash</a>やIPythonなどの基本的なシェル命令を追加したものです。
 249 | <a class="keyword" href="http://d.hatena.ne.jp/keyword/Linux">Linux</a>やMac OSX、<a class="keyword" href="http://d.hatena.ne.jp/keyword/Windows">Windows</a>といったメジャーなシステム上で動作します。
 250 | Xonshは、普段使いで上級者も初級者も同じように使えるように作られています。</p></blockquote>
 251 | 
 252 | <p>勢いで<a href="http://xon.sh/">xonshトップページ</a>の冒頭を訳してみましたが、<code>This is major Tom to ground xonshtrol</code>は、<a class="keyword" href="http://d.hatena.ne.jp/keyword/%A5%C7%A5%D3%A5%C3%A5%C9%A1%A6%A5%DC%A5%A6%A5%A4">デビッド・ボウイ</a>の<a class="keyword" href="http://d.hatena.ne.jp/keyword/%A5%B9%A5%DA%A5%A4%A5%B9%A1%A6%A5%AA%A5%C7%A5%A3%A5%C6%A5%A3">スペイス・オディティ</a>の<code>This is major Tom to ground control</code>をもじっているようで、英語力のない自分には理解しがたいです（汗）</p>
 253 | 
 254 | <p>とにかく冒頭からは、<strong><a class="keyword" href="http://d.hatena.ne.jp/keyword/Python">Python</a>で作られた良い感じのシェルだ</strong>ということが分かったので使ってみます。</p>
 255 | 
 256 | <h2 id="導入">導入</h2>
 257 | 
 258 | <p><a class="keyword" href="http://d.hatena.ne.jp/keyword/Python">Python</a> 3.4以上の環境を用意して、<code>pip install xonsh</code>でインストールできます。</p>
 259 | 
 260 | <p>ログインシェルにする場合は、システムに<a class="keyword" href="http://d.hatena.ne.jp/keyword/Python">Python</a> 3.4以上をインストールしておくと安心かと思います。</p>
 261 | 
 262 | <h2 id="使ってみた">使ってみた</h2>
 263 | 
 264 | <p><a href="http://xon.sh/tutorial.html">Tutorial</a>見ながら使ってみて、普段使っている<a class="keyword" href="http://d.hatena.ne.jp/keyword/zsh">zsh</a>とは異なる機能や文法に触れました。
 265 | （ノリで記事を書いてみたら、<a href="http://vaaaaaanquish.hatenablog.com/entry/2017/11/30/175236">ばんくしさんの1日目の記事</a>と結構<a class="keyword" href="http://d.hatena.ne.jp/keyword/%A4%AB%A4%D6">かぶ</a>ってしまいました(<em> </em>)）</p>
 266 | 
 267 | <h3 id="環境変数"><a class="keyword" href="http://d.hatena.ne.jp/keyword/%B4%C4%B6%AD%CA%D1%BF%F4">環境変数</a></h3>
 268 | 
 269 | <p><code>$</code>+変数名が<a class="keyword" href="http://d.hatena.ne.jp/keyword/%B4%C4%B6%AD%CA%D1%BF%F4">環境変数</a>となります。また代入は、<a class="keyword" href="http://d.hatena.ne.jp/keyword/Python">Python</a>と同じように記述します。</p>
 270 | 
 271 | <pre class="code lang-python" data-lang="python" data-unlink="">username<span class="synPreProc">@</span><span class="synIdentifier">hostname</span> ~ $ $HOST
 272 | <span class="synConstant">'hostname'</span>
 273 | username<span class="synPreProc">@</span><span class="synIdentifier">hostname</span> ~ $ $HOST = <span class="synConstant">"hogefuga"</span>
 274 | username<span class="synPreProc">@</span><span class="synIdentifier">hostname</span> ~ $ $HOST
 275 | <span class="synConstant">'hogefuga'</span>
 276 | </pre>
 277 | 
 278 | 
 279 | <p>xonsh<a class="keyword" href="http://d.hatena.ne.jp/keyword/%A5%B9%A5%AF%A5%EA%A5%D7%A5%C8">スクリプト</a>から参照したいときは、<code>${}</code>構文を使うことで文字列で参照できます。</p>
 280 | 
 281 | <pre class="code lang-python" data-lang="python" data-unlink="">username<span class="synPreProc">@</span><span class="synIdentifier">hostname</span> ~ $ ${<span class="synConstant">"HOME"</span>}
 282 | <span class="synConstant">"/home/username"</span>
 283 | </pre>
 284 | 
 285 | 
 286 | <h3 id="Python-modeとSubprocess-mode"><a class="keyword" href="http://d.hatena.ne.jp/keyword/Python">Python</a>-modeとSubprocess-mode</h3>
 287 | 
 288 | <p>xonshを使っていると、まるでIPythonのような使い勝手で<a class="keyword" href="http://d.hatena.ne.jp/keyword/bash">bash</a> likeな<a class="keyword" href="http://d.hatena.ne.jp/keyword/Python">Python</a>というように思えてきます。
 289 | 両方の文法が使えるのですが、混在すると曖昧となるため、コマンドと同名の変数名やメソッド名は避けましょうというお話です。</p>
 290 | 
 291 | <pre class="code lang-python" data-lang="python" data-unlink="">username<span class="synPreProc">@</span><span class="synIdentifier">hostname</span> ~ $ ls = <span class="synConstant">44</span>
 292 | username<span class="synPreProc">@</span><span class="synIdentifier">hostname</span> ~ $ ls
 293 | <span class="synConstant">44</span>
 294 | username<span class="synPreProc">@</span><span class="synIdentifier">hostname</span> ~ $ <span class="synStatement">del</span> ls
 295 | username<span class="synPreProc">@</span><span class="synIdentifier">hostname</span> ~ $ ls
 296 | ...
 297 | </pre>
 298 | 
 299 | 
 300 | <h3 id="Subprocessとして">Subprocessとして</h3>
 301 | 
 302 | <p><code>$()</code>でコマンドを実行すると、<a class="keyword" href="http://d.hatena.ne.jp/keyword/Python">Python</a>でSubprocessを使ったときのように、コマンドの戻り値が文字列型で返ってきます。</p>
 303 | 
 304 | <pre class="code lang-python" data-lang="python" data-unlink="">username<span class="synPreProc">@</span><span class="synIdentifier">hostname</span> ~ $ $(ls)
 305 | hoge\nfuga\ndotfiles
 306 | </pre>
 307 | 
 308 | 
 309 | <p><code>$[]</code>という書き方でもSubprocessとして動作させられますが、直に標準出力に出力されるようで、戻り値としては<code>None</code>です。
 310 | パイプなどで渡すとエラーとなりました。</p>
 311 | 
 312 | <pre class="code lang-python" data-lang="python" data-unlink="">username<span class="synPreProc">@</span><span class="synIdentifier">hostname</span> ~ $ $[ls]|less
 313 | hoge
 314 | fuga
 315 | ...
 316 | xonsh: For full traceback <span class="synIdentifier">set</span>: $XONSH_SHOW_TRACEBACK = <span class="synIdentifier">True</span>
 317 | <span class="synType">AttributeError</span>: <span class="synConstant">'NoneType'</span> <span class="synIdentifier">object</span> has no attribute <span class="synConstant">'splitlines'</span>
 318 | username<span class="synPreProc">@</span><span class="synIdentifier">hostname</span> ~ $ $[ls] == <span class="synIdentifier">None</span>
 319 | hoge
 320 | fuga
 321 | ...
 322 | <span class="synIdentifier">True</span>
 323 | </pre>
 324 | 
 325 | 
 326 | <h2 id="プロセス置換ができない">プロセス置換ができない？</h2>
 327 | 
 328 | <p><a class="keyword" href="http://d.hatena.ne.jp/keyword/bash">bash</a>や<a class="keyword" href="http://d.hatena.ne.jp/keyword/zsh">zsh</a>で一時ファイルを作成するかわりに、プロセス置換で作業することが多いです。
 329 | プロセス置換は<a class="keyword" href="http://d.hatena.ne.jp/keyword/bash">bash</a>や<a class="keyword" href="http://d.hatena.ne.jp/keyword/zsh">zsh</a>に搭載されている便利な機能の一つで、引数でファイルを指定するかわりにコマンドの実行結果をファイルとして扱える機能です。
 330 | つまり中間ファイルが不要ということです。（どの中間ファイルを使ったか忘れがちですが、これだとコマンドの履歴として記録されます。）</p>
 331 | 
 332 | <p>入力をプロセス置換するのは、だいたい2つ以上のファイルを利用するコマンドを使うときです。（ひとつのファイルなら基本的にはパイプで）
 333 | diffを取る時やjoin、pasteなどで、以下のように使います。</p>
 334 | 
 335 | <pre class="code lang-sh" data-lang="sh" data-unlink="">username@hostname ~ $ diff <span class="synStatement">&lt;</span><span class="synPreProc">(</span><span class="synStatement">sort</span><span class="synSpecial"> -nrk1 hoge.txt</span><span class="synPreProc">)</span> <span class="synStatement">&lt;</span><span class="synPreProc">(</span><span class="synStatement">sort</span><span class="synSpecial"> -nrk1 fuga.txt</span><span class="synPreProc">)</span>
 336 | </pre>
 337 | 
 338 | 
 339 | <p>Issueを<code>process substitution</code>で検索してみると、現時点（2017/12/10）で一番新しいものは<a href="https://github.com/xonsh/xonsh/issues/1307">Issue 1307</a>で、プロセス置換は使えないようです。
 340 | <code>$(echo Hi Mom &gt; /tmp/mom)</code>が<code>/tmp/mom</code>を返すので、プロセス置換と似たことができると読めたのですが、v0.6.0では空文字列が返ってきました。</p>
 341 | 
 342 | <p>詳しい人、教えてください。</p>
 343 | 
 344 | <h2 id="使ってみて感想">使ってみて感想</h2>
 345 | 
 346 | <p>シェルの設定ファイルを書かない人や、プロセス置換などを利用しない人にとっては、十分すぎる補完機能や<a class="keyword" href="http://d.hatena.ne.jp/keyword/%A5%B7%A5%F3%A5%BF%A5%C3%A5%AF%A5%B9">シンタックス</a>ハイライトと感じました。</p>
 347 | 
 348 | <p><a class="keyword" href="http://d.hatena.ne.jp/keyword/zsh">zsh</a>から乗り換えるとなると、勝手が違うため覚えることが多いように思います。</p>
 349 | 
 350 | <p><a class="keyword" href="http://d.hatena.ne.jp/keyword/Python">Python</a>言語が使えるという利点を活かす利用法を考えたいです。
 351 | たぶん、<a class="keyword" href="http://d.hatena.ne.jp/keyword/awk">awk</a>や<a class="keyword" href="http://d.hatena.ne.jp/keyword/perl">perl</a>、<a class="keyword" href="http://d.hatena.ne.jp/keyword/sed">sed</a>を使うかわりにうまく使えるのだと思います。</p>
 352 | 
 353 |   
 354 | </div>
 355 | 
 356 |     
 357 |   <footer class="entry-footer">
 358 |     
 359 |     <p class="entry-footer-section">
 360 |   <span class="author vcard"><span class="fn" data-load-nickname="1" data-user-name="kanjirz50"><span class="user-name-nickname">かんちゃん</span> <span class="user-name-paren">(</span><span class="user-name-hatena-id">id:kanjirz50</span><span class="user-name-paren">)</span></span></span>
 361 |   <span class="entry-footer-time"><a href="http://kanji.hatenablog.jp/entry/python-xonsh-try"><time data-relative="" datetime="2017-12-12T15:00:00Z" title="2017-12-12T15:00:00Z" pubdate="" class="updated">49日前</time></a></span>
 362 | </p>
 363 | 
 364 |     
 365 |   <div class="hatena-star-container">
 366 |   <span class="hatena-star-comment-container"><img src="./blog_files/comment.gif" tabindex="0" alt="Comments" title="Comments" class="hatena-star-comment-button" style="cursor: pointer; margin: 0px 3px; padding: 0px; border: none; vertical-align: middle; display: inline;"></span><span class="hatena-star-star-container"><img src="./blog_files/hatena-star-add-button.png" tabindex="0" alt="Add Star" title="Add Star" class="hatena-star-add-button" style="cursor: pointer; margin: 0px 3px; padding: 0px; border: none; vertical-align: middle;"></span></div>
 367 |   <div class="hatena-star-metadata" style="display: none">
 368 |     <a class="hatena-star-permalink" href="http://kanji.hatenablog.jp/entry/python-xonsh-try">Xonshを使ってみた</a>
 369 |   </div>
 370 | 
 371 | 
 372 |     
 373 | <div class="social-buttons">
 374 |   
 375 |   
 376 |     <div class="social-button-item">
 377 |       <iframe class="hatena-bookmark-button-frame" title="この記事をはてなブックマークに追加" frameborder="0" scrolling="no" width="84" height="40" src="javascript:false" style="width: 84px; height: 40px;" src="./blog_files/saved_resource(4).html"></iframe>
 378 |     </div>
 379 |   
 380 |   
 381 |     <div class="social-button-item">
 382 |       <div class="fb-share-button fb_iframe_widget" data-layout="box_count" data-href="http://kanji.hatenablog.jp/entry/python-xonsh-try" fb-xfbml-state="rendered" fb-iframe-plugin-query="app_id=719729204785177&amp;container_width=0&amp;href=http%3A%2F%2Fkanji.hatenablog.jp%2Fentry%2Fpython-xonsh-try&amp;layout=box_count&amp;locale=ja_JP&amp;sdk=joey"><span style="vertical-align: bottom; width: 61px; height: 40px;"><iframe name="f114e2ae99b028" width="1000px" height="1000px" frameborder="0" allowtransparency="true" allowfullscreen="true" scrolling="no" title="fb:share_button Facebook Social Plugin" src="./blog_files/share_button.html" style="border: none; visibility: visible; width: 61px; height: 40px;" class=""></iframe></span></div>
 383 |     </div>
 384 |   
 385 |   
 386 |     <div class="social-button-item">
 387 |       <iframe id="twitter-widget-1" scrolling="no" frameborder="0" allowtransparency="true" class="twitter-share-button twitter-share-button-rendered twitter-tweet-button" title="Twitter Tweet Button" src="./blog_files/tweet_button.83d5793f6ebbe2046330abda6016ae93.ja.html" style="position: static; visibility: visible; width: 75px; height: 20px;" data-url="http://kanji.hatenablog.jp/entry/python-xonsh-try"></iframe>
 388 |     </div>
 389 |   
 390 |   
 391 |   
 392 |   
 393 |   
 394 | </div>
 395 | 
 396 |     
 397 |   
 398 |   
 399 |     
 400 |     <div class="google-afc-image test-google-rectangle-ads">
 401 |       <script>
 402 |   var hatenadfp = hatenadfp || {};
 403 |   hatenadfp.adUnits = hatenadfp.adUnits || [];
 404 |   hatenadfp.adUnits.push(
 405 |     
 406 |       
 407 |       
 408 |       { unitName: 'blog_user', size: [[300, 250], [336, 280], [468, 60], ["fluid"]], divId: 'google_afc_user_container_0', allowContentMatch: true }
 409 |     
 410 |   );
 411 |   hatenadfp.isNGContent = false;
 412 |   
 413 | </script>
 414 | 
 415 |       <div id="google_afc_user_container_0" class="google-afc-user-container  google_afc_blocklink2_5 google_afc_boder" data-google-query-id="CM_QuO2UgtkCFUObvAodJhIJeg"><div id="google_ads_iframe_/4374287/rectarectanglematch_cygames_attype_2_0__container__" style="border: 0pt none; display: inline-block; width: 300px; height: 250px;"><iframe frameborder="0" src="./blog_files/container.html" id="google_ads_iframe_/4374287/rectarectanglematch_cygames_attype_2_0" title="3rd party ad content" name="" scrolling="no" marginwidth="0" marginheight="0" width="300" height="250" data-is-safeframe="true" sandbox="allow-forms allow-pointer-lock allow-popups allow-popups-to-escape-sandbox allow-same-origin allow-scripts allow-top-navigation-by-user-activation" style="border: 0px; vertical-align: bottom;"></iframe></div></div>
 416 |       
 417 |         <a href="http://blog.hatena.ne.jp/guide/pro" class="open-pro-modal" data-guide-pro-modal-ad-url="http://hatenablog.com/guide/pro/modal/ad" style="visibility: visible;">広告を非表示にする</a>
 418 |       
 419 |       
 420 |     </div>
 421 |   
 422 | 
 423 | 
 424 |     <div class="customized-footer">
 425 |       
 426 | 
 427 |         
 428 | 
 429 |         
 430 | 
 431 |           <div class="entry-footer-modules" id="entry-footer-secondary-modules">      
 432 | <div class="hatena-module hatena-module-related-entries">
 433 |       
 434 |   <!-- Hatena-Epic-has-related-entries-with-elasticsearch:true -->
 435 |   <div class="hatena-module-title">
 436 |     関連記事
 437 |   </div>
 438 |   <div class="hatena-module-body">
 439 |     <ul class="related-entries hatena-urllist urllist-with-thumbnails">
 440 |   
 441 |   
 442 |     
 443 |     <li class="urllist-item related-entries-item">
 444 |       <div class="urllist-item-inner related-entries-item-inner">
 445 |         
 446 |                       <div class="urllist-date-link related-entries-date-link">
 447 |   <a href="http://kanji.hatenablog.jp/archive/2017/12/04" rel="nofollow">
 448 |     <time pubdate="" datetime="2017-12-03T15:00:00Z" title="2017-12-03T15:00:00Z">
 449 |       2017-12-04
 450 |     </time>
 451 |   </a>
 452 | </div>
 453 | 
 454 |           <a href="http://kanji.hatenablog.jp/entry/python-requests-beautifulsoup-encoding" class="urllist-title-link related-entries-title-link  urllist-title related-entries-title">Pythonのrequestsモジュールでの文字コード対策</a>
 455 | 
 456 | 
 457 |           
 458 |           
 459 | 
 460 |                       <div class="urllist-entry-body related-entries-entry-body">【Webスクレイピング Advent Calendar 2017 4日目の記事です。…</div>
 461 |       </div>
 462 |     </li>
 463 |   
 464 |     
 465 |     <li class="urllist-item related-entries-item">
 466 |       <div class="urllist-item-inner related-entries-item-inner">
 467 |         
 468 |                       <div class="urllist-date-link related-entries-date-link">
 469 |   <a href="http://kanji.hatenablog.jp/archive/2017/12/01" rel="nofollow">
 470 |     <time pubdate="" datetime="2017-11-30T15:00:00Z" title="2017-11-30T15:00:00Z">
 471 |       2017-12-01
 472 |     </time>
 473 |   </a>
 474 | </div>
 475 | 
 476 |           <a href="http://kanji.hatenablog.jp/entry/python-hug-api-cli" class="urllist-title-link related-entries-title-link  urllist-title related-entries-title">hugでAPIやCLIを作る</a>
 477 | 
 478 | 
 479 |           
 480 |           
 481 | 
 482 |                       <div class="urllist-entry-body related-entries-entry-body">【Sansan Advent Calendar 2017 1日目の記事です。】 Pythonで…</div>
 483 |       </div>
 484 |     </li>
 485 |   
 486 |     
 487 |     <li class="urllist-item related-entries-item">
 488 |       <div class="urllist-item-inner related-entries-item-inner">
 489 |         
 490 |                       <div class="urllist-date-link related-entries-date-link">
 491 |   <a href="http://kanji.hatenablog.jp/archive/2017/02/18" rel="nofollow">
 492 |     <time pubdate="" datetime="2017-02-17T15:19:48Z" title="2017-02-17T15:19:48Z">
 493 |       2017-02-18
 494 |     </time>
 495 |   </a>
 496 | </div>
 497 | 
 498 |           <a href="http://kanji.hatenablog.jp/entry/2017/02/18/001948" class="urllist-title-link related-entries-title-link  urllist-title related-entries-title">研究室の計算機管理者のススメ（２）OS</a>
 499 | 
 500 | 
 501 |           
 502 |           
 503 | 
 504 |                       <div class="urllist-entry-body related-entries-entry-body">土台をつくろう！ 今回は計算機環境の土台作りということで、以…</div>
 505 |       </div>
 506 |     </li>
 507 |   
 508 |     
 509 |     <li class="urllist-item related-entries-item">
 510 |       <div class="urllist-item-inner related-entries-item-inner">
 511 |         
 512 |                       <div class="urllist-date-link related-entries-date-link">
 513 |   <a href="http://kanji.hatenablog.jp/archive/2016/11/04" rel="nofollow">
 514 |     <time pubdate="" datetime="2016-11-04T05:23:00Z" title="2016-11-04T05:23:00Z">
 515 |       2016-11-04
 516 |     </time>
 517 |   </a>
 518 | </div>
 519 | 
 520 |           <a href="http://kanji.hatenablog.jp/entry/zsh%E3%81%A7%E5%BC%95%E6%95%B0%E3%81%AB%E6%8C%87%E5%AE%9A%E3%81%97%E3%81%9F%E3%83%95%E3%82%A1%E3%82%A4%E3%83%AB%E3%81%AE%E7%B5%B6%E5%AF%BE%E3%83%91%E3%82%B9%E3%82%92%E5%8F%96%E5%BE%97" class="urllist-title-link related-entries-title-link  urllist-title related-entries-title">zshで引数に指定したファイルの絶対パスを取得</a>
 521 | 
 522 | 
 523 |           
 524 |           
 525 | 
 526 |                       <div class="urllist-entry-body related-entries-entry-body">引数の相対パスを絶対パスに展開する「ls test.txt」みたいに相…</div>
 527 |       </div>
 528 |     </li>
 529 |   
 530 | </ul>
 531 | 
 532 |   </div>
 533 | </div>
 534 |   </div>
 535 |         
 536 | 
 537 |       
 538 |     </div>
 539 |     
 540 |   <div class="comment-box">
 541 |     
 542 |     <ul class="comment">
 543 |       <li class="read-more-comments" style="display: none;"><a>もっと読む</a></li>
 544 |     </ul>
 545 |     
 546 |       <a class="leave-comment-title">コメントを書く</a>
 547 |     
 548 |   </div>
 549 | 
 550 |   </footer>
 551 | 
 552 |   </div>
 553 | </article>
 554 | 
 555 |       
 556 |       
 557 |     
 558 |   
 559 | 
 560 |   
 561 |   <!-- rakuten_ad_target_end -->
 562 |   <!-- google_ad_section_end -->
 563 |   
 564 |   
 565 |   
 566 |   <div class="pager pager-permalink permalink">
 567 |     
 568 |     
 569 |       
 570 |       <span class="pager-next">
 571 |         <a href="http://kanji.hatenablog.jp/entry/python-requests-beautifulsoup-encoding" rel="next">
 572 |           Pythonのrequestsモジュールでの文字コー…
 573 |           <span class="pager-arrow"> »</span>
 574 |         </a>
 575 |       </span>
 576 |     
 577 |   </div>
 578 | 
 579 | 
 580 |   
 581 | 
 582 | 
 583 | 
 584 |         </div>
 585 |       </div>
 586 | 
 587 |       <aside id="box1">
 588 |   <div id="box1-inner">
 589 |   </div>
 590 | </aside>
 591 | 
 592 |     </div><!-- #wrapper -->
 593 | 
 594 |     
 595 | <aside id="box2">
 596 |   
 597 |   <div id="box2-inner">
 598 |     
 599 |       
 600 | 
 601 | <div class="hatena-module hatena-module-profile">
 602 |   <div class="hatena-module-title">
 603 |     プロフィール
 604 |   </div>
 605 |   <div class="hatena-module-body">
 606 |     
 607 |     <a href="http://kanji.hatenablog.jp/about" class="profile-icon-link">
 608 |       <img src="./blog_files/profile.png" alt="id:kanjirz50" class="profile-icon">
 609 |     </a>
 610 |     
 611 | 
 612 |     
 613 |     <span class="id">
 614 |       <a href="http://kanji.hatenablog.jp/about" class="hatena-id-link"><span data-load-nickname="1" data-user-name="kanjirz50"><span class="user-name-nickname">かんちゃん</span> <span class="user-name-paren">(</span><span class="user-name-hatena-id">id:kanjirz50</span><span class="user-name-paren">)</span></span></a>
 615 |       
 616 |   
 617 |     
 618 |     
 619 |   
 620 | 
 621 | 
 622 |     </span>
 623 |     
 624 | 
 625 |     
 626 | 
 627 |     
 628 |     <div class="profile-description">
 629 |       <p>プログラミングや言語処理、ガジェットなど個人の備忘録です。（メモ書き＋α）</p>
 630 | 
 631 |     </div>
 632 |     
 633 | 
 634 |     
 635 |       <div class="hatena-follow-button-box btn-subscribe js-hatena-follow-button-box">
 636 | 
 637 |   <a href="http://kanji.hatenablog.jp/entry/python-xonsh-try#" class="hatena-follow-button js-hatena-follow-button unsubscribing">
 638 |     <span class="subscribing">
 639 |       <span class="foreground">読者です</span>
 640 |       <span class="background">読者をやめる</span>
 641 |     </span>
 642 |     <span class="unsubscribing" data-track-name="profile-widget-subscribe-button" data-track-once="">
 643 |       <span class="foreground">読者になる</span>
 644 |       <span class="background">読者になる</span>
 645 |     </span>
 646 |   </a>
 647 |   <div class="subscription-count-box js-subscription-count-box" style="display: block;">
 648 |     <i></i>
 649 |     <u></u>
 650 |     <span class="subscription-count js-subscription-count">6</span>
 651 |   </div>
 652 | </div>
 653 | 
 654 |     
 655 | 
 656 |     
 657 |     <div class="hatena-follow-button-box btn-twitter">
 658 |       <iframe id="twitter-widget-0" scrolling="no" frameborder="0" allowtransparency="true" class="twitter-follow-button twitter-follow-button-rendered" title="Twitter Follow Button" src="./blog_files/follow_button.83d5793f6ebbe2046330abda6016ae93.ja.html" style="position: static; visibility: visible; width: 167px; height: 20px;" data-screen-name="kanji250tr"></iframe>
 659 |     </div>
 660 |     
 661 | 
 662 |     
 663 |   </div>
 664 | </div>
 665 | 
 666 |     
 667 |       <div class="hatena-module hatena-module-search-box">
 668 |   <div class="hatena-module-title">
 669 |     検索
 670 |   </div>
 671 |   <div class="hatena-module-body">
 672 |     <form class="search-form" role="search" action="http://kanji.hatenablog.jp/search" method="get">
 673 |   <input type="text" name="q" class="search-module-input" value="" placeholder="記事を検索" required="" data-cip-id="cIPJQ342845639">
 674 |   <input type="submit" value="検索" class="search-module-button">
 675 | </form>
 676 | 
 677 |   </div>
 678 | </div>
 679 | 
 680 |     
 681 |       <div class="hatena-module hatena-module-recent-entries ">
 682 |   <div class="hatena-module-title">
 683 |     <a href="http://kanji.hatenablog.jp/archive">
 684 |       最新記事
 685 |     </a>
 686 |   </div>
 687 |   <div class="hatena-module-body">
 688 |     <ul class="recent-entries hatena-urllist ">
 689 |   
 690 |   
 691 |     
 692 |     <li class="urllist-item recent-entries-item">
 693 |       <div class="urllist-item-inner recent-entries-item-inner">
 694 |         
 695 |           
 696 |           <a href="http://kanji.hatenablog.jp/entry/python-xonsh-try" class="urllist-title-link recent-entries-title-link  urllist-title recent-entries-title">Xonshを使ってみた</a>
 697 | 
 698 | 
 699 |           
 700 |           
 701 | 
 702 |                 </div>
 703 |     </li>
 704 |   
 705 |     
 706 |     <li class="urllist-item recent-entries-item">
 707 |       <div class="urllist-item-inner recent-entries-item-inner">
 708 |         
 709 |           
 710 |           <a href="http://kanji.hatenablog.jp/entry/python-requests-beautifulsoup-encoding" class="urllist-title-link recent-entries-title-link  urllist-title recent-entries-title">Pythonのrequestsモジュールでの文字コード対策</a>
 711 | 
 712 | 
 713 |           
 714 |           
 715 | 
 716 |                 </div>
 717 |     </li>
 718 |   
 719 |     
 720 |     <li class="urllist-item recent-entries-item">
 721 |       <div class="urllist-item-inner recent-entries-item-inner">
 722 |         
 723 |           
 724 |           <a href="http://kanji.hatenablog.jp/entry/python-hug-api-cli" class="urllist-title-link recent-entries-title-link  urllist-title recent-entries-title">hugでAPIやCLIを作る</a>
 725 | 
 726 | 
 727 |           
 728 |           
 729 | 
 730 |                 </div>
 731 |     </li>
 732 |   
 733 |     
 734 |     <li class="urllist-item recent-entries-item">
 735 |       <div class="urllist-item-inner recent-entries-item-inner">
 736 |         
 737 |           
 738 |           <a href="http://kanji.hatenablog.jp/entry/2017/11/19/213746" class="urllist-title-link recent-entries-title-link  urllist-title recent-entries-title">ICDAR2017に参加した</a>
 739 | 
 740 | 
 741 |           
 742 |           
 743 | 
 744 |                 </div>
 745 |     </li>
 746 |   
 747 |     
 748 |     <li class="urllist-item recent-entries-item">
 749 |       <div class="urllist-item-inner recent-entries-item-inner">
 750 |         
 751 |           
 752 |           <a href="http://kanji.hatenablog.jp/entry/2017/06/02/lt-hackers-gate" class="urllist-title-link recent-entries-title-link  urllist-title recent-entries-title">Hacker's GATE LT大会に参加した</a>
 753 | 
 754 | 
 755 |           
 756 |           
 757 | 
 758 |                 </div>
 759 |     </li>
 760 |   
 761 | </ul>
 762 | 
 763 |   </div>
 764 | </div>
 765 | 
 766 |     
 767 |       
 768 | 
 769 | <div class="hatena-module hatena-module-archive" data-archive-type="default" data-archive-url="http://kanji.hatenablog.jp/archive">
 770 |   <div class="hatena-module-title">
 771 |     <a href="http://kanji.hatenablog.jp/archive">月別アーカイブ</a>
 772 |   </div>
 773 |   <div class="hatena-module-body">
 774 |   
 775 | 
 776 |   
 777 |     
 778 |     
 779 |       <ul class="hatena-urllist">
 780 |         
 781 |           <li class="archive-module-year" data-year="2017">
 782 |             <div class="archive-module-button">
 783 |               <span class="archive-module-hide-button">▼</span>
 784 |               <span class="archive-module-show-button">▶</span>
 785 |             </div>
 786 |             <a href="http://kanji.hatenablog.jp/archive/2017" class="archive-module-year-title">
 787 |               2017 (11)
 788 |             </a>
 789 |             <ul class="archive-module-months">
 790 |               
 791 |                 <li class="archive-module-month">
 792 |                   <a href="http://kanji.hatenablog.jp/archive/2017/12" class="archive-module-month-title">
 793 |                     2017 / 12 (3)
 794 |                   </a>
 795 |                 </li>
 796 |               
 797 |                 <li class="archive-module-month">
 798 |                   <a href="http://kanji.hatenablog.jp/archive/2017/11" class="archive-module-month-title">
 799 |                     2017 / 11 (1)
 800 |                   </a>
 801 |                 </li>
 802 |               
 803 |                 <li class="archive-module-month">
 804 |                   <a href="http://kanji.hatenablog.jp/archive/2017/6" class="archive-module-month-title">
 805 |                     2017 / 6 (1)
 806 |                   </a>
 807 |                 </li>
 808 |               
 809 |                 <li class="archive-module-month">
 810 |                   <a href="http://kanji.hatenablog.jp/archive/2017/5" class="archive-module-month-title">
 811 |                     2017 / 5 (2)
 812 |                   </a>
 813 |                 </li>
 814 |               
 815 |                 <li class="archive-module-month">
 816 |                   <a href="http://kanji.hatenablog.jp/archive/2017/2" class="archive-module-month-title">
 817 |                     2017 / 2 (4)
 818 |                   </a>
 819 |                 </li>
 820 |               
 821 |             </ul>
 822 |           </li>
 823 |         
 824 |           <li class="archive-module-year archive-module-year-hidden" data-year="2016">
 825 |             <div class="archive-module-button">
 826 |               <span class="archive-module-hide-button">▼</span>
 827 |               <span class="archive-module-show-button">▶</span>
 828 |             </div>
 829 |             <a href="http://kanji.hatenablog.jp/archive/2016" class="archive-module-year-title">
 830 |               2016 (12)
 831 |             </a>
 832 |             <ul class="archive-module-months">
 833 |               
 834 |                 <li class="archive-module-month">
 835 |                   <a href="http://kanji.hatenablog.jp/archive/2016/11" class="archive-module-month-title">
 836 |                     2016 / 11 (1)
 837 |                   </a>
 838 |                 </li>
 839 |               
 840 |                 <li class="archive-module-month">
 841 |                   <a href="http://kanji.hatenablog.jp/archive/2016/10" class="archive-module-month-title">
 842 |                     2016 / 10 (8)
 843 |                   </a>
 844 |                 </li>
 845 |               
 846 |                 <li class="archive-module-month">
 847 |                   <a href="http://kanji.hatenablog.jp/archive/2016/9" class="archive-module-month-title">
 848 |                     2016 / 9 (3)
 849 |                   </a>
 850 |                 </li>
 851 |               
 852 |             </ul>
 853 |           </li>
 854 |         
 855 |       </ul>
 856 |     
 857 |   
 858 | 
 859 | 
 860 | </div>
 861 | </div>
 862 | 
 863 |     
 864 |       
 865 | 
 866 | <div class="hatena-module hatena-module-category">
 867 |   <div class="hatena-module-title">
 868 |     カテゴリー
 869 |   </div>
 870 |   <div class="hatena-module-body">
 871 |     <ul class="hatena-urllist">
 872 |       
 873 |         <li>
 874 |           <a href="http://kanji.hatenablog.jp/archive/category/%E8%A8%80%E8%AA%9E%E5%87%A6%E7%90%86">
 875 |             言語処理 (4)
 876 |           </a>
 877 |         </li>
 878 |       
 879 |         <li>
 880 |           <a href="http://kanji.hatenablog.jp/archive/category/Linux">
 881 |             Linux (3)
 882 |           </a>
 883 |         </li>
 884 |       
 885 |         <li>
 886 |           <a href="http://kanji.hatenablog.jp/archive/category/zsh">
 887 |             zsh (1)
 888 |           </a>
 889 |         </li>
 890 |       
 891 |         <li>
 892 |           <a href="http://kanji.hatenablog.jp/archive/category/%E3%82%B7%E3%82%A7%E3%83%AB%E3%82%B9%E3%82%AF%E3%83%AA%E3%83%97%E3%83%88">
 893 |             シェルスクリプト (1)
 894 |           </a>
 895 |         </li>
 896 |       
 897 |         <li>
 898 |           <a href="http://kanji.hatenablog.jp/archive/category/Python">
 899 |             Python (1)
 900 |           </a>
 901 |         </li>
 902 |       
 903 |         <li>
 904 |           <a href="http://kanji.hatenablog.jp/archive/category/%E6%AD%A3%E8%A6%8F%E8%A1%A8%E7%8F%BE">
 905 |             正規表現 (2)
 906 |           </a>
 907 |         </li>
 908 |       
 909 |         <li>
 910 |           <a href="http://kanji.hatenablog.jp/archive/category/%E6%96%87%E6%9B%B8%E5%88%86%E9%A1%9E">
 911 |             文書分類 (1)
 912 |           </a>
 913 |         </li>
 914 |       
 915 |         <li>
 916 |           <a href="http://kanji.hatenablog.jp/archive/category/%E6%A9%9F%E6%A2%B0%E5%AD%A6%E7%BF%92">
 917 |             機械学習 (1)
 918 |           </a>
 919 |         </li>
 920 |       
 921 |         <li>
 922 |           <a href="http://kanji.hatenablog.jp/archive/category/%E6%A9%9F%E6%A2%B0%E7%BF%BB%E8%A8%B3">
 923 |             機械翻訳 (1)
 924 |           </a>
 925 |         </li>
 926 |       
 927 |         <li>
 928 |           <a href="http://kanji.hatenablog.jp/archive/category/NFS">
 929 |             NFS (1)
 930 |           </a>
 931 |         </li>
 932 |       
 933 |         <li>
 934 |           <a href="http://kanji.hatenablog.jp/archive/category/CentOS">
 935 |             CentOS (1)
 936 |           </a>
 937 |         </li>
 938 |       
 939 |         <li>
 940 |           <a href="http://kanji.hatenablog.jp/archive/category/CUDA">
 941 |             CUDA (1)
 942 |           </a>
 943 |         </li>
 944 |       
 945 |         <li>
 946 |           <a href="http://kanji.hatenablog.jp/archive/category/perl">
 947 |             perl (1)
 948 |           </a>
 949 |         </li>
 950 |       
 951 |         <li>
 952 |           <a href="http://kanji.hatenablog.jp/archive/category/%E3%82%BB%E3%82%AD%E3%83%A5%E3%83%AA%E3%83%86%E3%82%A3%E3%83%BC">
 953 |             セキュリティー (1)
 954 |           </a>
 955 |         </li>
 956 |       
 957 |         <li>
 958 |           <a href="http://kanji.hatenablog.jp/archive/category/%E7%A0%94%E7%A9%B6">
 959 |             研究 (1)
 960 |           </a>
 961 |         </li>
 962 |       
 963 |     </ul>
 964 |   </div>
 965 | </div>
 966 | 
 967 |     
 968 |     
 969 |   </div>
 970 | </aside>
 971 | 
 972 | 
 973 |   </div>
 974 | </div>
 975 | 
 976 | 
 977 | 
 978 | 
 979 |         
 980 | 
 981 |         
 982 |   <script type="text/javascript" src="./blog_files/hatena_dfp2.js.ダウンロード"></script>
 983 | 
 984 | 
 985 |         
 986 | 
 987 |       </div>
 988 |     </div>
 989 |     
 990 | <footer id="footer" data-brand="hatenablog">
 991 |   <div id="footer-inner">
 992 |     
 993 |       <div style="display:none !important" class="guest-footer js-guide-register test-blogs-register-guide" data-action="guide-register">
 994 |   <div class="guest-footer-content">
 995 |     <h3>はてなブログをはじめよう！</h3>
 996 |     <p>kanjirz50さんは、はてなブログを使っています。あなたもはてなブログをはじめてみませんか？</p>
 997 |     <div class="guest-footer-btn-container">
 998 |       <div class="guest-footer-btn">
 999 |         <a class="btn btn-register" href="http://blog.hatena.ne.jp/register?via=200227" target="_blank">はてなブログをはじめる（無料）</a>
1000 |       </div>
1001 |       <div class="guest-footer-btn">
1002 |         <a href="http://hatenablog.com/guide" target="_blank">はてなブログとは</a>
1003 |       </div>
1004 |     </div>
1005 |   </div>
1006 | </div>
1007 | 
1008 |     
1009 |     <address class="footer-address">
1010 |       <a href="http://kanji.hatenablog.jp/">
1011 |         <img src="./blog_files/https_%2F%2Fcdn.user.blog.st-hatena.com%2Fcustom_blog_icon%2F125871161%2F1514187551722936" width="16" height="16" alt="かんちゃんの備忘録">
1012 |         <span class="footer-address-name">かんちゃんの備忘録</span>
1013 |       </a>
1014 |     </address>
1015 |     <p class="services">
1016 |       Powered by <a href="http://hatenablog.com/">Hatena Blog</a>
1017 |       |
1018 |         <a href="https://blog.hatena.ne.jp/-/abuse_report?target_url=http%3A%2F%2Fkanji.hatenablog.jp%2Fentry%2Fpython-xonsh-try" class="report-abuse-link test-report-abuse-link" target="_blank">ブログを報告する</a>
1019 |     </p>
1020 |   </div>
1021 | </footer>
1022 | 
1023 | 
1024 |     
1025 | 
1026 |     
1027 |   <script src="./blog_files/HatenaStar.js.ダウンロード"></script>
1028 | 
1029 | 
1030 |     
1031 |       <div id="fb-root" class=" fb_reset"><div style="position: absolute; top: -10000px; height: 0px; width: 0px;"><div><iframe name="fb_xdm_frame_http" frameborder="0" allowtransparency="true" allowfullscreen="true" scrolling="no" id="fb_xdm_frame_http" aria-hidden="true" title="Facebook Cross Domain Communication Frame" tabindex="-1" src="./blog_files/lY4eZXm_YWu.html" style="border: none;"></iframe><iframe name="fb_xdm_frame_https" frameborder="0" allowtransparency="true" allowfullscreen="true" scrolling="no" id="fb_xdm_frame_https" aria-hidden="true" title="Facebook Cross Domain Communication Frame" tabindex="-1" src="./blog_files/lY4eZXm_YWu(1).html" style="border: none;"></iframe></div></div><div style="position: absolute; top: -10000px; height: 0px; width: 0px;"><div></div></div></div>
1032 | <script>(function(d, s, id) {
1033 |   var js, fjs = d.getElementsByTagName(s)[0];
1034 |   if (d.getElementById(id)) return;
1035 |   js = d.createElement(s); js.id = id;
1036 |   js.src = "//connect.facebook.net/ja_JP/sdk.js#xfbml=1&appId=719729204785177&version=v2.7";
1037 |   fjs.parentNode.insertBefore(js, fjs);
1038 | }(document, 'script', 'facebook-jssdk'));</script>
1039 | 
1040 |     
1041 |     
1042 | 
1043 | <div class="quote-box" style="display: none;">
1044 |   <div class="tooltip-quote tooltip-quote-star" style="display: block;">
1045 |     <i class="blogicon-star" title="引用スターをつける"></i>
1046 |   </div>
1047 |   <div class="tooltip-quote tooltip-quote-stock" style="display: block;">
1048 |     <i class="blogicon-quote" title="引用をストック"></i>
1049 |   </div>
1050 |   <div class="tooltip-quote tooltip-quote-tweet js-tooltip-quote-tweet">
1051 |     <a class="js-tweet-quote" target="_blank" data-track-name="quote-tweet" data-track-once=""><i class="blogicon-twitter" title="引用してツイートする"></i></a>
1052 |   </div>
1053 | </div>
1054 | 
1055 | <div class="message-box" id="quote-star-message-box" style="display: none; position: absolute;">
1056 |   スターをつけました
1057 | </div>
1058 | 
1059 | <div class="quote-stock-panel" id="quote-stock-message-box" style="position: absolute; z-index: 3000">
1060 |   <div class="message-box" id="quote-stock-succeeded-message" style="display: none">
1061 |     <p>引用をストックしました</p>
1062 |     <button class="btn btn-primary" id="quote-stock-show-editor-button" data-track-name="curation-quote-edit-button">ストック一覧を見る</button>
1063 |     <button class="btn quote-stock-close-message-button">閉じる</button>
1064 |   </div>
1065 | 
1066 |   <div class="message-box" id="quote-login-required-message" style="display: none">
1067 |     <p>引用するにはまずログインしてください</p>
1068 |     <button class="btn btn-primary" id="quote-login-button">ログイン</button>
1069 |     <button class="btn quote-stock-close-message-button">閉じる</button>
1070 |   </div>
1071 | 
1072 |   <div class="error-box" id="quote-stock-failed-message" style="display: none">
1073 |     <p>引用をストックできませんでした。再度お試しください</p>
1074 |     <button class="btn quote-stock-close-message-button">閉じる</button>
1075 |   </div>
1076 | 
1077 |   <div class="error-box" id="unstockable-quote-message-box" style="display: none; position: absolute; z-index: 3000;">
1078 |     <p>限定公開記事のため引用できません。</p>
1079 |   </div>
1080 | </div>
1081 | 
1082 | <script type="x-underscore-template" id="js-requote-button-template">
1083 |   <div class="requote-button js-requote-button">
1084 |     <button class="requote-button-btn tipsy-top" title="引用する"><i class="blogicon-quote"></i></button>
1085 |   </div>
1086 | </script>
1087 | 
1088 | 
1089 | 
1090 |     
1091 |     <div id="hidden-subscribe-button" style="display: none;">
1092 |       <div class="hatena-follow-button-box btn-subscribe js-hatena-follow-button-box">
1093 | 
1094 |   <a href="http://kanji.hatenablog.jp/entry/python-xonsh-try#" class="hatena-follow-button js-hatena-follow-button unsubscribing">
1095 |     <span class="subscribing">
1096 |       <span class="foreground">読者です</span>
1097 |       <span class="background">読者をやめる</span>
1098 |     </span>
1099 |     <span class="unsubscribing" data-track-name="profile-widget-subscribe-button" data-track-once="">
1100 |       <span class="foreground">読者になる</span>
1101 |       <span class="background">読者になる</span>
1102 |     </span>
1103 |   </a>
1104 |   <div class="subscription-count-box js-subscription-count-box" style="display: block;">
1105 |     <i></i>
1106 |     <u></u>
1107 |     <span class="subscription-count js-subscription-count">6</span>
1108 |   </div>
1109 | </div>
1110 | 
1111 |     </div>
1112 | 
1113 |     
1114 |   <script type="text/javascript" src="./blog_files/widgets.js.ダウンロード"></script>
1115 | 
1116 | <script src="./blog_files/platform.js.ダウンロード" async="" defer="" gapi_processed="true">
1117 |   { lang: 'ja', "parsetags": "explicit" }
1118 | </script>
1119 | <script type="text/javascript" src="./blog_files/bookmark_button.js.ダウンロード" charset="utf-8" async="async"></script>
1120 | 
1121 | 
1122 | 
1123 |   <script type="text/javascript" src="./blog_files/react-with-addons.min.js.ダウンロード"></script>
1124 |   <script type="text/javascript" src="./blog_files/react-dom.min.js.ダウンロード"></script>
1125 | 
1126 | 
1127 | <script type="text/javascript" src="./blog_files/jquery.min.js.ダウンロード"></script>
1128 | <script type="text/javascript" src="./blog_files/jquery-ui.1.10.0.custom.min.js.ダウンロード"></script>
1129 | <script type="text/javascript" src="./blog_files/jquery.flot.js.ダウンロード"></script>
1130 | <script type="text/javascript" src="./blog_files/jquery.flot.time.js.ダウンロード"></script>
1131 | 
1132 | 
1133 | 
1134 | 
1135 | <script id="hatenablog-js" data-env="production" type="text/javascript" src="./blog_files/hatenablog.js.ダウンロード" crossorigin="anonymous"></script><div style="position: fixed; top: 0px; left: 0px; width: 100%; height: 100%; display: none;"></div>
1136 | <script type="text/javascript" src="./blog_files/texts-ja.js.ダウンロード"></script>
1137 | 
1138 | 
1139 |   <script type="text/javascript">Hatena.Diary.GlobalHeader.init()</script>
1140 | 
1141 | 
1142 | <script src="./blog_files/api.js.ダウンロード" async="" defer=""></script>
1143 | 
1144 | 
1145 | 
1146 | 
1147 |     
1148 | 
1149 | 
1150 | 
1151 | 
1152 | 
1153 |   
1154 | 
1155 | 
1156 | <iframe scrolling="no" frameborder="0" allowtransparency="true" src="./blog_files/widget_iframe.83d5793f6ebbe2046330abda6016ae93.html" style="display: none;"></iframe><div id="cboxOverlay" style="display: none;"></div><div id="colorbox" class="" role="dialog" tabindex="-1" style="display: none;"><div id="cboxWrapper"><div><div id="cboxTopLeft" style="float: left;"></div><div id="cboxTopCenter" style="float: left;"></div><div id="cboxTopRight" style="float: left;"></div></div><div style="clear: left;"><div id="cboxMiddleLeft" style="float: left;"></div><div id="cboxContent" style="float: left;"><div id="cboxTitle" style="float: left;"></div><div id="cboxCurrent" style="float: left;"></div><button type="button" id="cboxPrevious"></button><button type="button" id="cboxNext"></button><button type="button" id="cboxSlideshow"></button><div id="cboxLoadingOverlay" style="float: left;"></div><div id="cboxLoadingGraphic" style="float: left;"></div></div><div id="cboxMiddleRight" style="float: left;"></div></div><div style="clear: left;"><div id="cboxBottomLeft" style="float: left;"></div><div id="cboxBottomCenter" style="float: left;"></div><div id="cboxBottomRight" style="float: left;"></div></div></div><div style="position: absolute; width: 9999px; visibility: hidden; display: none; max-width: none;"></div></div><div style="top: -9999px; z-index: -9999;"></div><script type="text/javascript" charset="UTF-8">!function(t,e){if(void 0===e[t]){e[t]=function(){e[t].clients.push(this),this._init=[Array.prototype.slice.call(arguments)]},e[t].clients=[];for(var r=function(t){return function(){return this["_"+t]=this["_"+t]||[],this["_"+t].push(Array.prototype.slice.call(arguments)),this}},s=["addRecord","set","trackEvent","trackPageview","trackClicks","ready"],a=0;a<s.length;a++){var c=s[a];e[t].prototype[c]=r(c)}var 
n=document.createElement("script");n.type="text/javascript",n.async=!0,n.src=("https:"===document.location.protocol?"https:":"http:")+"//cdn.treasuredata.com/sdk/1.7.2/td.min.js";var i=document.getElementsByTagName("script")[0];i.parentNode.insertBefore(n,i)}}("Treasure",this);</script><script type="text/javascript" charset="UTF-8" src="./blog_files/aid"></script><script type="text/javascript" charset="UTF-8">!function(t,e){if(void 0===e[t]){e[t]=function(){e[t].clients.push(this),this._init=[Array.prototype.slice.call(arguments)]},e[t].clients=[];for(var r=function(t){return function(){return this["_"+t]=this["_"+t]||[],this["_"+t].push(Array.prototype.slice.call(arguments)),this}},s=["addRecord","set","trackEvent","trackPageview","trackClicks","ready"],a=0;a<s.length;a++){var c=s[a];e[t].prototype[c]=r(c)}var n=document.createElement("script");n.type="text/javascript",n.async=!0,n.src=("https:"===document.location.protocol?"https:":"http:")+"//cdn.treasuredata.com/sdk/1.7.2/td.min.js";var i=document.getElementsByTagName("script")[0];i.parentNode.insertBefore(n,i)}}("Treasure",this);</script><script type="text/javascript" charset="UTF-8" src="./blog_files/aid"></script><script type="text/javascript" charset="UTF-8">!function(t,e){if(void 0===e[t]){e[t]=function(){e[t].clients.push(this),this._init=[Array.prototype.slice.call(arguments)]},e[t].clients=[];for(var r=function(t){return function(){return this["_"+t]=this["_"+t]||[],this["_"+t].push(Array.prototype.slice.call(arguments)),this}},s=["addRecord","set","trackEvent","trackPageview","trackClicks","ready"],a=0;a<s.length;a++){var c=s[a];e[t].prototype[c]=r(c)}var n=document.createElement("script");n.type="text/javascript",n.async=!0,n.src=("https:"===document.location.protocol?"https:":"http:")+"//cdn.treasuredata.com/sdk/1.7.2/td.min.js";var i=document.getElementsByTagName("script")[0];i.parentNode.insertBefore(n,i)}}("Treasure",this);</script><script type="text/javascript" charset="UTF-8" 
src="./blog_files/aid"></script><script type="text/javascript" charset="UTF-8">!function(t,e){if(void 0===e[t]){e[t]=function(){e[t].clients.push(this),this._init=[Array.prototype.slice.call(arguments)]},e[t].clients=[];for(var r=function(t){return function(){return this["_"+t]=this["_"+t]||[],this["_"+t].push(Array.prototype.slice.call(arguments)),this}},s=["addRecord","set","trackEvent","trackPageview","trackClicks","ready"],a=0;a<s.length;a++){var c=s[a];e[t].prototype[c]=r(c)}var n=document.createElement("script");n.type="text/javascript",n.async=!0,n.src=("https:"===document.location.protocol?"https:":"http:")+"//cdn.treasuredata.com/sdk/1.7.2/td.min.js";var i=document.getElementsByTagName("script")[0];i.parentNode.insertBefore(n,i)}}("Treasure",this);</script><script type="text/javascript" charset="UTF-8" src="./blog_files/aid"></script><iframe id="rufous-sandbox" scrolling="no" frameborder="0" allowtransparency="true" allowfullscreen="true" style="position: absolute; visibility: hidden; display: none; width: 0px; height: 0px; padding: 0px; border: none;" title="Twitter analytics iframe" src="./blog_files/saved_resource(5).html"></iframe><iframe id="google_osd_static_frame_9977886185948" name="google_osd_static_frame" style="display: none; width: 0px; height: 0px;" src="./blog_files/saved_resource(6).html"></iframe><img src="./blog_files/dmp" width="1" height="1" border="0" style="display: none;"><img src="./blog_files/pixel" width="1" height="1" border="0" style="display: none;"><img src="./blog_files/adsct" width="1" height="1" border="0" style="display: none;"><script>(function(w,d,s,l,i){w[l]=w[l]||[];w[l].push({'gtm.start':new Date().getTime(),event:'gtm.js'});var f=d.getElementsByTagName(s)[0],j=d.createElement(s),dl=l!='dataLayer'?'&l='+l:'';j.async=true;j.src='//www.googletagmanager.com/gtm.js?id='+i+dl;f.parentNode.insertBefore(j,f);})(window,document,'script','dataLayer','GTM-P5GX4M');</script><iframe src="./blog_files/pd.html" width="0" height="0" 
style="display:none;"></iframe><div style="display: none; visibility: hidden;"><script type="text/javascript">!function(c,d,b,f){if(!d[c]){d[c]=function(){d[c].instances.push(this);this.init&&this.init()};d[c].instances=[];for(var a=0,e=["td_send","td_send_imid"];a<e.length;a++)d[c].prototype[e[a]]=function(a){return function(){this["tmp_"+a]=this["tmp_"+a]||[];this["tmp_"+a].push(Array.prototype.slice.call(arguments))}}(e[a]);a=b.getElementsByTagName(f)[0];b=b.createElement(f);b.async=!0;b.src="//cf.im-apps.net/sdk/tdim-0.11.2.js";a.parentNode.insertBefore(b,a)}}("TDIM",window,document,"script");var t=new TDIM;
1157 | t.td_api_key="312/b4f0042d7c26b4f44d2561bbb5c396349b54b10e";t.td_db="cosmi_8045";t.im_api_token="omO0CDJd98sxiIkb8Mzm7Q";t.gtm_dl="dataLayer";t.td_send_imid("pageviews");</script></div><div style="display: none; visibility: hidden;">
1158 | <script src="./blog_files/oct.js.ダウンロード" type="text/javascript"></script>
1159 | <script type="text/javascript">twttr.conversion.trackPid("nudt9",{tw_sale_amount:0,tw_order_quantity:0});</script>
1160 | <noscript></noscript>
1161 | </div><div style="display: none; visibility: hidden;">
1162 | <script src="./blog_files/oct.js.ダウンロード" type="text/javascript"></script>
1163 | <script type="text/javascript">twttr.conversion.trackPid("nv3b2",{tw_sale_amount:0,tw_order_quantity:0});</script>
1164 | <noscript></noscript>
1165 | </div><div style="display: none; visibility: hidden;"><script type="text/javascript">var _fout_queue=_fout_queue||{};void 0===_fout_queue.segment&&(_fout_queue.segment={});void 0===_fout_queue.segment.queue&&(_fout_queue.segment.queue=[]);_fout_queue.segment.queue.push({user_id:10595,advertiser_id:1808,contractor_id:5});(function(){var a=document.createElement("script");a.type="text/javascript";a.async=!0;a.src=("https:"==document.location.protocol?"https://":"http://")+"js.fout.jp/segmentation.js";var b=document.getElementsByTagName("script")[0];b.parentNode.insertBefore(a,b)})();</script>
1166 |     </div><div style="display: none; visibility: hidden;">
1167 | <script>!function(d,e,f,a,b,c){d.twq||(a=d.twq=function(){a.exe?a.exe.apply(a,arguments):a.queue.push(arguments)},a.version="1.1",a.queue=[],b=e.createElement(f),b.async=!0,b.src="//static.ads-twitter.com/uwt.js",c=e.getElementsByTagName(f)[0],c.parentNode.insertBefore(b,c))}(window,document,"script");twq("init","ny5vy");twq("track","PageView");</script>
1168 | </div><div style="display: none; visibility: hidden;">
1169 | <script>!function(b,e,f,g,a,c,d){b.fbq||(a=b.fbq=function(){a.callMethod?a.callMethod.apply(a,arguments):a.queue.push(arguments)},b._fbq||(b._fbq=a),a.push=a,a.loaded=!0,a.version="2.0",a.queue=[],c=e.createElement(f),c.async=!0,c.src=g,d=e.getElementsByTagName(f)[0],d.parentNode.insertBefore(c,d))}(window,document,"script","https://connect.facebook.net/en_US/fbevents.js");fbq("init","1733466696949178");fbq("track","PageView");</script>
1170 | <noscript></noscript>
1171 | 
1172 | 
1173 | </div><script src="./blog_files/adsct(1)" type="text/javascript"></script><script src="./blog_files/adsct(2)" type="text/javascript"></script><iframe src="./blog_files/beacon.html" style="display: none;"></iframe><script src="./blog_files/adsct(3)" type="text/javascript"></script></body></html>


--------------------------------------------------------------------------------
/tests/test_extractcontent3.py:
--------------------------------------------------------------------------------
 1 | """
 2 | Test
 3 | """
 4 | 
 5 | import pytest
 6 | from extractcontent3 import ExtractContent
 7 | 
 8 | class TestExtractContentHatenaBlog(object):
 9 |     @pytest.fixture()
10 |     def extractor(self):
11 |         html = open("./tests/blog.html").read()
12 |         extractor = ExtractContent()
13 |         extractor.analyse(html)
14 |         return extractor
15 | 
16 |     def test_text(self, extractor):
17 |         text, title = extractor.as_text()
18 |         assert text.strip().startswith("【Xonsh Advent Calendar 2017の13日目の記事です。】")
19 | 
20 |     def test_title(self, extractor):
21 |         text, title = extractor.as_text()
22 |         assert title == "Xonshを使ってみた - かんちゃんの備忘録"
23 | 


--------------------------------------------------------------------------------