├── .gitignore
├── README.md
├── luigi
    ├── data
    │   └── .gitkeep
    ├── logging.conf
    ├── luigi.cfg
    ├── model
    │   └── .gitkeep
    ├── sample_luigi.ipynb
    └── sample_luigi.py
├── mlflow
    ├── output.txt
    └── sample.py
├── nlp
    ├── swem.py
    ├── test_nlplot
    │   ├── 2020-08-08_pyldavis.html
    │   ├── introduction_nlplot_twitter.ipynb
    │   ├── unigram #データサイエンティストvs#kaggle.html
    │   └── words distribution #データサイエンティストvs#kaggle.html
    └── twitter_analytics_using_nlplot
    │   ├── .DS_Store
    │   ├── 2020-05-17_Co-occurrence network.html
    │   ├── 2020-05-17_Tree of Most Common Words.html
    │   ├── 2020-05-17_bi-gram.html
    │   ├── 2020-05-17_number of words distribution.html
    │   ├── 2020-05-17_pyldavis.html
    │   ├── 2020-05-17_sunburst chart.html
    │   ├── 2020-05-17_tri-gram.html
    │   ├── 2020-05-17_uni-gram.html
    │   ├── 2020-05-18_pyldavis.html
    │   ├── 2020-05-19_pyldavis.html
    │   ├── TwitterScraper.ipynb
    │   ├── introduction_nlplot_twitter.html
    │   ├── introduction_nlplot_twitter.ipynb
    │   ├── merge_data.ipynb
    │   ├── sample_twitter.csv
    │   ├── unigram #データサイエンティストvs#kaggle.html
    │   ├── wordcloud.png
    │   └── words distribution #データサイエンティストvs#kaggle.html
├── other
    └── hatenablog_css
    │   └── design.css
├── recommendation
    ├── graph
    │   ├── keras_tutorial.ipynb
    │   └── ml-latest-small
    │   │   └── README.txt
    └── matrix_factorization
    │   ├── data
    │       └── ml-25m
    │       │   └── README.txt
    │   └── keras_matrix_factorization.ipynb
└── streamlit
    └── sample.py


/.gitignore:
--------------------------------------------------------------------------------
  1 | # Created by https://www.gitignore.io/api/code,linux,macos,python,pycharm,windows,jupyternotebooks
  2 | # Edit at https://www.gitignore.io/?templates=code,linux,macos,python,pycharm,windows,jupyternotebooks
  3 | 
  4 | ### Code ###
  5 | .vscode/*
  6 | !.vscode/settings.json
  7 | !.vscode/tasks.json
  8 | !.vscode/launch.json
  9 | !.vscode/extensions.json
 10 | 
 11 | ### JupyterNotebooks ###
 12 | # gitignore template for Jupyter Notebooks
 13 | # website: http://jupyter.org/
 14 | 
 15 | .ipynb_checkpoints
 16 | */.ipynb_checkpoints/*
 17 | 
 18 | # IPython
 19 | profile_default/
 20 | ipython_config.py
 21 | 
 22 | # Remove previous ipynb_checkpoints
 23 | #   git rm -r .ipynb_checkpoints/
 24 | 
 25 | ### Linux ###
 26 | *~
 27 | 
 28 | # temporary files which can be created if a process still has a handle open of a deleted file
 29 | .fuse_hidden*
 30 | 
 31 | # KDE directory preferences
 32 | .directory
 33 | 
 34 | # Linux trash folder which might appear on any partition or disk
 35 | .Trash-*
 36 | 
 37 | # .nfs files are created when an open file is removed but is still being accessed
 38 | .nfs*
 39 | 
 40 | ### macOS ###
 41 | # General
 42 | .DS_Store
 43 | .AppleDouble
 44 | .LSOverride
 45 | 
 46 | # Icon must end with two \r
 47 | Icon
 48 | 
 49 | # Thumbnails
 50 | ._*
 51 | 
 52 | # Files that might appear in the root of a volume
 53 | .DocumentRevisions-V100
 54 | .fseventsd
 55 | .Spotlight-V100
 56 | .TemporaryItems
 57 | .Trashes
 58 | .VolumeIcon.icns
 59 | .com.apple.timemachine.donotpresent
 60 | 
 61 | # Directories potentially created on remote AFP share
 62 | .AppleDB
 63 | .AppleDesktop
 64 | Network Trash Folder
 65 | Temporary Items
 66 | .apdisk
 67 | 
 68 | ### PyCharm ###
 69 | # Covers JetBrains IDEs: IntelliJ, RubyMine, PhpStorm, AppCode, PyCharm, CLion, Android Studio and WebStorm
 70 | # Reference: https://intellij-support.jetbrains.com/hc/en-us/articles/206544839
 71 | 
 72 | # User-specific stuff
 73 | .idea/**/workspace.xml
 74 | .idea/**/tasks.xml
 75 | .idea/**/usage.statistics.xml
 76 | .idea/**/dictionaries
 77 | .idea/**/shelf
 78 | 
 79 | # Generated files
 80 | .idea/**/contentModel.xml
 81 | 
 82 | # Sensitive or high-churn files
 83 | .idea/**/dataSources/
 84 | .idea/**/dataSources.ids
 85 | .idea/**/dataSources.local.xml
 86 | .idea/**/sqlDataSources.xml
 87 | .idea/**/dynamic.xml
 88 | .idea/**/uiDesigner.xml
 89 | .idea/**/dbnavigator.xml
 90 | 
 91 | # Gradle
 92 | .idea/**/gradle.xml
 93 | .idea/**/libraries
 94 | 
 95 | # Gradle and Maven with auto-import
 96 | # When using Gradle or Maven with auto-import, you should exclude module files,
 97 | # since they will be recreated, and may cause churn.  Uncomment if using
 98 | # auto-import.
 99 | # .idea/modules.xml
100 | # .idea/*.iml
101 | # .idea/modules
102 | # *.iml
103 | # *.ipr
104 | 
105 | # CMake
106 | cmake-build-*/
107 | 
108 | # Mongo Explorer plugin
109 | .idea/**/mongoSettings.xml
110 | 
111 | # File-based project format
112 | *.iws
113 | 
114 | # IntelliJ
115 | out/
116 | 
117 | # mpeltonen/sbt-idea plugin
118 | .idea_modules/
119 | 
120 | # JIRA plugin
121 | atlassian-ide-plugin.xml
122 | 
123 | # Cursive Clojure plugin
124 | .idea/replstate.xml
125 | 
126 | # Crashlytics plugin (for Android Studio and IntelliJ)
127 | com_crashlytics_export_strings.xml
128 | crashlytics.properties
129 | crashlytics-build.properties
130 | fabric.properties
131 | 
132 | # Editor-based Rest Client
133 | .idea/httpRequests
134 | 
135 | # Android studio 3.1+ serialized cache file
136 | .idea/caches/build_file_checksums.ser
137 | 
138 | ### PyCharm Patch ###
139 | # Comment Reason: https://github.com/joeblau/gitignore.io/issues/186#issuecomment-215987721
140 | 
141 | # *.iml
142 | # modules.xml
143 | # .idea/misc.xml
144 | # *.ipr
145 | 
146 | # Sonarlint plugin
147 | .idea/**/sonarlint/
148 | 
149 | # SonarQube Plugin
150 | .idea/**/sonarIssues.xml
151 | 
152 | # Markdown Navigator plugin
153 | .idea/**/markdown-navigator.xml
154 | .idea/**/markdown-navigator/
155 | 
156 | ### Python ###
157 | # Byte-compiled / optimized / DLL files
158 | __pycache__/
159 | *.py[cod]
160 | *$py.class
161 | 
162 | # C extensions
163 | *.so
164 | 
165 | # Distribution / packaging
166 | .Python
167 | build/
168 | develop-eggs/
169 | dist/
170 | downloads/
171 | eggs/
172 | .eggs/
173 | lib/
174 | lib64/
175 | parts/
176 | sdist/
177 | var/
178 | wheels/
179 | pip-wheel-metadata/
180 | share/python-wheels/
181 | *.egg-info/
182 | .installed.cfg
183 | *.egg
184 | MANIFEST
185 | 
186 | # PyInstaller
187 | #  Usually these files are written by a python script from a template
188 | #  before PyInstaller builds the exe, so as to inject date/other infos into it.
189 | *.manifest
190 | *.spec
191 | 
192 | # Installer logs
193 | pip-log.txt
194 | pip-delete-this-directory.txt
195 | 
196 | # Unit test / coverage reports
197 | htmlcov/
198 | .tox/
199 | .nox/
200 | .coverage
201 | .coverage.*
202 | .cache
203 | nosetests.xml
204 | coverage.xml
205 | *.cover
206 | .hypothesis/
207 | .pytest_cache/
208 | 
209 | # Translations
210 | *.mo
211 | *.pot
212 | 
213 | # Scrapy stuff:
214 | .scrapy
215 | 
216 | # Sphinx documentation
217 | docs/_build/
218 | 
219 | # PyBuilder
220 | target/
221 | 
222 | # pyenv
223 | .python-version
224 | 
225 | # pipenv
226 | #   According to pypa/pipenv#598, it is recommended to include Pipfile.lock in version control.
227 | #   However, in case of collaboration, if having platform-specific dependencies or dependencies
228 | #   having no cross-platform support, pipenv may install dependencies that don't work, or not
229 | #   install all needed dependencies.
230 | #Pipfile.lock
231 | 
232 | # celery beat schedule file
233 | celerybeat-schedule
234 | 
235 | # SageMath parsed files
236 | *.sage.py
237 | 
238 | # Spyder project settings
239 | .spyderproject
240 | .spyproject
241 | 
242 | # Rope project settings
243 | .ropeproject
244 | 
245 | # Mr Developer
246 | .mr.developer.cfg
247 | .project
248 | .pydevproject
249 | 
250 | # mkdocs documentation
251 | /site
252 | 
253 | # mypy
254 | .mypy_cache/
255 | .dmypy.json
256 | dmypy.json
257 | 
258 | # Pyre type checker
259 | .pyre/
260 | 
261 | ### Windows ###
262 | # Windows thumbnail cache files
263 | Thumbs.db
264 | Thumbs.db:encryptable
265 | ehthumbs.db
266 | ehthumbs_vista.db
267 | 
268 | # Dump file
269 | *.stackdump
270 | 
271 | # Folder config file
272 | [Dd]esktop.ini
273 | 
274 | # Recycle Bin used on file shares
275 | $RECYCLE.BIN/
276 | 
277 | # Windows Installer files
278 | *.cab
279 | *.msi
280 | *.msix
281 | *.msm
282 | *.msp
283 | 
284 | # Windows shortcuts
285 | *.lnk
286 | 
287 | # End of https://www.gitignore.io/api/code,linux,macos,python,pycharm,windows,jupyternotebooks
288 | 
289 | .idea
290 | 
291 | # add
292 | *.csv
293 | *.tsv
294 | *.bz
295 | *.pkl
296 | *.pyc
297 | *.model
298 | *.png
299 | *.dat
300 | *.zip
301 | 


--------------------------------------------------------------------------------
/README.md:
--------------------------------------------------------------------------------
1 | # takapy_blog
2 | 


--------------------------------------------------------------------------------
/luigi/data/.gitkeep:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/takapy0210/geek_blog/e36604f01d26f4d14bdacc6bb2995c929d49fdfa/luigi/data/.gitkeep


--------------------------------------------------------------------------------
/luigi/logging.conf:
--------------------------------------------------------------------------------
 1 | [loggers]
 2 | keys=root
 3 | 
 4 | [handlers]
 5 | keys=streamHandler
 6 | 
 7 | [logger_root]
 8 | level=INFO
 9 | handlers=streamHandler
10 | 
11 | [formatters]
12 | keys=simpleFormatter
13 | 
14 | [handler_streamHandler]
15 | class=logging.StreamHandler
16 | level=INFO
17 | formatter=simpleFormatter
18 | 
19 | [formatter_simpleFormatter]
20 | format=[%(asctime)s] [%(levelname)5s] %(message)s
21 | datefmt=%Y-%m-%d %H:%M:%S
22 | 


--------------------------------------------------------------------------------
/luigi/luigi.cfg:
--------------------------------------------------------------------------------
 1 | [core]
 2 | # 不要なログを出力しないための設定
 3 | log_level=INFO
 4 | logging_conf_file=logging.conf
 5 | 
 6 | [retcode]
 7 | # エラーを通知するための設定
 8 | already_running=10
 9 | missing_data=10
10 | not_run=10
11 | task_failed=10
12 | scheduling_error=10
13 | unhandled_exception=10
14 | 


--------------------------------------------------------------------------------
/luigi/model/.gitkeep:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/takapy0210/geek_blog/e36604f01d26f4d14bdacc6bb2995c929d49fdfa/luigi/model/.gitkeep


--------------------------------------------------------------------------------
/luigi/sample_luigi.py:
--------------------------------------------------------------------------------
  1 | import pickle
  2 | import warnings
  3 | import logging
  4 | 
  5 | import pandas as pd
  6 | import luigi
  7 | from luigi.util import requires
  8 | from sklearn import datasets
  9 | from sklearn.preprocessing import OneHotEncoder
 10 | from sklearn.model_selection import train_test_split
 11 | from sklearn.ensemble import RandomForestClassifier
 12 | from sklearn.metrics import classification_report, accuracy_score
 13 | 
 14 | warnings.filterwarnings("ignore")
 15 | logger = logging.getLogger()
 16 | 
 17 | 
 18 | class LoadDataset(luigi.Task):
 19 |     """データセットをロードするクラス"""
 20 |     task_namespace = 'titanic_tasks'
 21 | 
 22 |     def output(self):
 23 |         # return luigi.LocalTarget("data/titanic.csv")  # csvで出力する場合
 24 |         return luigi.LocalTarget("data/titanic.pkl", format=luigi.format.Nop)
 25 | 
 26 |     def run(self):
 27 |         # titanicデータの読み込み
 28 |         df = datasets.fetch_openml("titanic", version=1, as_frame=True, return_X_y=False).frame
 29 |         logger.info(f'Data shape: {df.shape}')
 30 | 
 31 |         # pklで出力する
 32 |         with self.output().open('w') as f:
 33 |             f.write(pickle.dumps(df, protocol=pickle.HIGHEST_PROTOCOL))
 34 | 
 35 |         # csvで出力したい場合は普通にpandasで出力する
 36 |         # 型が崩れる可能性があるので非推奨ではある
 37 |         # df.to_csv("data/titanic.csv", index=False)
 38 | 
 39 | 
 40 | @requires(LoadDataset)
 41 | class Processing(luigi.Task):
 42 |     """データの加工を行う"""
 43 |     task_namespace = 'titanic_tasks'
 44 | 
 45 |     def output(self):
 46 |         # return luigi.LocalTarget("data/processing_titanic.csv")  # csvで出力する場合
 47 |         return luigi.LocalTarget("data/processing_titanic.pkl", format=luigi.format.Nop)
 48 | 
 49 |     def run(self):
 50 |         # データの読み込み
 51 |         with self.input().open() as f:
 52 |             # df = pd.read_csv(f)  # pandasで読み込むパターン
 53 |             df = pickle.load(f)  # pickleで読み込むパターン
 54 |         logger.info(f'Before Data shape: {df.shape}')
 55 | 
 56 |         # 欠損値処理
 57 |         df.loc[:, 'age'] = df['age'].fillna(df['age'].mean())
 58 |         df.loc[:, 'fare'] = df['fare'].fillna(df['fare'].mean())
 59 | 
 60 |         # カテゴリエンコード
 61 |         categorical_cols = ["pclass", "sex", "embarked"]
 62 |         df = self.sklearn_oh_encoder(df=df, cols=categorical_cols, drop_col=True)
 63 |         logger.info(f'After Data shape: {df.shape}')
 64 | 
 65 |         # 学習に使用するカラムのみを出力
 66 |         use_cols = [
 67 |             'survived',
 68 |             'age',
 69 |             'sibsp',
 70 |             'parch',
 71 |             'fare',
 72 |             'pclass_1.0',
 73 |             'pclass_2.0',
 74 |             'pclass_3.0',
 75 |             'sex_female',
 76 |             'sex_male',
 77 |             'embarked_C',
 78 |             'embarked_Q',
 79 |             'embarked_S',
 80 |             'embarked_nan'
 81 |         ]
 82 |         df = df[use_cols]
 83 | 
 84 |         # 保存
 85 |         with self.output().open('w') as f:
 86 |             f.write(pickle.dumps(df, protocol=pickle.HIGHEST_PROTOCOL))
 87 | 
 88 |     def sklearn_oh_encoder(self, df, cols, drop_col=False):
 89 |         """カテゴリ変換
 90 |         sklearnのOneHotEncoderでEncodingを行う
 91 | 
 92 |         Args:
 93 |             df: カテゴリ変換する対象のデータフレーム
 94 |             cols (list of str): カテゴリ変換する対象のカラムリスト
 95 |             drop_col (bool): エンコード対象のカラムを削除するか否か
 96 | 
 97 |         Returns:
 98 |             pd.Dataframe: dfにカテゴリ変換したカラムを追加したデータフレーム
 99 |         """
100 |         output_df = df.copy()
101 |         for col in cols:
102 |             ohe = OneHotEncoder(sparse=False, handle_unknown='ignore')
103 |             ohe_df = pd.DataFrame((ohe.fit_transform(output_df[[col]])), columns=ohe.categories_[0])
104 |             ohe_df = ohe_df.add_prefix(f'{col}_')
105 |             # 元のDFに結合
106 |             output_df = pd.concat([output_df, ohe_df], axis=1)
107 |             if drop_col:
108 |                 output_df = output_df.drop(col, axis=1)
109 |         return output_df
110 | 
111 | 
112 | @requires(Processing)
113 | class TrainTestSplit(luigi.Task):
114 |     """データを学習データと検証データに分割する"""
115 |     task_namespace = 'titanic_tasks'
116 | 
117 |     def output(self):
118 |         return [luigi.LocalTarget("data/processing_titanic_train.pkl", format=luigi.format.Nop),
119 |                 luigi.LocalTarget("data/processing_titanic_test.pkl", format=luigi.format.Nop)]
120 | 
121 |     def run(self):
122 |         # データの読み込み
123 |         with self.input().open() as f:
124 |             df = pickle.load(f)  # pickleで読み込むパターン
125 | 
126 |         train, test = train_test_split(df, test_size=0.3, shuffle=True, stratify=df['survived'], random_state=42)
127 |         logger.info(f'Train shape: {train.shape}')
128 |         logger.info(f'Test shape: {test.shape}')
129 | 
130 |         with self.output()[0].open('w') as f:
131 |             f.write(pickle.dumps(train, protocol=pickle.HIGHEST_PROTOCOL))
132 | 
133 |         with self.output()[1].open('w') as f:
134 |             f.write(pickle.dumps(test, protocol=pickle.HIGHEST_PROTOCOL))
135 | 
136 | 
137 | @requires(TrainTestSplit)
138 | class Training(luigi.Task):
139 |     """学習"""
140 |     task_namespace = 'titanic_tasks'
141 | 
142 |     def output(self):
143 |         return luigi.LocalTarget("model/random_forest.model", format=luigi.format.Nop)
144 | 
145 |     def run(self):
146 |         # データの読み込み
147 |         with self.input()[0].open() as f:
148 |             train = pickle.load(f)
149 | 
150 |         logger.info(f'Train shape: {train.shape}')
151 | 
152 |         target_col = 'survived'
153 |         X_train = train.drop(target_col, axis=1)
154 |         y_train = train[target_col]
155 | 
156 |         model = RandomForestClassifier(random_state=1)
157 |         model.fit(X_train, y_train)
158 | 
159 |         # 保存
160 |         with self.output().open('w') as f:
161 |             f.write(pickle.dumps(model, protocol=pickle.HIGHEST_PROTOCOL))
162 | 
163 | 
164 | @requires(TrainTestSplit, Training)
165 | class Predict(luigi.Task):
166 |     """推論"""
167 |     task_namespace = 'titanic_tasks'
168 | 
169 |     def output(self):
170 |         return luigi.LocalTarget("data/predict_data.csv")
171 | 
172 |     def run(self):
173 |         # データの読み込み
174 |         with self.input()[0][1].open() as f:
175 |             valid = pickle.load(f)
176 | 
177 |         # モデルの読み込み
178 |         with self.input()[1].open() as f:
179 |             model = pickle.load(f)
180 | 
181 |         logger.info(f'Valid data shape: {valid.shape}')
182 | 
183 |         target_col = 'survived'
184 |         X_valid = valid.drop(target_col, axis=1)
185 |         y_valid = valid[target_col]
186 | 
187 |         # 予測
188 |         y_pred = model.predict(X_valid)
189 |         logger.info(f'Accuracy Score: {accuracy_score(y_valid, y_pred)}')
190 |         logger.info('\n' + classification_report(y_valid, y_pred))
191 | 
192 |         # # 保存
193 |         valid.loc[:, 'y_pred'] = y_pred
194 |         valid.to_csv('data/predict_data.csv', index=False)
195 | 
196 | 
197 | @requires(Predict)
198 | class MyInvokerTask(luigi.WrapperTask):
199 |     task_namespace = 'titanic_tasks'
200 |     pass
201 | 
202 | 
203 | if __name__ == '__main__':
204 | 
205 |     # 設定ファイルの読み込み
206 |     luigi.configuration.LuigiConfigParser.add_config_path('./luigi.cfg')
207 |     # 実行
208 |     luigi.build([MyInvokerTask()], local_scheduler=True)
209 |     # luigi.build([MyInvokerTask()], local_scheduler=False)  # ブラウザからチェックしたい場合はこちら
210 | 


--------------------------------------------------------------------------------
/mlflow/output.txt:
--------------------------------------------------------------------------------
1 | Hello world sample!


--------------------------------------------------------------------------------
/mlflow/sample.py:
--------------------------------------------------------------------------------
 1 | import mlflow
 2 | from mlflow import log_metric, log_param, log_artifact, set_tag
 3 | 
 4 | if __name__ == "__main__":
 5 | 
 6 |     tracking_uri = '/Users/takapy/python/competition/mlflow/mlruns'
 7 |     mlflow.set_tracking_uri(tracking_uri)
 8 |     mlflow.set_experiment("test-experiment")
 9 |     mlflow.start_run(run_name='run_name001')
10 | 
11 |     # Log a parameter (key-value pair)
12 |     log_param('param1', 42)
13 | 
14 |     # Log a metric; metrics can be updated throughout the run
15 |     log_metric('fold1_score', 9.99)
16 |     log_metric('fold2_score', 9.92)
17 |     log_metric('fold3_score', 9.78)
18 | 
19 |     # Log an artifact (output file)
20 |     with open("output.txt", "w") as f:
21 |         f.write("Hello world sample!")
22 | 
23 |     log_artifact("output.txt")
24 | 
25 |     set_tag('tag1', 'this is tag1')
26 |     set_tag('tag2', 'this is tag2')
27 | 
28 |     mlflow.end_run()
29 | 


--------------------------------------------------------------------------------
/nlp/swem.py:
--------------------------------------------------------------------------------
  1 | import numpy as np
  2 | import pandas as pd
  3 | from gensim.models import word2vec
  4 | 
  5 | 
  6 | class SWEM():
  7 |     """単語埋め込み (Word Embedding) のみを利用して文章埋め込み (Sentence Embedding) を計算する
  8 | 
  9 |     参考URL:https://arxiv.org/abs/1805.09843v1
 10 | 
 11 |     Attributes:
 12 |         word2vec (word2vec): word2vecの事前学習モデル
 13 |         dim (int): word2vecの事前学習モデルの次元数
 14 |         oov_initialize_range (int): word2vecの事前学習モデルに含まれていない単語に割り当てるベクトル
 15 | 
 16 |     """
 17 | 
 18 |     def __init__(self, word2vec_model_name):
 19 |         self.word2vec = word2vec.Word2Vec.load(word2vec_model_name)
 20 |         self.dim = self.word2vec.trainables.layer1_size
 21 |         self.oov_initialize_range = (-0.01, 0.01)
 22 | 
 23 |     def get_word_embeddings(self, words) -> list:
 24 |         """word2vecから単語のベクトルを取得
 25 | 
 26 |         Args:
 27 |             words (list of str): 重みを取得したい単語のリスト
 28 | 
 29 |         Returns:
 30 |             list (float): 全単語のベクトルが格納された2次元リスト
 31 | 
 32 |         """
 33 |         np.random.seed(abs(hash(len(words))) % (10 ** 8))
 34 |         vectors = []
 35 |         for w in words:
 36 |             if w in self.word2vec:
 37 |                 vectors.append(self.word2vec[w])
 38 |             else:
 39 |                 vectors.append(np.random.uniform(self.oov_initialize_range[0], self.oov_initialize_range[1], self.dim))
 40 |         return vectors
 41 | 
 42 |     def average_pooling(self, text) -> np.array:
 43 |         """textに含まれる全単語ベクトルの次元毎の平均を計算する
 44 | 
 45 |         Args:
 46 |             text (str): ベクトルを計算したい文章
 47 | 
 48 |         Returns:
 49 |             np.array: 計算後のベクトル
 50 | 
 51 |         """
 52 |         emb = []
 53 |         for words in text:
 54 |             word_embeddings = self.get_word_embeddings(words)
 55 |             emb.append(np.nanmean(word_embeddings, axis=0))
 56 |         return np.array(emb)
 57 | 
 58 |     def max_pooling(self, text) -> np.array:
 59 |         """textに含まれる全単語ベクトルの次元毎の最大値を計算する
 60 | 
 61 |         Args:
 62 |             text (str): ベクトルを計算したい文章
 63 | 
 64 |         Returns:
 65 |             np.array: 計算後のベクトル
 66 | 
 67 |         """
 68 |         emb = []
 69 |         for words in text:
 70 |             word_embeddings = self.get_word_embeddings(words)
 71 |             emb.append(np.max(word_embeddings, axis=0))
 72 |         return np.array(emb)
 73 | 
 74 |     def concat_average_max_pooling(self, text) -> np.array:
 75 |         """textに含まれる全単語ベクトルの次元毎の平均値と最大値を計算した後それぞれを結合したベクトルを計算する
 76 | 
 77 |         平均ベクトル[1, 3, 4, 2, -2]と最大値ベクトル[5, 7, 3, 1, 3]があった場合に
 78 |         [1, 3, 4, 2, -2, 5, 7, 3, 1, 3]のベクトルを定義しreturnする
 79 | 
 80 |         Args:
 81 |             text (str): ベクトルを計算したい文章
 82 | 
 83 |         Returns:
 84 |             np.array: 計算後のベクトル
 85 | 
 86 |         """
 87 |         emb = []
 88 |         for words in text:
 89 |             word_embeddings = self.get_word_embeddings(words)
 90 |             emb.append(np.r_[np.nanmean(word_embeddings, axis=0), np.max(word_embeddings, axis=0)])
 91 |         return np.array(emb)
 92 | 
 93 |     def hier_or_avg_pooling(self, text, window) -> np.array:
 94 |         """textに含まれる単語に対してn-gramのように固定長のウィンドウでaverage-poolingした結果に対してmax poolingする
 95 | 
 96 |         単語数がwindowに満たない場合は、単純な平均（average_pooling）を計算する
 97 | 
 98 |         Args:
 99 |             text (str): ベクトルを計算したい文章
100 |             window (int): n-gramのウィンドウの幅
101 | 
102 |         Returns:
103 |             np.array: 計算後のベクトル
104 | 
105 |         """
106 |         emb = []
107 |         for words in text:
108 |             word_embeddings = self.get_word_embeddings(words)
109 |             text_len = len(word_embeddings)
110 |             if window > text_len:
111 |                 emb.append(np.nanmean(word_embeddings, axis=0))
112 |             else:
113 |                 window_average_pooling_vec = [np.nanmean(word_embeddings[i:i + window], axis=0)
114 |                                               for i in range(text_len - window + 1)]
115 |                 emb.append(np.max(window_average_pooling_vec, axis=0))
116 |         return np.array(emb)
117 | 
118 |     def calculate_emb(self, df, col, window, swem_type) -> pd.DataFrame:
119 |         """swemを用いて質問の埋め込みを算出する
120 | 
121 |         Args:
122 |             df (pd.Dataframe): 対象のDF
123 |             col (str): token化後のテキストが設定されているカラム名
124 |             window (int): hierarchical_poolingする際のwindow数
125 |             swem_type (int): SWEMをどの計算方法で算出するかを指定
126 |                             （1:average_pooling, 2:max_pooling, 3:concat_average_max_pooling, 4:hier_or_avg_pooling）
127 | 
128 |         Returns:
129 |             pd.DataFrame: 埋め込み(N次元)のデータフレーム
130 | 
131 |         """
132 | 
133 |         # 質問の埋め込みを計算
134 |         # swem_typeによって埋め込みの計算処理を分ける
135 |         if swem_type == 1:
136 |             swem_emb = self.average_pooling(df[col].values.tolist())
137 |         elif swem_type == 2:
138 |             swem_emb = self.max_pooling(df[col].values.tolist())
139 |         elif swem_type == 3:
140 |             swem_emb = self.concat_average_max_pooling(df[col].values.tolist())
141 |         else:
142 |             swem_emb = self.hier_or_avg_pooling(df[col].values.tolist(), window)
143 | 
144 |         # データフレームに変換
145 |         swem_emb = pd.DataFrame(swem_emb)
146 |         swem_emb = swem_emb.add_prefix('d_')
147 |         return swem_emb
148 | 


--------------------------------------------------------------------------------
/nlp/test_nlplot/2020-08-08_pyldavis.html:
--------------------------------------------------------------------------------
 1 | 
 2 | <link rel="stylesheet" type="text/css" href="https://cdn.rawgit.com/bmabey/pyLDAvis/files/ldavis.v1.0.0.css">
 3 | 
 4 | 
 5 | <div id="ldavis_el660805246056512115579680"></div>
 6 | <script type="text/javascript">
 7 | 
 8 | var ldavis_el660805246056512115579680_data = {"mdsDat": {"x": [0.08507818728685379, -0.08507818728685379], "y": [0.0, 0.0], "topics": [1, 2], "cluster": [1, 1], "Freq": [55.54728698730469, 44.45270919799805]}, "tinfo": {"Term": ["kaggle", "\u30c7\u30fc\u30bf\u30b5\u30a4\u30a8\u30f3\u30c6\u30a3\u30b9\u30c8", "machinelearning", "python", "\u30de\u30fc\u30b1\u30c6\u30a3\u30f3\u30b0", "\u30c7\u30fc\u30bf\u30b5\u30a4\u30a8\u30f3\u30b9", "\u6642\u7d661000\u5186", "\u30a4\u30f3\u30bf\u30fc\u30f3\u30b7\u30c3\u30d7", "\u30a4\u30f3\u30bf\u30fc\u30f3", "\u5916\u8cc7\u7cfb\u4f01\u696d", "\u5916\u8cc7\u7cfb", "\u7d71\u8a08\u5b66\u5c02\u653b", "\u7d71\u8a08", "\u30d3\u30c3\u30b0\u30c7\u30fc\u30bf", "\u6a5f\u68b0\u5b66\u7fd2", "superintelligence", "ai", "\u7d4c\u6e08\u5b66\u5f92", "deeplearning", "\u30df\u30af\u30ed\u7d4c\u6e08\u5b66", "iot", "\u30c7\u30fc\u30bf\u30de\u30a4\u30cb\u30f3\u30b0", "bragging", "\u30d3\u30b8\u30cd\u30b9\u7d71\u8a08", "\u30d0\u30c3\u30af\u30aa\u30d5\u30a3\u30b9", "\u6c42\u4eba", "\u30de\u30af\u30ed\u7d4c\u6e08\u5b66", "titanic", "\u5927\u962a", "\u95a2\u897f", "\u6642\u7d661000\u5186", "\u30de\u30fc\u30b1\u30c6\u30a3\u30f3\u30b0", "\u30a4\u30f3\u30bf\u30fc\u30f3\u30b7\u30c3\u30d7", "\u30a4\u30f3\u30bf\u30fc\u30f3", "\u30c7\u30fc\u30bf\u30de\u30a4\u30cb\u30f3\u30b0", "\u30d3\u30c3\u30b0\u30c7\u30fc\u30bf", "\u30d3\u30b8\u30cd\u30b9\u7d71\u8a08", "doe", "\u5b9f\u9a13\u8a08\u753b\u6cd5", "\u30d0\u30c3\u30af\u30aa\u30d5\u30a3\u30b9", "\u6771\u4eac\u90fd\u6e2f\u533a", "\u30c7\u30fc\u30bf\u30b5\u30a4\u30a8\u30f3\u30c6\u30a3\u30b9\u30c8\u3042\u308b\u3042\u308b", "\u6771\u4eac\u90fd\u6e0b\u8c37\u533a", "mercariprize", "ai\u30a8\u30f3\u30b8\u30cb\u30a2", "it\u7d4c\u55b6", "\u6c42\u4eba", "freelancestart", "\u6848\u4ef6\u76f8\u5834", "\u30c7\u30fc\u30bf\u30b5\u30a4\u30a8\u30f3\u30b9", "\u7d4c\u6e08\u5b66\u5f92", "\u30c7\u30fc\u30bf\u6d3b\u7528", "\u30a8\u30af\u30b9\u30d7\u30ed\u30e9\u30c8\u30ea\u30fc", "ibmspss", "\u30d5\u30ea\u30fc\u30e9\u30f3\u30b9", "\u6a5f\u68b0\u5b66\u7fd2\u30a8\u30f3\u30b8\u30cb\u30a2", "\u897f\u7530\u52d8\u4e00\u90ce", "\u7b4b\u30c8\u30ec", "\u30ec\u30b3\u30e1\u30f3\u30c9", "\u30a8\u30f3\u30b8\u30cb\u30a2\u8ee2\u8077", "\u30df\u30af\u30ed\u7d4c\u6e08\u5b66", "\u30c7\u30fc\u30bf\u30b5\u30a4\u30a8\u30f3\u30c6\u30a3\u30b9\u30c8", "bigdata", "\u30de\u30af\u30ed\u7d4c\u6e08\u5b66", "\u30d7\u30ed\u30b0\u30e9\u30df\u30f3\u30b0\u5b66\u7fd2", "uber", "\u90fd\u5e02\u7d4c\u6e08", "\u7d71\u8a08\u5b66", "\u4ea4\u901a\u7d4c\u6e08", "\u30c7\u30fc\u30bf\u5206\u6790", "datascience", "\u6a5f\u68b0\u5b66\u7fd2", "\u99c6\u3051\u51fa\u3057\u30a8\u30f3\u30b8\u30cb\u30a2", "\u30d7\u30ed\u30b0\u30e9\u30df\u30f3\u30b0\u521d\u5fc3\u8005", "kaggle", "datascientist", "ai", "\u4eca\u65e5\u306e\u7a4d\u307f\u4e0a\u3052", "\u99c6\u3051\u51fa\u3057\u30a8\u30f3\u30b8\u30cb\u30a2\u3068\u7e4b\u304c\u308a\u305f\u3044", "python", "\u4eba\u5de5\u77e5\u80fd", "\u7d71\u8a08", "100daysofcode", "machinelearning", "javascript", "winning", "\u5916\u8cc7\u7cfb\u4f01\u696d", "deep", "machine", "\u5916\u8cc7\u7cfb", "kansaiaipub", "\u8133\u6ce2", "santander", "\u30c1\u30e5\u30fc\u30c8\u30ea\u30a2\u30eb", "word2vec", "gcp", "\u30a8\u30f3\u30b8\u30cb\u30a2\u3068\u7e4b\u304c\u308a\u305f\u3044", "kernel", "golang", "nodered", "\u30e1\u30eb\u30ab\u30ea", "\u5927\u5b66\u767a", "\u5730\u57df\u79d1\u5b66", "\u521d\u5fc3\u8005\u5411\u3051", "\u6280\u8853\u66f8\u5178", "nodejs", "logisticregression", "\u91cf\u5b50\u30b3\u30f3\u30d4\u30e5\u30fc\u30bf", "\u7d71\u8a08\u5b66\u5c02\u653b", "ibmdojo", "\u5927\u5b66\u9662\u4fee\u58eb", "pytorch", "\u6295\u7968", "superintelligence", "deeplearning", "bragging", "\u306f\u3066\u306a\u30d6\u30ed\u30b0", "python", "iot", "kaggle", "\u7d71\u8a08", "it", "ml", "\u52c9\u5f37\u4f1a", "\u5927\u962a", "\u95a2\u897f", "kaggleguide", "lightgbm", "ai", "titanic", "\u6a5f\u68b0\u5b66\u7fd2", "note", "sql", "\u30a8\u30f3\u30b8\u30cb\u30a2", "signate", "\u7d71\u8a08\u5b66", "\u30c7\u30fc\u30bf\u30b5\u30a4\u30a8\u30f3\u30c6\u30a3\u30b9\u30c8", "\u99c6\u3051\u51fa\u3057\u30a8\u30f3\u30b8\u30cb\u30a2\u3068\u7e4b\u304c\u308a\u305f\u3044", "\u30c7\u30fc\u30bf\u5206\u6790", "100daysofcode", "\u4eba\u5de5\u77e5\u80fd", "\u30c7\u30fc\u30bf\u30b5\u30a4\u30a8\u30f3\u30b9", "dena", "datascience", "\u4ea4\u901a\u7d4c\u6e08"], "Freq": [1118.0, 1254.0, 151.0, 224.0, 185.0, 360.0, 153.0, 155.0, 158.0, 99.0, 99.0, 98.0, 131.0, 81.0, 447.0, 43.0, 187.0, 57.0, 25.0, 57.0, 23.0, 25.0, 19.0, 21.0, 22.0, 29.0, 58.0, 26.0, 20.0, 20.0, 148.13937377929688, 177.83094787597656, 148.51284790039062, 150.3623504638672, 23.90238380432129, 75.82811737060547, 19.888797760009766, 12.205193519592285, 12.096858978271484, 21.1438045501709, 12.071139335632324, 11.287328720092773, 7.416588306427002, 11.830485343933105, 16.95538330078125, 8.824895858764648, 26.400768280029297, 7.331340312957764, 5.821954250335693, 316.46844482421875, 50.329017639160156, 5.0215888023376465, 4.299503803253174, 4.296093940734863, 12.15629768371582, 20.727745056152344, 4.2820563316345215, 6.416612148284912, 4.984185218811035, 4.270105361938477, 49.444339752197266, 1036.5762939453125, 12.086221694946289, 47.684120178222656, 11.852521896362305, 46.65898132324219, 46.09613037109375, 211.55172729492188, 44.902103424072266, 74.87315368652344, 31.280296325683594, 208.8214874267578, 18.050914764404297, 23.01530647277832, 283.5565185546875, 19.326860427856445, 73.9218978881836, 22.589630126953125, 33.403751373291016, 42.72502136230469, 21.717185974121094, 30.836090087890625, 20.262720108032227, 138.98007202148438, 7.638554573059082, 8.389654159545898, 89.51296997070312, 4.154168605804443, 4.1230669021606445, 88.53761291503906, 5.713052272796631, 4.891554355621338, 10.591192245483398, 4.055779933929443, 4.863409042358398, 5.663386821746826, 8.088590621948242, 4.037876605987549, 5.643205165863037, 5.634045600891113, 4.806703567504883, 4.799924850463867, 3.996715784072876, 3.9955856800079346, 4.787806987762451, 5.560303211212158, 3.16518235206604, 3.952819585800171, 84.48165130615234, 3.1538352966308594, 3.153036117553711, 4.702117443084717, 3.1191694736480713, 36.5382194519043, 21.823575973510742, 16.304643630981445, 11.664963722229004, 181.93736267089844, 19.836427688598633, 835.1495361328125, 100.68859100341797, 12.950469970703125, 12.889800071716309, 8.544548988342285, 15.907870292663574, 15.886055946350098, 12.534090042114258, 7.668683052062988, 113.75923919677734, 19.572282791137695, 238.68614196777344, 10.217280387878418, 11.872096061706543, 24.502782821655273, 11.369624137878418, 93.4170150756836, 217.8430633544922, 26.186643600463867, 39.257747650146484, 19.786203384399414, 18.099971771240234, 44.19781494140625, 12.973487854003906, 13.596736907958984, 13.791600227355957], "Total": [1118.0, 1254.0, 151.0, 224.0, 185.0, 360.0, 153.0, 155.0, 158.0, 99.0, 99.0, 98.0, 131.0, 81.0, 447.0, 43.0, 187.0, 57.0, 25.0, 57.0, 23.0, 25.0, 19.0, 21.0, 22.0, 29.0, 58.0, 26.0, 20.0, 20.0, 153.24288940429688, 185.2081756591797, 155.06573486328125, 158.53990173339844, 25.352550506591797, 81.049072265625, 21.288394927978516, 13.105955123901367, 13.123124122619629, 22.96909523010254, 13.127167701721191, 12.311968803405762, 8.225051879882812, 13.165611267089844, 18.934579849243164, 9.8820219039917, 29.657596588134766, 8.238725662231445, 6.597639560699463, 360.666259765625, 57.829856872558594, 5.784577369689941, 4.958719730377197, 4.959305286407471, 14.054414749145508, 23.976825714111328, 4.9615678787231445, 7.443854331970215, 5.790389537811279, 4.9636077880859375, 57.97434997558594, 1254.4193115234375, 14.065719604492188, 58.251060485839844, 14.103730201721191, 58.416072845458984, 58.5046501159668, 304.96875, 58.693702697753906, 114.13090515136719, 44.87703323364258, 447.50762939453125, 23.463544845581055, 33.02202606201172, 1118.7060546875, 26.08376121520996, 187.68113708496094, 33.09010314941406, 59.59039306640625, 224.66238403320312, 39.81715774536133, 131.52468872070312, 40.04892349243164, 151.4040069580078, 8.35476016998291, 9.269570350646973, 99.15031433105469, 4.629241466522217, 4.624869346618652, 99.82665252685547, 6.466634273529053, 5.542027950286865, 12.006967544555664, 4.6154632568359375, 5.538034439086914, 6.459675312042236, 9.227800369262695, 4.6131134033203125, 6.456885814666748, 6.455682277679443, 5.530396938323975, 5.529428958892822, 4.607379913330078, 4.607212543487549, 5.527658462524414, 6.445369720458984, 3.681478977203369, 4.601385593414307, 98.45637512207031, 3.6798195838928223, 3.6798486709594727, 5.516012668609619, 3.6751370429992676, 43.165645599365234, 25.725200653076172, 19.28432846069336, 13.77755355834961, 224.66238403320312, 23.828641891479492, 1118.7060546875, 131.52468872070312, 15.577095031738281, 15.569125175476074, 10.102041244506836, 20.04140281677246, 20.038246154785156, 15.519177436828613, 9.170105934143066, 187.68113708496094, 26.225311279296875, 447.50762939453125, 12.766529083251953, 16.23989486694336, 42.32276916503906, 16.17015838623047, 304.96875, 1254.4193115234375, 59.59039306640625, 114.13090515136719, 40.04892349243164, 39.81715774536133, 360.666259765625, 22.882408142089844, 44.87703323364258, 58.693702697753906], "Category": ["Default", "Default", "Default", "Default", "Default", "Default", "Default", "Default", "Default", "Default", "Default", "Default", "Default", "Default", "Default", "Default", "Default", "Default", "Default", "Default", "Default", "Default", "Default", "Default", "Default", "Default", "Default", "Default", "Default", "Default", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2"], "logprob": [30.0, 29.0, 28.0, 27.0, 26.0, 25.0, 24.0, 23.0, 22.0, 21.0, 20.0, 19.0, 18.0, 17.0, 16.0, 15.0, 14.0, 13.0, 12.0, 11.0, 10.0, 9.0, 8.0, 7.0, 6.0, 5.0, 4.0, 3.0, 2.0, 1.0, -3.6851000785827637, -3.5023999214172363, -3.682499885559082, -3.6702001094818115, -5.509200096130371, -4.354700088500977, -5.6930999755859375, -6.181399822235107, -6.190299987792969, -5.631899833679199, -6.192399978637695, -6.259500026702881, -6.679500102996826, -6.212500095367432, -5.85260009765625, -6.5055999755859375, -5.409800052642822, -6.691100120544434, -6.921599864959717, -2.9260001182556152, -4.764599800109863, -7.069499969482422, -7.224699974060059, -7.225500106811523, -6.185400009155273, -5.651700019836426, -7.228799819946289, -6.8242998123168945, -7.076900005340576, -7.231599807739258, -4.782400131225586, -1.7395000457763672, -6.191199779510498, -4.818600177764893, -6.210700035095215, -4.840400218963623, -4.852499961853027, -3.328700065612793, -4.878699779510498, -4.367400169372559, -5.240200042724609, -3.3417000770568848, -5.789999961853027, -5.547100067138672, -3.035799980163574, -5.721700191497803, -4.380199909210205, -5.565700054168701, -5.174499988555908, -4.928400039672852, -5.605100154876709, -5.254499912261963, -5.6743998527526855, -3.526099920272827, -6.427199840545654, -6.333399772644043, -3.9660000801086426, -7.036300182342529, -7.043799877166748, -3.9769999980926514, -6.717700004577637, -6.872900009155273, -6.100399971008301, -7.060299873352051, -6.878699779510498, -6.726399898529053, -6.369999885559082, -7.064700126647949, -6.730000019073486, -6.731599807739258, -6.890399932861328, -6.8917999267578125, -7.074900150299072, -7.075200080871582, -6.8942999839782715, -6.744800090789795, -7.308199882507324, -7.085999965667725, -4.023900032043457, -7.311800003051758, -7.311999797821045, -6.912399768829346, -7.322800159454346, -4.861999988555908, -5.377399921417236, -5.669000148773193, -6.003799915313721, -3.256700038909912, -5.472899913787842, -1.732800006866455, -3.848400115966797, -5.8993000984191895, -5.9039998054504395, -6.315100193023682, -5.693600177764893, -5.695000171661377, -5.932000160217285, -6.423299789428711, -3.726300001144409, -5.486299991607666, -2.985300064086914, -6.136300086975098, -5.986199855804443, -5.261600017547607, -6.0295000076293945, -3.92330002784729, -3.0766000747680664, -5.195199966430664, -4.790299892425537, -5.475399971008301, -5.564499855041504, -4.6717000007629395, -5.897500038146973, -5.850599765777588, -5.836299896240234], "loglift": [30.0, 29.0, 28.0, 27.0, 26.0, 25.0, 24.0, 23.0, 22.0, 21.0, 20.0, 19.0, 18.0, 17.0, 16.0, 15.0, 14.0, 13.0, 12.0, 11.0, 10.0, 9.0, 8.0, 7.0, 6.0, 5.0, 4.0, 3.0, 2.0, 1.0, 0.554099977016449, 0.5472999811172485, 0.5447999835014343, 0.5350000262260437, 0.5289999842643738, 0.5213000178337097, 0.5199000239372253, 0.516700029373169, 0.5065000057220459, 0.5051000118255615, 0.5041000247001648, 0.5009999871253967, 0.484499990940094, 0.48100000619888306, 0.47749999165534973, 0.4747999906539917, 0.4715999960899353, 0.47119998931884766, 0.4629000127315521, 0.45719999074935913, 0.4490000009536743, 0.4465000033378601, 0.44530001282691956, 0.44440001249313354, 0.44279998540878296, 0.4422999918460846, 0.4406000077724457, 0.43939998745918274, 0.43799999356269836, 0.4374000132083893, 0.42879998683929443, 0.39719998836517334, 0.43630000948905945, 0.387800008058548, 0.414000004529953, 0.36320000886917114, 0.3495999872684479, 0.22220000624656677, 0.32010000944137573, 0.1664000004529953, 0.22699999809265137, -0.17430000007152557, 0.3257000148296356, 0.22689999639987946, -0.784600019454956, 0.288100004196167, -0.34380000829696655, 0.2062000036239624, 0.009100000374019146, -1.0719000101089478, -0.018300000578165054, -0.8626000285148621, -0.0934000015258789, 0.7250999808311462, 0.7210999727249146, 0.7110000252723694, 0.7085000276565552, 0.7024999856948853, 0.695900022983551, 0.6906999945640564, 0.6868000030517578, 0.6858999729156494, 0.6852999925613403, 0.6815000176429749, 0.6808000206947327, 0.6791999936103821, 0.6790000200271606, 0.6776000261306763, 0.6759999990463257, 0.6746000051498413, 0.6704999804496765, 0.6693000197410583, 0.6686000227928162, 0.6682999730110168, 0.6671000123023987, 0.6629999876022339, 0.659600019454956, 0.6588000059127808, 0.6577000021934509, 0.656499981880188, 0.6561999917030334, 0.6510999798774719, 0.6467000246047974, 0.64410001039505, 0.6463000178337097, 0.6428999900817871, 0.6442999839782715, 0.5997999906539917, 0.6273999810218811, 0.5184000134468079, 0.5436000227928162, 0.6261000037193298, 0.6219000220298767, 0.6432999968528748, 0.579800009727478, 0.578499972820282, 0.597100019454956, 0.6319000124931335, 0.3100999891757965, 0.5181000232696533, 0.18219999969005585, 0.5879999995231628, 0.4975000023841858, 0.26420000195503235, 0.4584999978542328, -0.3723999857902527, -0.9398999810218811, -0.011500000022351742, -0.2565000057220459, 0.10559999942779541, 0.02239999920129776, -1.2884999513626099, 0.24330000579357147, -0.38339999318122864, -0.637499988079071]}, "token.table": {"Topic": [1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2], "Freq": [0.4993892014026642, 0.4993892014026642, 0.39428576827049255, 0.6074131727218628, 0.897828221321106, 0.10562685132026672, 0.8531380295753479, 0.14218966662883759, 0.1555667370557785, 0.8296892642974854, 0.690776526927948, 0.31196358799934387, 0.7284225821495056, 0.2683662176132202, 0.8640724420547485, 0.15548954904079437, 0.8551925420761108, 0.43701693415641785, 0.5681220293045044, 0.9156143069267273, 0.0763011947274208, 0.8496459722518921, 0.12137799710035324, 0.15480653941631317, 0.9288392663002014, 0.15487341582775116, 0.9292405247688293, 0.2717524468898773, 0.8152573704719543, 0.8065645694732666, 0.20164114236831665, 0.16786521673202515, 0.8393260836601257, 0.19259046018123627, 0.8345586657524109, 0.9107447862625122, 0.101193867623806, 0.11969224363565445, 0.9575379490852356, 0.25386473536491394, 0.7463980317115784, 0.1933092176914215, 0.8376732468605042, 0.15463994443416595, 0.9278396964073181, 0.21677334606647491, 0.8670933842658997, 0.21809998154640198, 0.8723999261856079, 0.2716299593448639, 0.8148899078369141, 0.21622233092784882, 0.8648893237113953, 0.07925813645124435, 0.9180734753608704, 0.9114654660224915, 0.07595545798540115, 0.19268906116485596, 0.8349859118461609, 0.1551501303911209, 0.9309008121490479, 0.15490229427814484, 0.9294137954711914, 0.2349894791841507, 0.7832982540130615, 0.19139830768108368, 0.810104489326477, 0.1812903732061386, 0.9064518809318542, 0.08328497409820557, 0.9161347150802612, 0.3092115521430969, 0.6802654266357422, 0.24630701541900635, 0.738921046257019, 0.16216599941253662, 0.85716313123703, 0.26691770553588867, 0.7626219987869263, 0.8045730590820312, 0.20542292296886444, 0.10787986218929291, 0.8630388975143433, 0.18056948482990265, 0.902847409248352, 0.1451636552810669, 0.8709819316864014, 0.9461340308189392, 0.05046048387885094, 0.960882842540741, 0.045142143964767456, 0.8066598176956177, 0.20166495442390442, 0.42530298233032227, 0.5906985998153687, 0.10836818814277649, 0.8669455051422119, 0.805865466594696, 0.201466366648674, 0.21666297316551208, 0.8666518926620483, 0.8761562705039978, 0.1219964399933815, 0.8266773223876953, 0.17378559708595276, 0.893439531326294, 0.08122178167104721, 0.9466503262519836, 0.039443764835596085, 0.6571401357650757, 0.3417128920555115, 0.8643673658370972, 0.17287348210811615, 0.9142719507217407, 0.08707351982593536, 0.9394789934158325, 0.046973951160907745, 0.9377034902572632, 0.06169101968407631, 0.853824257850647, 0.14230403304100037, 0.6965048313140869, 0.30282819271087646, 0.8508387207984924, 0.1418064534664154, 0.8240193128585815, 0.18883776664733887, 0.9610806703567505, 0.037795308977365494, 0.8452013731002808, 0.15524107217788696, 0.1808188408613205, 0.9040942192077637, 0.8634997606277466, 0.1726999580860138, 0.7666921019554138, 0.23852643370628357, 0.5525256395339966, 0.45206642150878906, 0.6950718760490417, 0.33242568373680115, 0.21705098450183868, 0.8682039380073547, 0.19797979295253754, 0.8909090757369995, 0.21704310178756714, 0.8681724071502686, 0.11019100993871689, 0.8915454745292664, 0.1008569672703743, 0.9077126979827881, 0.18085050582885742, 0.9042525291442871, 0.2717503011226654, 0.8152509331703186, 0.19958682358264923, 0.7983472943305969, 0.9144164323806763, 0.07620136439800262, 0.1809084266424179, 0.9045421481132507, 0.27209869027137756, 0.8162961006164551, 0.9657870531082153, 0.03262794017791748, 0.8510584831237793, 0.12157978117465973, 0.9141347408294678, 0.07617789506912231, 0.909416139125824, 0.15156936645507812, 0.4670311510562897, 0.5340691208839417, 0.875845730304718, 0.12512081861495972, 0.8766725063323975, 0.10115452110767365, 0.8060340285301208, 0.13433900475502014, 0.8646053075790405, 0.13833685219287872, 0.2356971949338913, 0.7679166793823242, 0.6951531767845154, 0.3049492835998535, 0.1421949565410614, 0.8531697392463684, 0.18043936789035797, 0.9021968245506287, 0.8061967492103577, 0.20154918730258942, 0.7862622737884521, 0.20511190593242645, 0.2173258364200592, 0.8693033456802368, 0.19961826503276825, 0.798473060131073, 0.7671474814414978, 0.2130965292453766, 0.5537805557250977, 0.4363119304180145], "Term": ["100daysofcode", "100daysofcode", "ai", "ai", "ai\u30a8\u30f3\u30b8\u30cb\u30a2", "ai\u30a8\u30f3\u30b8\u30cb\u30a2", "bigdata", "bigdata", "bragging", "bragging", "datascience", "datascience", "datascientist", "datascientist", "deep", "deeplearning", "deeplearning", "dena", "dena", "doe", "doe", "freelancestart", "freelancestart", "gcp", "gcp", "golang", "golang", "ibmdojo", "ibmdojo", "ibmspss", "ibmspss", "iot", "iot", "it", "it", "it\u7d4c\u55b6", "it\u7d4c\u55b6", "javascript", "javascript", "kaggle", "kaggle", "kaggleguide", "kaggleguide", "kansaiaipub", "kansaiaipub", "kernel", "kernel", "lightgbm", "lightgbm", "logisticregression", "logisticregression", "machine", "machine", "machinelearning", "machinelearning", "mercariprize", "mercariprize", "ml", "ml", "nodejs", "nodejs", "nodered", "nodered", "note", "note", "python", "python", "pytorch", "pytorch", "santander", "santander", "signate", "signate", "sql", "sql", "superintelligence", "superintelligence", "titanic", "titanic", "uber", "uber", "winning", "winning", "word2vec", "word2vec", "\u306f\u3066\u306a\u30d6\u30ed\u30b0", "\u306f\u3066\u306a\u30d6\u30ed\u30b0", "\u30a4\u30f3\u30bf\u30fc\u30f3", "\u30a4\u30f3\u30bf\u30fc\u30f3", "\u30a4\u30f3\u30bf\u30fc\u30f3\u30b7\u30c3\u30d7", "\u30a4\u30f3\u30bf\u30fc\u30f3\u30b7\u30c3\u30d7", "\u30a8\u30af\u30b9\u30d7\u30ed\u30e9\u30c8\u30ea\u30fc", "\u30a8\u30af\u30b9\u30d7\u30ed\u30e9\u30c8\u30ea\u30fc", "\u30a8\u30f3\u30b8\u30cb\u30a2", "\u30a8\u30f3\u30b8\u30cb\u30a2", "\u30a8\u30f3\u30b8\u30cb\u30a2\u3068\u7e4b\u304c\u308a\u305f\u3044", "\u30a8\u30f3\u30b8\u30cb\u30a2\u3068\u7e4b\u304c\u308a\u305f\u3044", "\u30a8\u30f3\u30b8\u30cb\u30a2\u8ee2\u8077", "\u30a8\u30f3\u30b8\u30cb\u30a2\u8ee2\u8077", "\u30c1\u30e5\u30fc\u30c8\u30ea\u30a2\u30eb", "\u30c1\u30e5\u30fc\u30c8\u30ea\u30a2\u30eb", "\u30c7\u30fc\u30bf\u30b5\u30a4\u30a8\u30f3\u30b9", "\u30c7\u30fc\u30bf\u30b5\u30a4\u30a8\u30f3\u30b9", "\u30c7\u30fc\u30bf\u30b5\u30a4\u30a8\u30f3\u30c6\u30a3\u30b9\u30c8", "\u30c7\u30fc\u30bf\u30b5\u30a4\u30a8\u30f3\u30c6\u30a3\u30b9\u30c8", "\u30c7\u30fc\u30bf\u30b5\u30a4\u30a8\u30f3\u30c6\u30a3\u30b9\u30c8\u3042\u308b\u3042\u308b", "\u30c7\u30fc\u30bf\u30b5\u30a4\u30a8\u30f3\u30c6\u30a3\u30b9\u30c8\u3042\u308b\u3042\u308b", "\u30c7\u30fc\u30bf\u30de\u30a4\u30cb\u30f3\u30b0", "\u30c7\u30fc\u30bf\u30de\u30a4\u30cb\u30f3\u30b0", "\u30c7\u30fc\u30bf\u5206\u6790", "\u30c7\u30fc\u30bf\u5206\u6790", "\u30c7\u30fc\u30bf\u6d3b\u7528", "\u30c7\u30fc\u30bf\u6d3b\u7528", "\u30d0\u30c3\u30af\u30aa\u30d5\u30a3\u30b9", "\u30d0\u30c3\u30af\u30aa\u30d5\u30a3\u30b9", "\u30d3\u30b8\u30cd\u30b9\u7d71\u8a08", "\u30d3\u30b8\u30cd\u30b9\u7d71\u8a08", "\u30d3\u30c3\u30b0\u30c7\u30fc\u30bf", "\u30d3\u30c3\u30b0\u30c7\u30fc\u30bf", "\u30d5\u30ea\u30fc\u30e9\u30f3\u30b9", "\u30d5\u30ea\u30fc\u30e9\u30f3\u30b9", "\u30d7\u30ed\u30b0\u30e9\u30df\u30f3\u30b0\u521d\u5fc3\u8005", "\u30d7\u30ed\u30b0\u30e9\u30df\u30f3\u30b0\u521d\u5fc3\u8005", "\u30d7\u30ed\u30b0\u30e9\u30df\u30f3\u30b0\u5b66\u7fd2", "\u30d7\u30ed\u30b0\u30e9\u30df\u30f3\u30b0\u5b66\u7fd2", "\u30de\u30af\u30ed\u7d4c\u6e08\u5b66", "\u30de\u30af\u30ed\u7d4c\u6e08\u5b66", "\u30de\u30fc\u30b1\u30c6\u30a3\u30f3\u30b0", "\u30de\u30fc\u30b1\u30c6\u30a3\u30f3\u30b0", "\u30df\u30af\u30ed\u7d4c\u6e08\u5b66", "\u30df\u30af\u30ed\u7d4c\u6e08\u5b66", "\u30e1\u30eb\u30ab\u30ea", "\u30e1\u30eb\u30ab\u30ea", "\u30ec\u30b3\u30e1\u30f3\u30c9", "\u30ec\u30b3\u30e1\u30f3\u30c9", "\u4ea4\u901a\u7d4c\u6e08", "\u4ea4\u901a\u7d4c\u6e08", "\u4eba\u5de5\u77e5\u80fd", "\u4eba\u5de5\u77e5\u80fd", "\u4eca\u65e5\u306e\u7a4d\u307f\u4e0a\u3052", "\u4eca\u65e5\u306e\u7a4d\u307f\u4e0a\u3052", "\u521d\u5fc3\u8005\u5411\u3051", "\u521d\u5fc3\u8005\u5411\u3051", "\u52c9\u5f37\u4f1a", "\u52c9\u5f37\u4f1a", "\u5730\u57df\u79d1\u5b66", "\u5730\u57df\u79d1\u5b66", "\u5916\u8cc7\u7cfb", "\u5916\u8cc7\u7cfb", "\u5916\u8cc7\u7cfb\u4f01\u696d", "\u5916\u8cc7\u7cfb\u4f01\u696d", "\u5927\u5b66\u767a", "\u5927\u5b66\u767a", "\u5927\u5b66\u9662\u4fee\u58eb", "\u5927\u5b66\u9662\u4fee\u58eb", "\u5927\u962a", "\u5927\u962a", "\u5b9f\u9a13\u8a08\u753b\u6cd5", "\u5b9f\u9a13\u8a08\u753b\u6cd5", "\u6280\u8853\u66f8\u5178", "\u6280\u8853\u66f8\u5178", "\u6295\u7968", "\u6295\u7968", "\u6642\u7d661000\u5186", "\u6642\u7d661000\u5186", "\u6771\u4eac\u90fd\u6e0b\u8c37\u533a", "\u6771\u4eac\u90fd\u6e0b\u8c37\u533a", "\u6771\u4eac\u90fd\u6e2f\u533a", "\u6771\u4eac\u90fd\u6e2f\u533a", "\u6848\u4ef6\u76f8\u5834", "\u6848\u4ef6\u76f8\u5834", "\u6a5f\u68b0\u5b66\u7fd2", "\u6a5f\u68b0\u5b66\u7fd2", "\u6a5f\u68b0\u5b66\u7fd2\u30a8\u30f3\u30b8\u30cb\u30a2", "\u6a5f\u68b0\u5b66\u7fd2\u30a8\u30f3\u30b8\u30cb\u30a2", "\u6c42\u4eba", "\u6c42\u4eba", "\u7b4b\u30c8\u30ec", "\u7b4b\u30c8\u30ec", "\u7d4c\u6e08\u5b66\u5f92", "\u7d4c\u6e08\u5b66\u5f92", "\u7d71\u8a08", "\u7d71\u8a08", "\u7d71\u8a08\u5b66", "\u7d71\u8a08\u5b66", "\u7d71\u8a08\u5b66\u5c02\u653b", "\u7d71\u8a08\u5b66\u5c02\u653b", "\u8133\u6ce2", "\u8133\u6ce2", "\u897f\u7530\u52d8\u4e00\u90ce", "\u897f\u7530\u52d8\u4e00\u90ce", "\u90fd\u5e02\u7d4c\u6e08", "\u90fd\u5e02\u7d4c\u6e08", "\u91cf\u5b50\u30b3\u30f3\u30d4\u30e5\u30fc\u30bf", "\u91cf\u5b50\u30b3\u30f3\u30d4\u30e5\u30fc\u30bf", "\u95a2\u897f", "\u95a2\u897f", "\u99c6\u3051\u51fa\u3057\u30a8\u30f3\u30b8\u30cb\u30a2", "\u99c6\u3051\u51fa\u3057\u30a8\u30f3\u30b8\u30cb\u30a2", "\u99c6\u3051\u51fa\u3057\u30a8\u30f3\u30b8\u30cb\u30a2\u3068\u7e4b\u304c\u308a\u305f\u3044", "\u99c6\u3051\u51fa\u3057\u30a8\u30f3\u30b8\u30cb\u30a2\u3068\u7e4b\u304c\u308a\u305f\u3044"]}, "R": 30, "lambda.step": 0.01, "plot.opts": {"xlab": "PC1", "ylab": "PC2"}, "topic.order": [1, 2]};
 9 | 
10 | function LDAvis_load_lib(url, callback){
11 |   var s = document.createElement('script');
12 |   s.src = url;
13 |   s.async = true;
14 |   s.onreadystatechange = s.onload = callback;
15 |   s.onerror = function(){console.warn("failed to load library " + url);};
16 |   document.getElementsByTagName("head")[0].appendChild(s);
17 | }
18 | 
19 | if(typeof(LDAvis) !== "undefined"){
20 |    // already loaded: just create the visualization
21 |    !function(LDAvis){
22 |        new LDAvis("#" + "ldavis_el660805246056512115579680", ldavis_el660805246056512115579680_data);
23 |    }(LDAvis);
24 | }else if(typeof define === "function" && define.amd){
25 |    // require.js is available: use it to load d3/LDAvis
26 |    require.config({paths: {d3: "https://cdnjs.cloudflare.com/ajax/libs/d3/3.5.5/d3.min"}});
27 |    require(["d3"], function(d3){
28 |       window.d3 = d3;
29 |       LDAvis_load_lib("https://cdn.rawgit.com/bmabey/pyLDAvis/files/ldavis.v1.0.0.js", function(){
30 |         new LDAvis("#" + "ldavis_el660805246056512115579680", ldavis_el660805246056512115579680_data);
31 |       });
32 |     });
33 | }else{
34 |     // require.js not available: dynamically load d3 & LDAvis
35 |     LDAvis_load_lib("https://cdnjs.cloudflare.com/ajax/libs/d3/3.5.5/d3.min.js", function(){
36 |          LDAvis_load_lib("https://cdn.rawgit.com/bmabey/pyLDAvis/files/ldavis.v1.0.0.js", function(){
37 |                  new LDAvis("#" + "ldavis_el660805246056512115579680", ldavis_el660805246056512115579680_data);
38 |             })
39 |          });
40 | }
41 | </script>


--------------------------------------------------------------------------------
/nlp/twitter_analytics_using_nlplot/.DS_Store:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/takapy0210/geek_blog/e36604f01d26f4d14bdacc6bb2995c929d49fdfa/nlp/twitter_analytics_using_nlplot/.DS_Store


--------------------------------------------------------------------------------
/nlp/twitter_analytics_using_nlplot/2020-05-17_pyldavis.html:
--------------------------------------------------------------------------------
 1 | 
 2 | <link rel="stylesheet" type="text/css" href="https://cdn.rawgit.com/bmabey/pyLDAvis/files/ldavis.v1.0.0.css">
 3 | 
 4 | 
 5 | <div id="ldavis_el1364554314548401154813291"></div>
 6 | <script type="text/javascript">
 7 | 
 8 | var ldavis_el1364554314548401154813291_data = {"mdsDat": {"x": [0.14732801914215088, -0.14732801914215088], "y": [0.0, 0.0], "topics": [1, 2], "cluster": [1, 1], "Freq": [54.23051834106445, 45.76948165893555]}, "tinfo": {"Category": ["Default", "Default", "Default", "Default", "Default", "Default", "Default", "Default", "Default", "Default", "Default", "Default", "Default", "Default", "Default", "Default", "Default", "Default", "Default", "Default", "Default", "Default", "Default", "Default", "Default", "Default", "Default", "Default", "Default", "Default", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2"], "Freq": [1083.0, 1291.0, 373.0, 215.0, 193.0, 143.0, 165.0, 160.0, 162.0, 445.0, 93.0, 94.0, 93.0, 126.0, 84.0, 59.0, 59.0, 59.0, 41.0, 59.0, 59.0, 59.0, 184.0, 309.0, 24.0, 30.0, 25.0, 40.0, 26.0, 23.0, 159.1615447998047, 192.03477478027344, 160.61325073242188, 163.70472717285156, 82.86725616455078, 25.845924377441406, 21.581838607788086, 58.06324005126953, 23.222187042236328, 57.8823356628418, 29.681936264038086, 57.521446228027344, 13.140117645263672, 13.11875057220459, 13.117197036743164, 57.3104133605957, 23.732013702392578, 12.26113510131836, 18.796680450439453, 57.19434356689453, 355.6851501464844, 56.94751739501953, 13.729220390319824, 8.042810440063477, 8.026191711425781, 9.6015625, 7.945532321929932, 8.738409042358398, 7.138285160064697, 6.3428497314453125, 13.41327953338623, 1131.92236328125, 13.374342918395996, 12.518911361694336, 23.42352294921875, 226.88595581054688, 13.766777038574219, 79.88345336914062, 27.04385757446289, 125.40335845947266, 22.63872528076172, 60.304473876953125, 29.066852569580078, 20.645004272460938, 22.969127655029297, 83.40772247314453, 20.752046585083008, 139.58328247070312, 91.32024383544922, 91.79608154296875, 90.27067565917969, 39.439064025878906, 17.422725677490234, 10.748383522033691, 23.112539291381836, 12.357230186462402, 8.23248291015625, 7.3996076583862305, 18.083534240722656, 8.187993049621582, 13.905789375305176, 23.55620574951172, 8.11656379699707, 8.920405387878418, 13.751631736755371, 1000.2832641601562, 8.05480670928955, 7.246626853942871, 5.631561279296875, 5.627683639526367, 5.624212741851807, 5.6226372718811035, 6.418981075286865, 5.609947204589844, 196.89468383789062, 17.56036376953125, 5.578864574432373, 113.30939483642578, 13.53644847869873, 13.522589683532715, 9.544998168945312, 19.937145233154297, 7.172063827514648, 13.91380500793457, 33.347042083740234, 319.61688232421875, 19.261877059936523, 124.07888793945312, 10.850387573242188, 13.34872055053711, 11.343375205993652, 10.637520790100098, 13.892083168029785, 30.668466567993164, 82.59089660644531, 160.03582763671875, 22.895910263061523, 35.442535400390625, 19.03139305114746, 16.472131729125977, 17.645444869995117, 14.312366485595703], "Term": ["kaggle", "\u30c7\u30fc\u30bf\u30b5\u30a4\u30a8\u30f3\u30c6\u30a3\u30b9\u30c8", "\u30c7\u30fc\u30bf\u30b5\u30a4\u30a8\u30f3\u30b9", "python", "\u30de\u30fc\u30b1\u30c6\u30a3\u30f3\u30b0", "machinelearning", "\u30a4\u30f3\u30bf\u30fc\u30f3", "\u6642\u7d661000\u5186", "\u30a4\u30f3\u30bf\u30fc\u30f3\u30b7\u30c3\u30d7", "\u6a5f\u68b0\u5b66\u7fd2", "\u5916\u8cc7\u7cfb\u4f01\u696d", "\u5916\u8cc7\u7cfb", "\u7d71\u8a08\u5b66\u5c02\u653b", "\u7d71\u8a08", "\u30d3\u30c3\u30b0\u30c7\u30fc\u30bf", "\u7d4c\u6e08\u5b66\u5f92", "\u30df\u30af\u30ed\u7d4c\u6e08\u5b66", "\u30de\u30af\u30ed\u7d4c\u6e08\u5b66", "superintelligence", "uber", "\u90fd\u5e02\u7d4c\u6e08", "\u4ea4\u901a\u7d4c\u6e08", "ai", "\u7d71\u8a08\u5b66", "deeplearning", "\u6c42\u4eba", "titanic", "100daysofcode", "\u30c7\u30fc\u30bf\u30de\u30a4\u30cb\u30f3\u30b0", "\u30d0\u30c3\u30af\u30aa\u30d5\u30a3\u30b9", "\u6642\u7d661000\u5186", "\u30de\u30fc\u30b1\u30c6\u30a3\u30f3\u30b0", "\u30a4\u30f3\u30bf\u30fc\u30f3\u30b7\u30c3\u30d7", "\u30a4\u30f3\u30bf\u30fc\u30f3", "\u30d3\u30c3\u30b0\u30c7\u30fc\u30bf", "\u30c7\u30fc\u30bf\u30de\u30a4\u30cb\u30f3\u30b0", "\u30d3\u30b8\u30cd\u30b9\u7d71\u8a08", "\u7d4c\u6e08\u5b66\u5f92", "\u30d0\u30c3\u30af\u30aa\u30d5\u30a3\u30b9", "\u30df\u30af\u30ed\u7d4c\u6e08\u5b66", "\u6c42\u4eba", "\u30de\u30af\u30ed\u7d4c\u6e08\u5b66", "doe", "\u6771\u4eac\u90fd\u6e2f\u533a", "\u5b9f\u9a13\u8a08\u753b\u6cd5", "uber", "\u6a5f\u68b0\u5b66\u7fd2\u30a8\u30f3\u30b8\u30cb\u30a2", "\u30c7\u30fc\u30bf\u30b5\u30a4\u30a8\u30f3\u30c6\u30a3\u30b9\u30c8\u3042\u308b\u3042\u308b", "ai\u30a8\u30f3\u30b8\u30cb\u30a2", "\u90fd\u5e02\u7d4c\u6e08", "\u30c7\u30fc\u30bf\u30b5\u30a4\u30a8\u30f3\u30b9", "\u4ea4\u901a\u7d4c\u6e08", "\u30d5\u30ea\u30fc\u30e9\u30f3\u30b9", "\u6771\u4eac\u90fd\u6e0b\u8c37\u533a", "freelancestart", "it\u7d4c\u55b6", "rapidminer", "\u30d5\u30ea\u30fc\u30e9\u30f3\u30b9\u30b9\u30bf\u30fc\u30c8", "\u7b4b\u30c8\u30ec", "\u6848\u4ef6\u76f8\u5834", "bigdata", "\u30c7\u30fc\u30bf\u30b5\u30a4\u30a8\u30f3\u30c6\u30a3\u30b9\u30c8", "\u30d7\u30ed\u30b0\u30e9\u30df\u30f3\u30b0\u5b66\u7fd2", "mercariprize", "datascientist", "\u7d71\u8a08\u5b66", "\u30c7\u30fc\u30bf\u89e3\u6790", "\u30c7\u30fc\u30bf\u5206\u6790", "\u30a8\u30f3\u30b8\u30cb\u30a2", "\u6a5f\u68b0\u5b66\u7fd2", "\u4eca\u65e5\u306e\u7a4d\u307f\u4e0a\u3052", "ai", "\u99c6\u3051\u51fa\u3057\u30a8\u30f3\u30b8\u30cb\u30a2\u3068\u7e4b\u304c\u308a\u305f\u3044", "\u30d7\u30ed\u30b0\u30e9\u30df\u30f3\u30b0\u521d\u5fc3\u8005", "datascience", "kaggle", "\u4eba\u5de5\u77e5\u80fd", "machinelearning", "\u5916\u8cc7\u7cfb\u4f01\u696d", "\u5916\u8cc7\u7cfb", "\u7d71\u8a08\u5b66\u5c02\u653b", "superintelligence", "bragging", "santander", "deeplearning", "\u306f\u3066\u306a\u30d6\u30ed\u30b0", "winning", "javascript", "\u95a2\u897f", "\u30a8\u30f3\u30b8\u30cb\u30a2\u3068\u7e4b\u304c\u308a\u305f\u3044", "kaggleguide", "titanic", "lightgbm", "\u52c9\u5f37\u4f1a", "ml", "kaggle", "ncaa", "gbdt", "kansaiaipub", "gcp", "golang", "nodered", "\u30b5\u30f3\u30bf\u672c\u6c17\u51fa\u3059", "nodejs", "python", "\u5927\u962a", "\u30a2\u30f3\u30b5\u30f3\u30d6\u30eb", "\u7d71\u8a08", "kaggler", "it", "xgboost", "iot", "t5", "sql", "100daysofcode", "\u6a5f\u68b0\u5b66\u7fd2", "dena", "ai", "note", "signate", "\u81ea\u7136\u8a00\u8a9e\u51e6\u7406", "pandas", "twitter\u6c42\u4eba", "\u99c6\u3051\u51fa\u3057\u30a8\u30f3\u30b8\u30cb\u30a2\u3068\u7e4b\u304c\u308a\u305f\u3044", "\u7d71\u8a08\u5b66", "\u30c7\u30fc\u30bf\u30b5\u30a4\u30a8\u30f3\u30c6\u30a3\u30b9\u30c8", "datascience", "\u30c7\u30fc\u30bf\u5206\u6790", "\u4eba\u5de5\u77e5\u80fd", "\u30d7\u30ed\u30b0\u30e9\u30df\u30f3\u30b0", "\u30c7\u30fc\u30bf\u30b5\u30a4\u30a8\u30f3\u30b9", "\u30a8\u30f3\u30b8\u30cb\u30a2"], "Total": [1083.0, 1291.0, 373.0, 215.0, 193.0, 143.0, 165.0, 160.0, 162.0, 445.0, 93.0, 94.0, 93.0, 126.0, 84.0, 59.0, 59.0, 59.0, 41.0, 59.0, 59.0, 59.0, 184.0, 309.0, 24.0, 30.0, 25.0, 40.0, 26.0, 23.0, 160.42955017089844, 193.71583557128906, 162.14352416992188, 165.56649780273438, 84.50923156738281, 26.464859008789062, 22.198930740356445, 59.768863677978516, 23.907058715820312, 59.7746467590332, 30.742984771728516, 59.78443908691406, 13.664724349975586, 13.66533088684082, 13.665366172790527, 59.79075241088867, 24.77018165588379, 12.812346458435059, 19.64603042602539, 59.793907165527344, 373.3305969238281, 59.80083465576172, 14.525452613830566, 8.545166015625, 8.545663833618164, 10.255602836608887, 8.547869682312012, 9.402857780456543, 7.693454265594482, 6.838641166687012, 14.534539222717285, 1291.958251953125, 14.5357666015625, 13.682260513305664, 26.535221099853516, 309.47686767578125, 15.402151107788086, 115.32598876953125, 41.356224060058594, 445.0202331542969, 33.582035064697266, 184.38336181640625, 59.735321044921875, 33.64012908935547, 45.86503601074219, 1083.6910400390625, 39.78343963623047, 143.019287109375, 93.8747787475586, 94.74134063720703, 93.84490966796875, 41.21466827392578, 18.409175872802734, 11.394981384277344, 24.542604446411133, 13.14686393737793, 8.764246940612793, 7.8875885009765625, 19.2811336517334, 8.762985229492188, 14.896851539611816, 25.408126831054688, 8.760986328125, 9.636826515197754, 14.892617225646973, 1083.6910400390625, 8.759186744689941, 7.883160591125488, 6.131120681762695, 6.13102388381958, 6.130922317504883, 6.130888938903809, 7.006433963775635, 6.130496978759766, 215.4542236328125, 19.266185760498047, 6.129637241363525, 126.91802215576172, 14.886463165283203, 14.885948181152344, 10.507631301879883, 22.74604606628418, 7.881027698516846, 15.750205993652344, 40.18912124633789, 445.0202331542969, 22.726892471313477, 184.38336181640625, 12.250751495361328, 15.7340087890625, 13.117923736572266, 12.24471664428711, 18.308910369873047, 59.735321044921875, 309.47686767578125, 1291.958251953125, 45.86503601074219, 115.32598876953125, 39.78343963623047, 31.179227828979492, 373.3305969238281, 41.356224060058594], "loglift": [30.0, 29.0, 28.0, 27.0, 26.0, 25.0, 24.0, 23.0, 22.0, 21.0, 20.0, 19.0, 18.0, 17.0, 16.0, 15.0, 14.0, 13.0, 12.0, 11.0, 10.0, 9.0, 8.0, 7.0, 6.0, 5.0, 4.0, 3.0, 2.0, 1.0, 0.6039999723434448, 0.6032000184059143, 0.602400004863739, 0.600600004196167, 0.5922999978065491, 0.5882999897003174, 0.5837000012397766, 0.5830000042915344, 0.5828999876976013, 0.579800009727478, 0.5767999887466431, 0.5733000040054321, 0.5727999806404114, 0.5710999965667725, 0.5709999799728394, 0.569599986076355, 0.569100022315979, 0.5680000185966492, 0.5677000284194946, 0.5674999952316284, 0.5634999871253967, 0.5630000233650208, 0.5555999875068665, 0.5512999892234802, 0.5491999983787537, 0.5460000038146973, 0.5389000177383423, 0.5386000275611877, 0.5370000004768372, 0.5367000102996826, 0.5315999984741211, 0.4796999990940094, 0.5286999940872192, 0.5231000185012817, 0.487199991941452, 0.30149999260902405, 0.49970000982284546, 0.24469999969005585, 0.18719999492168427, -0.654699981212616, 0.2176000028848648, -0.5056999921798706, -0.10840000212192535, 0.12370000034570694, -0.07959999889135361, -1.9524999856948853, -0.03889999911189079, 0.7572000026702881, 0.7540000081062317, 0.75, 0.7426999807357788, 0.737500011920929, 0.7264999747276306, 0.7231000065803528, 0.7214999794960022, 0.7196000218391418, 0.718999981880188, 0.7177000045776367, 0.7174000144004822, 0.713699996471405, 0.7127000093460083, 0.7059000134468079, 0.7052000164985657, 0.7042999863624573, 0.7017999887466431, 0.7014999985694885, 0.697700023651123, 0.6973999738693237, 0.6966000199317932, 0.695900022983551, 0.6952999830245972, 0.6949999928474426, 0.6940000057220459, 0.692799985408783, 0.6915000081062317, 0.6887999773025513, 0.6873999834060669, 0.6680999994277954, 0.6865000128746033, 0.6855000257492065, 0.6855000257492065, 0.6496999859809875, 0.6873000264167786, 0.6575999855995178, 0.5949000120162964, 0.4505999982357025, 0.616100013256073, 0.3855000138282776, 0.6601999998092651, 0.6171000003814697, 0.6362000107765198, 0.6407999992370605, 0.5055000185966492, 0.11490000039339066, -0.5393999814987183, -1.3070000410079956, 0.0868000015616417, -0.3982999920845032, 0.044199999421834946, 0.14350000023841858, -2.270400047302246, -0.27950000762939453], "logprob": [30.0, 29.0, 28.0, 27.0, 26.0, 25.0, 24.0, 23.0, 22.0, 21.0, 20.0, 19.0, 18.0, 17.0, 16.0, 15.0, 14.0, 13.0, 12.0, 11.0, 10.0, 9.0, 8.0, 7.0, 6.0, 5.0, 4.0, 3.0, 2.0, 1.0, -3.5892999172210693, -3.4014999866485596, -3.580199956893921, -3.561199903488159, -4.242000102996826, -5.407100200653076, -5.587399959564209, -4.597700119018555, -5.514100074768066, -4.600800037384033, -5.268700122833252, -4.607100009918213, -6.083600044250488, -6.08519983291626, -6.085299968719482, -4.6107001304626465, -5.492400169372559, -6.1528000831604, -5.725500106811523, -4.612800121307373, -2.7852001190185547, -4.617099761962891, -6.039700031280518, -6.574399948120117, -6.576499938964844, -6.397299766540527, -6.586599826812744, -6.491499900817871, -6.69379997253418, -6.8119001388549805, -6.063000202178955, -1.6275999546051025, -6.065899848937988, -6.131999969482422, -5.505499839782715, -3.234800100326538, -6.0370001792907715, -4.27869987487793, -5.361800193786621, -3.827699899673462, -5.539599895477295, -4.559800148010254, -5.289599895477295, -5.631800174713135, -5.525100231170654, -4.235499858856201, -5.6265997886657715, -3.5508999824523926, -3.9751999378204346, -3.9700000286102295, -3.986799955368042, -4.814799785614014, -5.631800174713135, -6.114799976348877, -5.3491997718811035, -5.975399971008301, -6.381499767303467, -6.4882001876831055, -5.594600200653076, -6.386899948120117, -5.8572998046875, -5.3302001953125, -6.395699977874756, -6.301300048828125, -5.8684000968933105, -1.5815999507904053, -6.403299808502197, -6.509099960327148, -6.761199951171875, -6.761899948120117, -6.762499809265137, -6.762800216674805, -6.630300045013428, -6.765100002288818, -3.206899881362915, -5.624000072479248, -6.770599842071533, -3.759500026702881, -5.884200096130371, -5.885200023651123, -6.23360013961792, -5.497000217437744, -6.519400119781494, -5.8566999435424805, -4.982600212097168, -2.7225000858306885, -5.531499862670898, -3.6686999797821045, -6.105400085449219, -5.898200035095215, -6.060999870300293, -6.125199794769287, -5.85830020904541, -5.066400051116943, -4.075699806213379, -3.4142000675201416, -5.35860013961792, -4.9217000007629395, -5.543499946594238, -5.687900066375732, -5.619100093841553, -5.828499794006348]}, "token.table": {"Topic": [1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 2, 1, 2, 1, 2, 1, 2, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2], "Freq": [0.17417648434638977, 0.8211177587509155, 0.3254089653491974, 0.672511875629425, 0.9671164751052856, 0.05090086907148361, 0.8944212198257446, 0.0688016340136528, 0.05432073771953583, 0.9234525561332703, 0.5014713406562805, 0.5014713406562805, 0.866772472858429, 0.11305728554725647, 0.04074547067284584, 0.9371458292007446, 0.13200220465660095, 0.8360139727592468, 0.9513547420501709, 0.07318112999200821, 0.9361472725868225, 0.11701840907335281, 0.12685267627239227, 0.8879687190055847, 0.16310489177703857, 0.9786293506622314, 0.16310758888721466, 0.9786455631256104, 0.13189105689525604, 0.8792737126350403, 0.06717744469642639, 0.9404842853546143, 0.9750767350196838, 0.09750767797231674, 0.8874702453613281, 0.07659009844064713, 0.922772228717804, 0.06712827831506729, 0.9397959113121033, 0.06717512011528015, 0.9404517412185669, 0.9786139130592346, 0.11414240300655365, 0.9131392240524292, 0.020976191386580467, 0.9788889288902283, 0.9501354098320007, 0.07308733463287354, 0.06714736670255661, 0.9400631189346313, 0.11416584998369217, 0.9133267998695374, 0.16311891376972198, 0.9787134528160095, 0.1631084829568863, 0.9786509275436401, 0.08162764459848404, 0.897904098033905, 0.16333575546741486, 0.8983466625213623, 0.08818578720092773, 0.9143473505973816, 0.9359056949615479, 0.11698821187019348, 0.08775793015956879, 0.9653372764587402, 0.1271131932735443, 0.8262357115745544, 0.12698246538639069, 0.888877272605896, 0.04852641373872757, 0.9462650418281555, 0.1268870085477829, 0.8882090449333191, 0.07871497422456741, 0.9445796608924866, 0.21847285330295563, 0.7646549940109253, 0.9533246755599976, 0.033449988812208176, 0.11409993469715118, 0.9127994775772095, 0.09516892582178116, 0.9516893029212952, 0.07606376707553864, 0.9127652049064636, 0.16314178705215454, 0.9788507223129272, 0.9905385375022888, 0.012079738080501556, 0.9929474592208862, 0.012334750965237617, 0.6528642177581787, 0.33852219581604004, 0.1141163632273674, 0.9129309058189392, 0.14272595942020416, 0.8563557267189026, 0.9535784125328064, 0.048214640468358994, 0.8761892914772034, 0.12384301424026489, 0.9365965723991394, 0.07804971933364868, 0.982434868812561, 0.037785954773426056, 0.69368577003479, 0.30348753929138184, 0.9089639186859131, 0.12985199689865112, 0.962058961391449, 0.04182865098118782, 0.9910387396812439, 0.04504721611738205, 0.9821411967277527, 0.023666054010391235, 0.9638254046440125, 0.06884466856718063, 0.9571558237075806, 0.10635064542293549, 0.4810895323753357, 0.5131621360778809, 0.6242544651031494, 0.38644322752952576, 0.8943457007408142, 0.0687958225607872, 0.9701521396636963, 0.03345352038741112, 0.9911425113677979, 0.01032440084964037, 0.9703110456466675, 0.033459000289440155, 0.9531639814376831, 0.050166524946689606, 0.5278578400611877, 0.47758564352989197, 0.6848899722099304, 0.3275560736656189, 0.10376860201358795, 0.9339174032211304, 0.03166516125202179, 0.9710649847984314, 0.031957466155290604, 0.9693764448165894, 0.10380882024765015, 0.9342793822288513, 0.9513100385665894, 0.07317769527435303, 0.9910892248153687, 0.006233265623450279, 0.936201810836792, 0.117025226354599, 0.9513124823570251, 0.07317788153886795, 0.8773672580718994, 0.28088611364364624, 0.7190684080123901, 0.9689068794250488, 0.0403711199760437, 0.9758324027061462, 0.03252774477005005, 0.9098643660545349, 0.12998062372207642, 0.9704049229621887, 0.03346223756670952, 0.11030742526054382, 0.8903384804725647, 0.733495831489563, 0.2681945264339447, 0.04262351617217064, 0.9590290784835815, 0.1524631530046463, 0.8385473489761353, 0.9532743692398071, 0.050172336399555206, 0.05186416953802109, 0.9335550665855408, 0.48547491431236267, 0.5189559459686279], "Term": ["100daysofcode", "100daysofcode", "ai", "ai", "ai\u30a8\u30f3\u30b8\u30cb\u30a2", "ai\u30a8\u30f3\u30b8\u30cb\u30a2", "bigdata", "bigdata", "bragging", "bragging", "datascience", "datascience", "datascientist", "datascientist", "deeplearning", "deeplearning", "dena", "dena", "doe", "doe", "freelancestart", "freelancestart", "gbdt", "gbdt", "gcp", "gcp", "golang", "golang", "iot", "iot", "it", "it", "it\u7d4c\u55b6", "it\u7d4c\u55b6", "javascript", "kaggle", "kaggle", "kaggleguide", "kaggleguide", "kaggler", "kaggler", "kansaiaipub", "lightgbm", "lightgbm", "machinelearning", "machinelearning", "mercariprize", "mercariprize", "ml", "ml", "ncaa", "ncaa", "nodejs", "nodejs", "nodered", "nodered", "note", "note", "pandas", "pandas", "python", "python", "rapidminer", "rapidminer", "santander", "santander", "signate", "signate", "sql", "sql", "superintelligence", "superintelligence", "t5", "t5", "titanic", "titanic", "twitter\u6c42\u4eba", "twitter\u6c42\u4eba", "uber", "uber", "winning", "winning", "xgboost", "xgboost", "\u306f\u3066\u306a\u30d6\u30ed\u30b0", "\u306f\u3066\u306a\u30d6\u30ed\u30b0", "\u30a2\u30f3\u30b5\u30f3\u30d6\u30eb", "\u30a2\u30f3\u30b5\u30f3\u30d6\u30eb", "\u30a4\u30f3\u30bf\u30fc\u30f3", "\u30a4\u30f3\u30bf\u30fc\u30f3", "\u30a4\u30f3\u30bf\u30fc\u30f3\u30b7\u30c3\u30d7", "\u30a4\u30f3\u30bf\u30fc\u30f3\u30b7\u30c3\u30d7", "\u30a8\u30f3\u30b8\u30cb\u30a2", "\u30a8\u30f3\u30b8\u30cb\u30a2", "\u30a8\u30f3\u30b8\u30cb\u30a2\u3068\u7e4b\u304c\u308a\u305f\u3044", "\u30a8\u30f3\u30b8\u30cb\u30a2\u3068\u7e4b\u304c\u308a\u305f\u3044", "\u30b5\u30f3\u30bf\u672c\u6c17\u51fa\u3059", "\u30b5\u30f3\u30bf\u672c\u6c17\u51fa\u3059", "\u30c7\u30fc\u30bf\u30b5\u30a4\u30a8\u30f3\u30b9", "\u30c7\u30fc\u30bf\u30b5\u30a4\u30a8\u30f3\u30b9", "\u30c7\u30fc\u30bf\u30b5\u30a4\u30a8\u30f3\u30c6\u30a3\u30b9\u30c8", "\u30c7\u30fc\u30bf\u30b5\u30a4\u30a8\u30f3\u30c6\u30a3\u30b9\u30c8", "\u30c7\u30fc\u30bf\u30b5\u30a4\u30a8\u30f3\u30c6\u30a3\u30b9\u30c8\u3042\u308b\u3042\u308b", "\u30c7\u30fc\u30bf\u30b5\u30a4\u30a8\u30f3\u30c6\u30a3\u30b9\u30c8\u3042\u308b\u3042\u308b", "\u30c7\u30fc\u30bf\u30de\u30a4\u30cb\u30f3\u30b0", "\u30c7\u30fc\u30bf\u30de\u30a4\u30cb\u30f3\u30b0", "\u30c7\u30fc\u30bf\u5206\u6790", "\u30c7\u30fc\u30bf\u5206\u6790", "\u30c7\u30fc\u30bf\u89e3\u6790", "\u30c7\u30fc\u30bf\u89e3\u6790", "\u30d0\u30c3\u30af\u30aa\u30d5\u30a3\u30b9", "\u30d0\u30c3\u30af\u30aa\u30d5\u30a3\u30b9", "\u30d3\u30b8\u30cd\u30b9\u7d71\u8a08", "\u30d3\u30b8\u30cd\u30b9\u7d71\u8a08", "\u30d3\u30c3\u30b0\u30c7\u30fc\u30bf", "\u30d3\u30c3\u30b0\u30c7\u30fc\u30bf", "\u30d5\u30ea\u30fc\u30e9\u30f3\u30b9", "\u30d5\u30ea\u30fc\u30e9\u30f3\u30b9", "\u30d5\u30ea\u30fc\u30e9\u30f3\u30b9\u30b9\u30bf\u30fc\u30c8", "\u30d5\u30ea\u30fc\u30e9\u30f3\u30b9\u30b9\u30bf\u30fc\u30c8", "\u30d7\u30ed\u30b0\u30e9\u30df\u30f3\u30b0", "\u30d7\u30ed\u30b0\u30e9\u30df\u30f3\u30b0", "\u30d7\u30ed\u30b0\u30e9\u30df\u30f3\u30b0\u521d\u5fc3\u8005", "\u30d7\u30ed\u30b0\u30e9\u30df\u30f3\u30b0\u521d\u5fc3\u8005", "\u30d7\u30ed\u30b0\u30e9\u30df\u30f3\u30b0\u5b66\u7fd2", "\u30d7\u30ed\u30b0\u30e9\u30df\u30f3\u30b0\u5b66\u7fd2", "\u30de\u30af\u30ed\u7d4c\u6e08\u5b66", "\u30de\u30af\u30ed\u7d4c\u6e08\u5b66", "\u30de\u30fc\u30b1\u30c6\u30a3\u30f3\u30b0", "\u30de\u30fc\u30b1\u30c6\u30a3\u30f3\u30b0", "\u30df\u30af\u30ed\u7d4c\u6e08\u5b66", "\u30df\u30af\u30ed\u7d4c\u6e08\u5b66", "\u4ea4\u901a\u7d4c\u6e08", "\u4ea4\u901a\u7d4c\u6e08", "\u4eba\u5de5\u77e5\u80fd", "\u4eba\u5de5\u77e5\u80fd", "\u4eca\u65e5\u306e\u7a4d\u307f\u4e0a\u3052", "\u4eca\u65e5\u306e\u7a4d\u307f\u4e0a\u3052", "\u52c9\u5f37\u4f1a", "\u52c9\u5f37\u4f1a", "\u5916\u8cc7\u7cfb", "\u5916\u8cc7\u7cfb", "\u5916\u8cc7\u7cfb\u4f01\u696d", "\u5916\u8cc7\u7cfb\u4f01\u696d", "\u5927\u962a", "\u5927\u962a", "\u5b9f\u9a13\u8a08\u753b\u6cd5", "\u5b9f\u9a13\u8a08\u753b\u6cd5", "\u6642\u7d661000\u5186", "\u6642\u7d661000\u5186", "\u6771\u4eac\u90fd\u6e0b\u8c37\u533a", "\u6771\u4eac\u90fd\u6e0b\u8c37\u533a", "\u6771\u4eac\u90fd\u6e2f\u533a", "\u6771\u4eac\u90fd\u6e2f\u533a", "\u6848\u4ef6\u76f8\u5834", "\u6a5f\u68b0\u5b66\u7fd2", "\u6a5f\u68b0\u5b66\u7fd2", "\u6a5f\u68b0\u5b66\u7fd2\u30a8\u30f3\u30b8\u30cb\u30a2", "\u6a5f\u68b0\u5b66\u7fd2\u30a8\u30f3\u30b8\u30cb\u30a2", "\u6c42\u4eba", "\u6c42\u4eba", "\u7b4b\u30c8\u30ec", "\u7b4b\u30c8\u30ec", "\u7d4c\u6e08\u5b66\u5f92", "\u7d4c\u6e08\u5b66\u5f92", "\u7d71\u8a08", "\u7d71\u8a08", "\u7d71\u8a08\u5b66", "\u7d71\u8a08\u5b66", "\u7d71\u8a08\u5b66\u5c02\u653b", "\u7d71\u8a08\u5b66\u5c02\u653b", "\u81ea\u7136\u8a00\u8a9e\u51e6\u7406", "\u81ea\u7136\u8a00\u8a9e\u51e6\u7406", "\u90fd\u5e02\u7d4c\u6e08", "\u90fd\u5e02\u7d4c\u6e08", "\u95a2\u897f", "\u95a2\u897f", "\u99c6\u3051\u51fa\u3057\u30a8\u30f3\u30b8\u30cb\u30a2\u3068\u7e4b\u304c\u308a\u305f\u3044", "\u99c6\u3051\u51fa\u3057\u30a8\u30f3\u30b8\u30cb\u30a2\u3068\u7e4b\u304c\u308a\u305f\u3044"]}, "R": 30, "lambda.step": 0.01, "plot.opts": {"xlab": "PC1", "ylab": "PC2"}, "topic.order": [1, 2]};
 9 | 
10 | function LDAvis_load_lib(url, callback){
11 |   var s = document.createElement('script');
12 |   s.src = url;
13 |   s.async = true;
14 |   s.onreadystatechange = s.onload = callback;
15 |   s.onerror = function(){console.warn("failed to load library " + url);};
16 |   document.getElementsByTagName("head")[0].appendChild(s);
17 | }
18 | 
19 | if(typeof(LDAvis) !== "undefined"){
20 |    // already loaded: just create the visualization
21 |    !function(LDAvis){
22 |        new LDAvis("#" + "ldavis_el1364554314548401154813291", ldavis_el1364554314548401154813291_data);
23 |    }(LDAvis);
24 | }else if(typeof define === "function" && define.amd){
25 |    // require.js is available: use it to load d3/LDAvis
26 |    require.config({paths: {d3: "https://cdnjs.cloudflare.com/ajax/libs/d3/3.5.5/d3.min"}});
27 |    require(["d3"], function(d3){
28 |       window.d3 = d3;
29 |       LDAvis_load_lib("https://cdn.rawgit.com/bmabey/pyLDAvis/files/ldavis.v1.0.0.js", function(){
30 |         new LDAvis("#" + "ldavis_el1364554314548401154813291", ldavis_el1364554314548401154813291_data);
31 |       });
32 |     });
33 | }else{
34 |     // require.js not available: dynamically load d3 & LDAvis
35 |     LDAvis_load_lib("https://cdnjs.cloudflare.com/ajax/libs/d3/3.5.5/d3.min.js", function(){
36 |          LDAvis_load_lib("https://cdn.rawgit.com/bmabey/pyLDAvis/files/ldavis.v1.0.0.js", function(){
37 |                  new LDAvis("#" + "ldavis_el1364554314548401154813291", ldavis_el1364554314548401154813291_data);
38 |             })
39 |          });
40 | }
41 | </script>


--------------------------------------------------------------------------------
/nlp/twitter_analytics_using_nlplot/2020-05-18_pyldavis.html:
--------------------------------------------------------------------------------
 1 | 
 2 | <link rel="stylesheet" type="text/css" href="https://cdn.rawgit.com/bmabey/pyLDAvis/files/ldavis.v1.0.0.css">
 3 | 
 4 | 
 5 | <div id="ldavis_el9529749609063602302636074"></div>
 6 | <script type="text/javascript">
 7 | 
 8 | var ldavis_el9529749609063602302636074_data = {"mdsDat": {"x": [0.14732801914215088, -0.14732801914215088], "y": [0.0, 0.0], "topics": [1, 2], "cluster": [1, 1], "Freq": [54.23051834106445, 45.76948165893555]}, "tinfo": {"Category": ["Default", "Default", "Default", "Default", "Default", "Default", "Default", "Default", "Default", "Default", "Default", "Default", "Default", "Default", "Default", "Default", "Default", "Default", "Default", "Default", "Default", "Default", "Default", "Default", "Default", "Default", "Default", "Default", "Default", "Default", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2"], "Freq": [1083.0, 1291.0, 373.0, 215.0, 193.0, 143.0, 165.0, 160.0, 162.0, 445.0, 93.0, 94.0, 93.0, 126.0, 84.0, 59.0, 59.0, 59.0, 41.0, 59.0, 59.0, 59.0, 184.0, 309.0, 24.0, 30.0, 25.0, 40.0, 26.0, 23.0, 159.1615447998047, 192.03477478027344, 160.61325073242188, 163.70472717285156, 82.86725616455078, 25.845924377441406, 21.581838607788086, 58.06324005126953, 23.222187042236328, 57.8823356628418, 29.681936264038086, 57.521446228027344, 13.140117645263672, 13.11875057220459, 13.117197036743164, 57.3104133605957, 23.732013702392578, 12.26113510131836, 18.796680450439453, 57.19434356689453, 355.6851501464844, 56.94751739501953, 13.729220390319824, 8.042810440063477, 8.026191711425781, 9.6015625, 7.945532321929932, 8.738409042358398, 7.138285160064697, 6.3428497314453125, 13.41327953338623, 1131.92236328125, 13.374342918395996, 12.518911361694336, 23.42352294921875, 226.88595581054688, 13.766777038574219, 79.88345336914062, 27.04385757446289, 125.40335845947266, 22.63872528076172, 60.304473876953125, 29.066852569580078, 20.645004272460938, 22.969127655029297, 83.40772247314453, 20.752046585083008, 139.58328247070312, 91.32024383544922, 91.79608154296875, 90.27067565917969, 39.439064025878906, 17.422725677490234, 10.748383522033691, 23.112539291381836, 12.357230186462402, 8.23248291015625, 7.3996076583862305, 18.083534240722656, 8.187993049621582, 13.905789375305176, 23.55620574951172, 8.11656379699707, 8.920405387878418, 13.751631736755371, 1000.2832641601562, 8.05480670928955, 7.246626853942871, 5.631561279296875, 5.627683639526367, 5.624212741851807, 5.6226372718811035, 6.418981075286865, 5.609947204589844, 196.89468383789062, 17.56036376953125, 5.578864574432373, 113.30939483642578, 13.53644847869873, 13.522589683532715, 9.544998168945312, 19.937145233154297, 7.172063827514648, 13.91380500793457, 33.347042083740234, 319.61688232421875, 19.261877059936523, 124.07888793945312, 10.850387573242188, 13.34872055053711, 11.343375205993652, 10.637520790100098, 13.892083168029785, 30.668466567993164, 82.59089660644531, 160.03582763671875, 22.895910263061523, 35.442535400390625, 19.03139305114746, 16.472131729125977, 17.645444869995117, 14.312366485595703], "Term": ["kaggle", "\u30c7\u30fc\u30bf\u30b5\u30a4\u30a8\u30f3\u30c6\u30a3\u30b9\u30c8", "\u30c7\u30fc\u30bf\u30b5\u30a4\u30a8\u30f3\u30b9", "python", "\u30de\u30fc\u30b1\u30c6\u30a3\u30f3\u30b0", "machinelearning", "\u30a4\u30f3\u30bf\u30fc\u30f3", "\u6642\u7d661000\u5186", "\u30a4\u30f3\u30bf\u30fc\u30f3\u30b7\u30c3\u30d7", "\u6a5f\u68b0\u5b66\u7fd2", "\u5916\u8cc7\u7cfb\u4f01\u696d", "\u5916\u8cc7\u7cfb", "\u7d71\u8a08\u5b66\u5c02\u653b", "\u7d71\u8a08", "\u30d3\u30c3\u30b0\u30c7\u30fc\u30bf", "\u7d4c\u6e08\u5b66\u5f92", "\u30df\u30af\u30ed\u7d4c\u6e08\u5b66", "\u30de\u30af\u30ed\u7d4c\u6e08\u5b66", "superintelligence", "uber", "\u90fd\u5e02\u7d4c\u6e08", "\u4ea4\u901a\u7d4c\u6e08", "ai", "\u7d71\u8a08\u5b66", "deeplearning", "\u6c42\u4eba", "titanic", "100daysofcode", "\u30c7\u30fc\u30bf\u30de\u30a4\u30cb\u30f3\u30b0", "\u30d0\u30c3\u30af\u30aa\u30d5\u30a3\u30b9", "\u6642\u7d661000\u5186", "\u30de\u30fc\u30b1\u30c6\u30a3\u30f3\u30b0", "\u30a4\u30f3\u30bf\u30fc\u30f3\u30b7\u30c3\u30d7", "\u30a4\u30f3\u30bf\u30fc\u30f3", "\u30d3\u30c3\u30b0\u30c7\u30fc\u30bf", "\u30c7\u30fc\u30bf\u30de\u30a4\u30cb\u30f3\u30b0", "\u30d3\u30b8\u30cd\u30b9\u7d71\u8a08", "\u7d4c\u6e08\u5b66\u5f92", "\u30d0\u30c3\u30af\u30aa\u30d5\u30a3\u30b9", "\u30df\u30af\u30ed\u7d4c\u6e08\u5b66", "\u6c42\u4eba", "\u30de\u30af\u30ed\u7d4c\u6e08\u5b66", "doe", "\u6771\u4eac\u90fd\u6e2f\u533a", "\u5b9f\u9a13\u8a08\u753b\u6cd5", "uber", "\u6a5f\u68b0\u5b66\u7fd2\u30a8\u30f3\u30b8\u30cb\u30a2", "\u30c7\u30fc\u30bf\u30b5\u30a4\u30a8\u30f3\u30c6\u30a3\u30b9\u30c8\u3042\u308b\u3042\u308b", "ai\u30a8\u30f3\u30b8\u30cb\u30a2", "\u90fd\u5e02\u7d4c\u6e08", "\u30c7\u30fc\u30bf\u30b5\u30a4\u30a8\u30f3\u30b9", "\u4ea4\u901a\u7d4c\u6e08", "\u30d5\u30ea\u30fc\u30e9\u30f3\u30b9", "\u6771\u4eac\u90fd\u6e0b\u8c37\u533a", "freelancestart", "it\u7d4c\u55b6", "rapidminer", "\u30d5\u30ea\u30fc\u30e9\u30f3\u30b9\u30b9\u30bf\u30fc\u30c8", "\u7b4b\u30c8\u30ec", "\u6848\u4ef6\u76f8\u5834", "bigdata", "\u30c7\u30fc\u30bf\u30b5\u30a4\u30a8\u30f3\u30c6\u30a3\u30b9\u30c8", "\u30d7\u30ed\u30b0\u30e9\u30df\u30f3\u30b0\u5b66\u7fd2", "mercariprize", "datascientist", "\u7d71\u8a08\u5b66", "\u30c7\u30fc\u30bf\u89e3\u6790", "\u30c7\u30fc\u30bf\u5206\u6790", "\u30a8\u30f3\u30b8\u30cb\u30a2", "\u6a5f\u68b0\u5b66\u7fd2", "\u4eca\u65e5\u306e\u7a4d\u307f\u4e0a\u3052", "ai", "\u99c6\u3051\u51fa\u3057\u30a8\u30f3\u30b8\u30cb\u30a2\u3068\u7e4b\u304c\u308a\u305f\u3044", "\u30d7\u30ed\u30b0\u30e9\u30df\u30f3\u30b0\u521d\u5fc3\u8005", "datascience", "kaggle", "\u4eba\u5de5\u77e5\u80fd", "machinelearning", "\u5916\u8cc7\u7cfb\u4f01\u696d", "\u5916\u8cc7\u7cfb", "\u7d71\u8a08\u5b66\u5c02\u653b", "superintelligence", "bragging", "santander", "deeplearning", "\u306f\u3066\u306a\u30d6\u30ed\u30b0", "winning", "javascript", "\u95a2\u897f", "\u30a8\u30f3\u30b8\u30cb\u30a2\u3068\u7e4b\u304c\u308a\u305f\u3044", "kaggleguide", "titanic", "lightgbm", "\u52c9\u5f37\u4f1a", "ml", "kaggle", "ncaa", "gbdt", "kansaiaipub", "gcp", "golang", "nodered", "\u30b5\u30f3\u30bf\u672c\u6c17\u51fa\u3059", "nodejs", "python", "\u5927\u962a", "\u30a2\u30f3\u30b5\u30f3\u30d6\u30eb", "\u7d71\u8a08", "kaggler", "it", "xgboost", "iot", "t5", "sql", "100daysofcode", "\u6a5f\u68b0\u5b66\u7fd2", "dena", "ai", "note", "signate", "\u81ea\u7136\u8a00\u8a9e\u51e6\u7406", "pandas", "twitter\u6c42\u4eba", "\u99c6\u3051\u51fa\u3057\u30a8\u30f3\u30b8\u30cb\u30a2\u3068\u7e4b\u304c\u308a\u305f\u3044", "\u7d71\u8a08\u5b66", "\u30c7\u30fc\u30bf\u30b5\u30a4\u30a8\u30f3\u30c6\u30a3\u30b9\u30c8", "datascience", "\u30c7\u30fc\u30bf\u5206\u6790", "\u4eba\u5de5\u77e5\u80fd", "\u30d7\u30ed\u30b0\u30e9\u30df\u30f3\u30b0", "\u30c7\u30fc\u30bf\u30b5\u30a4\u30a8\u30f3\u30b9", "\u30a8\u30f3\u30b8\u30cb\u30a2"], "Total": [1083.0, 1291.0, 373.0, 215.0, 193.0, 143.0, 165.0, 160.0, 162.0, 445.0, 93.0, 94.0, 93.0, 126.0, 84.0, 59.0, 59.0, 59.0, 41.0, 59.0, 59.0, 59.0, 184.0, 309.0, 24.0, 30.0, 25.0, 40.0, 26.0, 23.0, 160.42955017089844, 193.71583557128906, 162.14352416992188, 165.56649780273438, 84.50923156738281, 26.464859008789062, 22.198930740356445, 59.768863677978516, 23.907058715820312, 59.7746467590332, 30.742984771728516, 59.78443908691406, 13.664724349975586, 13.66533088684082, 13.665366172790527, 59.79075241088867, 24.77018165588379, 12.812346458435059, 19.64603042602539, 59.793907165527344, 373.3305969238281, 59.80083465576172, 14.525452613830566, 8.545166015625, 8.545663833618164, 10.255602836608887, 8.547869682312012, 9.402857780456543, 7.693454265594482, 6.838641166687012, 14.534539222717285, 1291.958251953125, 14.5357666015625, 13.682260513305664, 26.535221099853516, 309.47686767578125, 15.402151107788086, 115.32598876953125, 41.356224060058594, 445.0202331542969, 33.582035064697266, 184.38336181640625, 59.735321044921875, 33.64012908935547, 45.86503601074219, 1083.6910400390625, 39.78343963623047, 143.019287109375, 93.8747787475586, 94.74134063720703, 93.84490966796875, 41.21466827392578, 18.409175872802734, 11.394981384277344, 24.542604446411133, 13.14686393737793, 8.764246940612793, 7.8875885009765625, 19.2811336517334, 8.762985229492188, 14.896851539611816, 25.408126831054688, 8.760986328125, 9.636826515197754, 14.892617225646973, 1083.6910400390625, 8.759186744689941, 7.883160591125488, 6.131120681762695, 6.13102388381958, 6.130922317504883, 6.130888938903809, 7.006433963775635, 6.130496978759766, 215.4542236328125, 19.266185760498047, 6.129637241363525, 126.91802215576172, 14.886463165283203, 14.885948181152344, 10.507631301879883, 22.74604606628418, 7.881027698516846, 15.750205993652344, 40.18912124633789, 445.0202331542969, 22.726892471313477, 184.38336181640625, 12.250751495361328, 15.7340087890625, 13.117923736572266, 12.24471664428711, 18.308910369873047, 59.735321044921875, 309.47686767578125, 1291.958251953125, 45.86503601074219, 115.32598876953125, 39.78343963623047, 31.179227828979492, 373.3305969238281, 41.356224060058594], "loglift": [30.0, 29.0, 28.0, 27.0, 26.0, 25.0, 24.0, 23.0, 22.0, 21.0, 20.0, 19.0, 18.0, 17.0, 16.0, 15.0, 14.0, 13.0, 12.0, 11.0, 10.0, 9.0, 8.0, 7.0, 6.0, 5.0, 4.0, 3.0, 2.0, 1.0, 0.6039999723434448, 0.6032000184059143, 0.602400004863739, 0.600600004196167, 0.5922999978065491, 0.5882999897003174, 0.5837000012397766, 0.5830000042915344, 0.5828999876976013, 0.579800009727478, 0.5767999887466431, 0.5733000040054321, 0.5727999806404114, 0.5710999965667725, 0.5709999799728394, 0.569599986076355, 0.569100022315979, 0.5680000185966492, 0.5677000284194946, 0.5674999952316284, 0.5634999871253967, 0.5630000233650208, 0.5555999875068665, 0.5512999892234802, 0.5491999983787537, 0.5460000038146973, 0.5389000177383423, 0.5386000275611877, 0.5370000004768372, 0.5367000102996826, 0.5315999984741211, 0.4796999990940094, 0.5286999940872192, 0.5231000185012817, 0.487199991941452, 0.30149999260902405, 0.49970000982284546, 0.24469999969005585, 0.18719999492168427, -0.654699981212616, 0.2176000028848648, -0.5056999921798706, -0.10840000212192535, 0.12370000034570694, -0.07959999889135361, -1.9524999856948853, -0.03889999911189079, 0.7572000026702881, 0.7540000081062317, 0.75, 0.7426999807357788, 0.737500011920929, 0.7264999747276306, 0.7231000065803528, 0.7214999794960022, 0.7196000218391418, 0.718999981880188, 0.7177000045776367, 0.7174000144004822, 0.713699996471405, 0.7127000093460083, 0.7059000134468079, 0.7052000164985657, 0.7042999863624573, 0.7017999887466431, 0.7014999985694885, 0.697700023651123, 0.6973999738693237, 0.6966000199317932, 0.695900022983551, 0.6952999830245972, 0.6949999928474426, 0.6940000057220459, 0.692799985408783, 0.6915000081062317, 0.6887999773025513, 0.6873999834060669, 0.6680999994277954, 0.6865000128746033, 0.6855000257492065, 0.6855000257492065, 0.6496999859809875, 0.6873000264167786, 0.6575999855995178, 0.5949000120162964, 0.4505999982357025, 0.616100013256073, 0.3855000138282776, 0.6601999998092651, 0.6171000003814697, 0.6362000107765198, 0.6407999992370605, 0.5055000185966492, 0.11490000039339066, -0.5393999814987183, -1.3070000410079956, 0.0868000015616417, -0.3982999920845032, 0.044199999421834946, 0.14350000023841858, -2.270400047302246, -0.27950000762939453], "logprob": [30.0, 29.0, 28.0, 27.0, 26.0, 25.0, 24.0, 23.0, 22.0, 21.0, 20.0, 19.0, 18.0, 17.0, 16.0, 15.0, 14.0, 13.0, 12.0, 11.0, 10.0, 9.0, 8.0, 7.0, 6.0, 5.0, 4.0, 3.0, 2.0, 1.0, -3.5892999172210693, -3.4014999866485596, -3.580199956893921, -3.561199903488159, -4.242000102996826, -5.407100200653076, -5.587399959564209, -4.597700119018555, -5.514100074768066, -4.600800037384033, -5.268700122833252, -4.607100009918213, -6.083600044250488, -6.08519983291626, -6.085299968719482, -4.6107001304626465, -5.492400169372559, -6.1528000831604, -5.725500106811523, -4.612800121307373, -2.7852001190185547, -4.617099761962891, -6.039700031280518, -6.574399948120117, -6.576499938964844, -6.397299766540527, -6.586599826812744, -6.491499900817871, -6.69379997253418, -6.8119001388549805, -6.063000202178955, -1.6275999546051025, -6.065899848937988, -6.131999969482422, -5.505499839782715, -3.234800100326538, -6.0370001792907715, -4.27869987487793, -5.361800193786621, -3.827699899673462, -5.539599895477295, -4.559800148010254, -5.289599895477295, -5.631800174713135, -5.525100231170654, -4.235499858856201, -5.6265997886657715, -3.5508999824523926, -3.9751999378204346, -3.9700000286102295, -3.986799955368042, -4.814799785614014, -5.631800174713135, -6.114799976348877, -5.3491997718811035, -5.975399971008301, -6.381499767303467, -6.4882001876831055, -5.594600200653076, -6.386899948120117, -5.8572998046875, -5.3302001953125, -6.395699977874756, -6.301300048828125, -5.8684000968933105, -1.5815999507904053, -6.403299808502197, -6.509099960327148, -6.761199951171875, -6.761899948120117, -6.762499809265137, -6.762800216674805, -6.630300045013428, -6.765100002288818, -3.206899881362915, -5.624000072479248, -6.770599842071533, -3.759500026702881, -5.884200096130371, -5.885200023651123, -6.23360013961792, -5.497000217437744, -6.519400119781494, -5.8566999435424805, -4.982600212097168, -2.7225000858306885, -5.531499862670898, -3.6686999797821045, -6.105400085449219, -5.898200035095215, -6.060999870300293, -6.125199794769287, -5.85830020904541, -5.066400051116943, -4.075699806213379, -3.4142000675201416, -5.35860013961792, -4.9217000007629395, -5.543499946594238, -5.687900066375732, -5.619100093841553, -5.828499794006348]}, "token.table": {"Topic": [1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 2, 1, 2, 1, 2, 1, 2, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2], "Freq": [0.17417648434638977, 0.8211177587509155, 0.3254089653491974, 0.672511875629425, 0.9671164751052856, 0.05090086907148361, 0.8944212198257446, 0.0688016340136528, 0.05432073771953583, 0.9234525561332703, 0.5014713406562805, 0.5014713406562805, 0.866772472858429, 0.11305728554725647, 0.04074547067284584, 0.9371458292007446, 0.13200220465660095, 0.8360139727592468, 0.9513547420501709, 0.07318112999200821, 0.9361472725868225, 0.11701840907335281, 0.12685267627239227, 0.8879687190055847, 0.16310489177703857, 0.9786293506622314, 0.16310758888721466, 0.9786455631256104, 0.13189105689525604, 0.8792737126350403, 0.06717744469642639, 0.9404842853546143, 0.9750767350196838, 0.09750767797231674, 0.8874702453613281, 0.07659009844064713, 0.922772228717804, 0.06712827831506729, 0.9397959113121033, 0.06717512011528015, 0.9404517412185669, 0.9786139130592346, 0.11414240300655365, 0.9131392240524292, 0.020976191386580467, 0.9788889288902283, 0.9501354098320007, 0.07308733463287354, 0.06714736670255661, 0.9400631189346313, 0.11416584998369217, 0.9133267998695374, 0.16311891376972198, 0.9787134528160095, 0.1631084829568863, 0.9786509275436401, 0.08162764459848404, 0.897904098033905, 0.16333575546741486, 0.8983466625213623, 0.08818578720092773, 0.9143473505973816, 0.9359056949615479, 0.11698821187019348, 0.08775793015956879, 0.9653372764587402, 0.1271131932735443, 0.8262357115745544, 0.12698246538639069, 0.888877272605896, 0.04852641373872757, 0.9462650418281555, 0.1268870085477829, 0.8882090449333191, 0.07871497422456741, 0.9445796608924866, 0.21847285330295563, 0.7646549940109253, 0.9533246755599976, 0.033449988812208176, 0.11409993469715118, 0.9127994775772095, 0.09516892582178116, 0.9516893029212952, 0.07606376707553864, 0.9127652049064636, 0.16314178705215454, 0.9788507223129272, 0.9905385375022888, 0.012079738080501556, 0.9929474592208862, 0.012334750965237617, 0.6528642177581787, 0.33852219581604004, 0.1141163632273674, 0.9129309058189392, 0.14272595942020416, 0.8563557267189026, 0.9535784125328064, 0.048214640468358994, 0.8761892914772034, 0.12384301424026489, 0.9365965723991394, 0.07804971933364868, 0.982434868812561, 0.037785954773426056, 0.69368577003479, 0.30348753929138184, 0.9089639186859131, 0.12985199689865112, 0.962058961391449, 0.04182865098118782, 0.9910387396812439, 0.04504721611738205, 0.9821411967277527, 0.023666054010391235, 0.9638254046440125, 0.06884466856718063, 0.9571558237075806, 0.10635064542293549, 0.4810895323753357, 0.5131621360778809, 0.6242544651031494, 0.38644322752952576, 0.8943457007408142, 0.0687958225607872, 0.9701521396636963, 0.03345352038741112, 0.9911425113677979, 0.01032440084964037, 0.9703110456466675, 0.033459000289440155, 0.9531639814376831, 0.050166524946689606, 0.5278578400611877, 0.47758564352989197, 0.6848899722099304, 0.3275560736656189, 0.10376860201358795, 0.9339174032211304, 0.03166516125202179, 0.9710649847984314, 0.031957466155290604, 0.9693764448165894, 0.10380882024765015, 0.9342793822288513, 0.9513100385665894, 0.07317769527435303, 0.9910892248153687, 0.006233265623450279, 0.936201810836792, 0.117025226354599, 0.9513124823570251, 0.07317788153886795, 0.8773672580718994, 0.28088611364364624, 0.7190684080123901, 0.9689068794250488, 0.0403711199760437, 0.9758324027061462, 0.03252774477005005, 0.9098643660545349, 0.12998062372207642, 0.9704049229621887, 0.03346223756670952, 0.11030742526054382, 0.8903384804725647, 0.733495831489563, 0.2681945264339447, 0.04262351617217064, 0.9590290784835815, 0.1524631530046463, 0.8385473489761353, 0.9532743692398071, 0.050172336399555206, 0.05186416953802109, 0.9335550665855408, 0.48547491431236267, 0.5189559459686279], "Term": ["100daysofcode", "100daysofcode", "ai", "ai", "ai\u30a8\u30f3\u30b8\u30cb\u30a2", "ai\u30a8\u30f3\u30b8\u30cb\u30a2", "bigdata", "bigdata", "bragging", "bragging", "datascience", "datascience", "datascientist", "datascientist", "deeplearning", "deeplearning", "dena", "dena", "doe", "doe", "freelancestart", "freelancestart", "gbdt", "gbdt", "gcp", "gcp", "golang", "golang", "iot", "iot", "it", "it", "it\u7d4c\u55b6", "it\u7d4c\u55b6", "javascript", "kaggle", "kaggle", "kaggleguide", "kaggleguide", "kaggler", "kaggler", "kansaiaipub", "lightgbm", "lightgbm", "machinelearning", "machinelearning", "mercariprize", "mercariprize", "ml", "ml", "ncaa", "ncaa", "nodejs", "nodejs", "nodered", "nodered", "note", "note", "pandas", "pandas", "python", "python", "rapidminer", "rapidminer", "santander", "santander", "signate", "signate", "sql", "sql", "superintelligence", "superintelligence", "t5", "t5", "titanic", "titanic", "twitter\u6c42\u4eba", "twitter\u6c42\u4eba", "uber", "uber", "winning", "winning", "xgboost", "xgboost", "\u306f\u3066\u306a\u30d6\u30ed\u30b0", "\u306f\u3066\u306a\u30d6\u30ed\u30b0", "\u30a2\u30f3\u30b5\u30f3\u30d6\u30eb", "\u30a2\u30f3\u30b5\u30f3\u30d6\u30eb", "\u30a4\u30f3\u30bf\u30fc\u30f3", "\u30a4\u30f3\u30bf\u30fc\u30f3", "\u30a4\u30f3\u30bf\u30fc\u30f3\u30b7\u30c3\u30d7", "\u30a4\u30f3\u30bf\u30fc\u30f3\u30b7\u30c3\u30d7", "\u30a8\u30f3\u30b8\u30cb\u30a2", "\u30a8\u30f3\u30b8\u30cb\u30a2", "\u30a8\u30f3\u30b8\u30cb\u30a2\u3068\u7e4b\u304c\u308a\u305f\u3044", "\u30a8\u30f3\u30b8\u30cb\u30a2\u3068\u7e4b\u304c\u308a\u305f\u3044", "\u30b5\u30f3\u30bf\u672c\u6c17\u51fa\u3059", "\u30b5\u30f3\u30bf\u672c\u6c17\u51fa\u3059", "\u30c7\u30fc\u30bf\u30b5\u30a4\u30a8\u30f3\u30b9", "\u30c7\u30fc\u30bf\u30b5\u30a4\u30a8\u30f3\u30b9", "\u30c7\u30fc\u30bf\u30b5\u30a4\u30a8\u30f3\u30c6\u30a3\u30b9\u30c8", "\u30c7\u30fc\u30bf\u30b5\u30a4\u30a8\u30f3\u30c6\u30a3\u30b9\u30c8", "\u30c7\u30fc\u30bf\u30b5\u30a4\u30a8\u30f3\u30c6\u30a3\u30b9\u30c8\u3042\u308b\u3042\u308b", "\u30c7\u30fc\u30bf\u30b5\u30a4\u30a8\u30f3\u30c6\u30a3\u30b9\u30c8\u3042\u308b\u3042\u308b", "\u30c7\u30fc\u30bf\u30de\u30a4\u30cb\u30f3\u30b0", "\u30c7\u30fc\u30bf\u30de\u30a4\u30cb\u30f3\u30b0", "\u30c7\u30fc\u30bf\u5206\u6790", "\u30c7\u30fc\u30bf\u5206\u6790", "\u30c7\u30fc\u30bf\u89e3\u6790", "\u30c7\u30fc\u30bf\u89e3\u6790", "\u30d0\u30c3\u30af\u30aa\u30d5\u30a3\u30b9", "\u30d0\u30c3\u30af\u30aa\u30d5\u30a3\u30b9", "\u30d3\u30b8\u30cd\u30b9\u7d71\u8a08", "\u30d3\u30b8\u30cd\u30b9\u7d71\u8a08", "\u30d3\u30c3\u30b0\u30c7\u30fc\u30bf", "\u30d3\u30c3\u30b0\u30c7\u30fc\u30bf", "\u30d5\u30ea\u30fc\u30e9\u30f3\u30b9", "\u30d5\u30ea\u30fc\u30e9\u30f3\u30b9", "\u30d5\u30ea\u30fc\u30e9\u30f3\u30b9\u30b9\u30bf\u30fc\u30c8", "\u30d5\u30ea\u30fc\u30e9\u30f3\u30b9\u30b9\u30bf\u30fc\u30c8", "\u30d7\u30ed\u30b0\u30e9\u30df\u30f3\u30b0", "\u30d7\u30ed\u30b0\u30e9\u30df\u30f3\u30b0", "\u30d7\u30ed\u30b0\u30e9\u30df\u30f3\u30b0\u521d\u5fc3\u8005", "\u30d7\u30ed\u30b0\u30e9\u30df\u30f3\u30b0\u521d\u5fc3\u8005", "\u30d7\u30ed\u30b0\u30e9\u30df\u30f3\u30b0\u5b66\u7fd2", "\u30d7\u30ed\u30b0\u30e9\u30df\u30f3\u30b0\u5b66\u7fd2", "\u30de\u30af\u30ed\u7d4c\u6e08\u5b66", "\u30de\u30af\u30ed\u7d4c\u6e08\u5b66", "\u30de\u30fc\u30b1\u30c6\u30a3\u30f3\u30b0", "\u30de\u30fc\u30b1\u30c6\u30a3\u30f3\u30b0", "\u30df\u30af\u30ed\u7d4c\u6e08\u5b66", "\u30df\u30af\u30ed\u7d4c\u6e08\u5b66", "\u4ea4\u901a\u7d4c\u6e08", "\u4ea4\u901a\u7d4c\u6e08", "\u4eba\u5de5\u77e5\u80fd", "\u4eba\u5de5\u77e5\u80fd", "\u4eca\u65e5\u306e\u7a4d\u307f\u4e0a\u3052", "\u4eca\u65e5\u306e\u7a4d\u307f\u4e0a\u3052", "\u52c9\u5f37\u4f1a", "\u52c9\u5f37\u4f1a", "\u5916\u8cc7\u7cfb", "\u5916\u8cc7\u7cfb", "\u5916\u8cc7\u7cfb\u4f01\u696d", "\u5916\u8cc7\u7cfb\u4f01\u696d", "\u5927\u962a", "\u5927\u962a", "\u5b9f\u9a13\u8a08\u753b\u6cd5", "\u5b9f\u9a13\u8a08\u753b\u6cd5", "\u6642\u7d661000\u5186", "\u6642\u7d661000\u5186", "\u6771\u4eac\u90fd\u6e0b\u8c37\u533a", "\u6771\u4eac\u90fd\u6e0b\u8c37\u533a", "\u6771\u4eac\u90fd\u6e2f\u533a", "\u6771\u4eac\u90fd\u6e2f\u533a", "\u6848\u4ef6\u76f8\u5834", "\u6a5f\u68b0\u5b66\u7fd2", "\u6a5f\u68b0\u5b66\u7fd2", "\u6a5f\u68b0\u5b66\u7fd2\u30a8\u30f3\u30b8\u30cb\u30a2", "\u6a5f\u68b0\u5b66\u7fd2\u30a8\u30f3\u30b8\u30cb\u30a2", "\u6c42\u4eba", "\u6c42\u4eba", "\u7b4b\u30c8\u30ec", "\u7b4b\u30c8\u30ec", "\u7d4c\u6e08\u5b66\u5f92", "\u7d4c\u6e08\u5b66\u5f92", "\u7d71\u8a08", "\u7d71\u8a08", "\u7d71\u8a08\u5b66", "\u7d71\u8a08\u5b66", "\u7d71\u8a08\u5b66\u5c02\u653b", "\u7d71\u8a08\u5b66\u5c02\u653b", "\u81ea\u7136\u8a00\u8a9e\u51e6\u7406", "\u81ea\u7136\u8a00\u8a9e\u51e6\u7406", "\u90fd\u5e02\u7d4c\u6e08", "\u90fd\u5e02\u7d4c\u6e08", "\u95a2\u897f", "\u95a2\u897f", "\u99c6\u3051\u51fa\u3057\u30a8\u30f3\u30b8\u30cb\u30a2\u3068\u7e4b\u304c\u308a\u305f\u3044", "\u99c6\u3051\u51fa\u3057\u30a8\u30f3\u30b8\u30cb\u30a2\u3068\u7e4b\u304c\u308a\u305f\u3044"]}, "R": 30, "lambda.step": 0.01, "plot.opts": {"xlab": "PC1", "ylab": "PC2"}, "topic.order": [1, 2]};
 9 | 
10 | function LDAvis_load_lib(url, callback){
11 |   var s = document.createElement('script');
12 |   s.src = url;
13 |   s.async = true;
14 |   s.onreadystatechange = s.onload = callback;
15 |   s.onerror = function(){console.warn("failed to load library " + url);};
16 |   document.getElementsByTagName("head")[0].appendChild(s);
17 | }
18 | 
19 | if(typeof(LDAvis) !== "undefined"){
20 |    // already loaded: just create the visualization
21 |    !function(LDAvis){
22 |        new LDAvis("#" + "ldavis_el9529749609063602302636074", ldavis_el9529749609063602302636074_data);
23 |    }(LDAvis);
24 | }else if(typeof define === "function" && define.amd){
25 |    // require.js is available: use it to load d3/LDAvis
26 |    require.config({paths: {d3: "https://cdnjs.cloudflare.com/ajax/libs/d3/3.5.5/d3.min"}});
27 |    require(["d3"], function(d3){
28 |       window.d3 = d3;
29 |       LDAvis_load_lib("https://cdn.rawgit.com/bmabey/pyLDAvis/files/ldavis.v1.0.0.js", function(){
30 |         new LDAvis("#" + "ldavis_el9529749609063602302636074", ldavis_el9529749609063602302636074_data);
31 |       });
32 |     });
33 | }else{
34 |     // require.js not available: dynamically load d3 & LDAvis
35 |     LDAvis_load_lib("https://cdnjs.cloudflare.com/ajax/libs/d3/3.5.5/d3.min.js", function(){
36 |          LDAvis_load_lib("https://cdn.rawgit.com/bmabey/pyLDAvis/files/ldavis.v1.0.0.js", function(){
37 |                  new LDAvis("#" + "ldavis_el9529749609063602302636074", ldavis_el9529749609063602302636074_data);
38 |             })
39 |          });
40 | }
41 | </script>


--------------------------------------------------------------------------------
/nlp/twitter_analytics_using_nlplot/2020-05-19_pyldavis.html:
--------------------------------------------------------------------------------
 1 | 
 2 | <link rel="stylesheet" type="text/css" href="https://cdn.rawgit.com/bmabey/pyLDAvis/files/ldavis.v1.0.0.css">
 3 | 
 4 | 
 5 | <div id="ldavis_el9495029960344908182359"></div>
 6 | <script type="text/javascript">
 7 | 
 8 | var ldavis_el9495029960344908182359_data = {"mdsDat": {"x": [0.08507826179265976, -0.08507826179265976], "y": [0.0, 0.0], "topics": [1, 2], "cluster": [1, 1], "Freq": [55.547279357910156, 44.452728271484375]}, "tinfo": {"Category": ["Default", "Default", "Default", "Default", "Default", "Default", "Default", "Default", "Default", "Default", "Default", "Default", "Default", "Default", "Default", "Default", "Default", "Default", "Default", "Default", "Default", "Default", "Default", "Default", "Default", "Default", "Default", "Default", "Default", "Default", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic1", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2", "Topic2"], "Freq": [1118.0, 1254.0, 151.0, 224.0, 185.0, 360.0, 153.0, 155.0, 158.0, 99.0, 99.0, 98.0, 131.0, 81.0, 447.0, 43.0, 187.0, 57.0, 25.0, 57.0, 23.0, 25.0, 19.0, 21.0, 22.0, 29.0, 58.0, 26.0, 20.0, 20.0, 148.139404296875, 177.83096313476562, 148.51284790039062, 150.3623809814453, 23.90237808227539, 75.8281021118164, 19.888795852661133, 12.205190658569336, 12.096857070922852, 21.143798828125, 12.071135520935059, 11.28732681274414, 7.416586399078369, 11.830483436584473, 16.955379486083984, 8.824893951416016, 26.400760650634766, 7.331339359283447, 5.821953296661377, 316.46844482421875, 50.329010009765625, 5.0215888023376465, 4.299502849578857, 4.296092987060547, 12.156294822692871, 20.727739334106445, 4.282054901123047, 6.416611194610596, 4.9841837882995605, 4.270104885101318, 49.4443244934082, 1036.5765380859375, 12.086219787597656, 47.684112548828125, 11.852518081665039, 46.65896987915039, 46.09611511230469, 211.5517120361328, 44.90209197998047, 74.87315368652344, 31.280288696289062, 208.8214569091797, 18.050920486450195, 23.015308380126953, 283.5564270019531, 19.326858520507812, 73.92188262939453, 22.589630126953125, 33.40374755859375, 42.72516632080078, 21.71718406677246, 30.836101531982422, 20.26271629333496, 138.98013305664062, 7.638558864593506, 8.38965892791748, 89.51300048828125, 4.154171466827393, 4.1230692863464355, 88.53765869140625, 5.71305513381958, 4.891557216644287, 10.591197967529297, 4.055782318115234, 4.863410949707031, 5.663389682769775, 8.088595390319824, 4.037878513336182, 5.643208026885986, 5.6340484619140625, 4.806705951690674, 4.7999267578125, 3.996717929840088, 3.9955880641937256, 4.787808895111084, 5.560306072235107, 3.1651840209960938, 3.952822208404541, 84.48169708251953, 3.153836727142334, 3.1530377864837646, 4.702119827270508, 3.119171142578125, 36.538238525390625, 21.82358741760254, 16.304656982421875, 11.664970397949219, 181.93724060058594, 19.8364315032959, 835.1500244140625, 100.68860626220703, 12.95047664642334, 12.889805793762207, 8.544553756713867, 15.907875061035156, 15.886061668395996, 12.53409481048584, 7.668686866760254, 113.75929260253906, 19.57229232788086, 238.686279296875, 10.217283248901367, 11.872101783752441, 24.502803802490234, 11.36962890625, 93.41694641113281, 217.84288024902344, 26.186647415161133, 39.25775909423828, 19.786212921142578, 18.099977493286133, 44.197792053222656, 12.973491668701172, 13.5967435836792, 13.79161548614502], "Term": ["kaggle", "\u30c7\u30fc\u30bf\u30b5\u30a4\u30a8\u30f3\u30c6\u30a3\u30b9\u30c8", "machinelearning", "python", "\u30de\u30fc\u30b1\u30c6\u30a3\u30f3\u30b0", "\u30c7\u30fc\u30bf\u30b5\u30a4\u30a8\u30f3\u30b9", "\u6642\u7d661000\u5186", "\u30a4\u30f3\u30bf\u30fc\u30f3\u30b7\u30c3\u30d7", "\u30a4\u30f3\u30bf\u30fc\u30f3", "\u5916\u8cc7\u7cfb\u4f01\u696d", "\u5916\u8cc7\u7cfb", "\u7d71\u8a08\u5b66\u5c02\u653b", "\u7d71\u8a08", "\u30d3\u30c3\u30b0\u30c7\u30fc\u30bf", "\u6a5f\u68b0\u5b66\u7fd2", "superintelligence", "ai", "\u7d4c\u6e08\u5b66\u5f92", "deeplearning", "\u30df\u30af\u30ed\u7d4c\u6e08\u5b66", "iot", "\u30c7\u30fc\u30bf\u30de\u30a4\u30cb\u30f3\u30b0", "bragging", "\u30d3\u30b8\u30cd\u30b9\u7d71\u8a08", "\u30d0\u30c3\u30af\u30aa\u30d5\u30a3\u30b9", "\u6c42\u4eba", "\u30de\u30af\u30ed\u7d4c\u6e08\u5b66", "titanic", "\u5927\u962a", "\u95a2\u897f", "\u6642\u7d661000\u5186", "\u30de\u30fc\u30b1\u30c6\u30a3\u30f3\u30b0", "\u30a4\u30f3\u30bf\u30fc\u30f3\u30b7\u30c3\u30d7", "\u30a4\u30f3\u30bf\u30fc\u30f3", "\u30c7\u30fc\u30bf\u30de\u30a4\u30cb\u30f3\u30b0", "\u30d3\u30c3\u30b0\u30c7\u30fc\u30bf", "\u30d3\u30b8\u30cd\u30b9\u7d71\u8a08", "doe", "\u5b9f\u9a13\u8a08\u753b\u6cd5", "\u30d0\u30c3\u30af\u30aa\u30d5\u30a3\u30b9", "\u6771\u4eac\u90fd\u6e2f\u533a", "\u30c7\u30fc\u30bf\u30b5\u30a4\u30a8\u30f3\u30c6\u30a3\u30b9\u30c8\u3042\u308b\u3042\u308b", "\u6771\u4eac\u90fd\u6e0b\u8c37\u533a", "mercariprize", "ai\u30a8\u30f3\u30b8\u30cb\u30a2", "it\u7d4c\u55b6", "\u6c42\u4eba", "freelancestart", "\u6848\u4ef6\u76f8\u5834", "\u30c7\u30fc\u30bf\u30b5\u30a4\u30a8\u30f3\u30b9", "\u7d4c\u6e08\u5b66\u5f92", "\u30c7\u30fc\u30bf\u6d3b\u7528", "\u30a8\u30af\u30b9\u30d7\u30ed\u30e9\u30c8\u30ea\u30fc", "ibmspss", "\u30d5\u30ea\u30fc\u30e9\u30f3\u30b9", "\u6a5f\u68b0\u5b66\u7fd2\u30a8\u30f3\u30b8\u30cb\u30a2", "\u897f\u7530\u52d8\u4e00\u90ce", "\u7b4b\u30c8\u30ec", "\u30ec\u30b3\u30e1\u30f3\u30c9", "\u30a8\u30f3\u30b8\u30cb\u30a2\u8ee2\u8077", "\u30df\u30af\u30ed\u7d4c\u6e08\u5b66", "\u30c7\u30fc\u30bf\u30b5\u30a4\u30a8\u30f3\u30c6\u30a3\u30b9\u30c8", "bigdata", "\u30de\u30af\u30ed\u7d4c\u6e08\u5b66", "\u30d7\u30ed\u30b0\u30e9\u30df\u30f3\u30b0\u5b66\u7fd2", "uber", "\u90fd\u5e02\u7d4c\u6e08", "\u7d71\u8a08\u5b66", "\u4ea4\u901a\u7d4c\u6e08", "\u30c7\u30fc\u30bf\u5206\u6790", "datascience", "\u6a5f\u68b0\u5b66\u7fd2", "\u99c6\u3051\u51fa\u3057\u30a8\u30f3\u30b8\u30cb\u30a2", "\u30d7\u30ed\u30b0\u30e9\u30df\u30f3\u30b0\u521d\u5fc3\u8005", "kaggle", "datascientist", "ai", "\u4eca\u65e5\u306e\u7a4d\u307f\u4e0a\u3052", "\u99c6\u3051\u51fa\u3057\u30a8\u30f3\u30b8\u30cb\u30a2\u3068\u7e4b\u304c\u308a\u305f\u3044", "python", "\u4eba\u5de5\u77e5\u80fd", "\u7d71\u8a08", "100daysofcode", "machinelearning", "javascript", "winning", "\u5916\u8cc7\u7cfb\u4f01\u696d", "deep", "machine", "\u5916\u8cc7\u7cfb", "kansaiaipub", "\u8133\u6ce2", "santander", "\u30c1\u30e5\u30fc\u30c8\u30ea\u30a2\u30eb", "word2vec", "gcp", "\u30a8\u30f3\u30b8\u30cb\u30a2\u3068\u7e4b\u304c\u308a\u305f\u3044", "kernel", "golang", "nodered", "\u30e1\u30eb\u30ab\u30ea", "\u5927\u5b66\u767a", "\u5730\u57df\u79d1\u5b66", "\u521d\u5fc3\u8005\u5411\u3051", "\u6280\u8853\u66f8\u5178", "nodejs", "logisticregression", "\u91cf\u5b50\u30b3\u30f3\u30d4\u30e5\u30fc\u30bf", "\u7d71\u8a08\u5b66\u5c02\u653b", "ibmdojo", "\u5927\u5b66\u9662\u4fee\u58eb", "pytorch", "\u6295\u7968", "superintelligence", "deeplearning", "bragging", "\u306f\u3066\u306a\u30d6\u30ed\u30b0", "python", "iot", "kaggle", "\u7d71\u8a08", "it", "ml", "\u52c9\u5f37\u4f1a", "\u5927\u962a", "\u95a2\u897f", "kaggleguide", "lightgbm", "ai", "titanic", "\u6a5f\u68b0\u5b66\u7fd2", "note", "sql", "\u30a8\u30f3\u30b8\u30cb\u30a2", "signate", "\u7d71\u8a08\u5b66", "\u30c7\u30fc\u30bf\u30b5\u30a4\u30a8\u30f3\u30c6\u30a3\u30b9\u30c8", "\u99c6\u3051\u51fa\u3057\u30a8\u30f3\u30b8\u30cb\u30a2\u3068\u7e4b\u304c\u308a\u305f\u3044", "\u30c7\u30fc\u30bf\u5206\u6790", "100daysofcode", "\u4eba\u5de5\u77e5\u80fd", "\u30c7\u30fc\u30bf\u30b5\u30a4\u30a8\u30f3\u30b9", "dena", "datascience", "\u4ea4\u901a\u7d4c\u6e08"], "Total": [1118.0, 1254.0, 151.0, 224.0, 185.0, 360.0, 153.0, 155.0, 158.0, 99.0, 99.0, 98.0, 131.0, 81.0, 447.0, 43.0, 187.0, 57.0, 25.0, 57.0, 23.0, 25.0, 19.0, 21.0, 22.0, 29.0, 58.0, 26.0, 20.0, 20.0, 153.2428741455078, 185.20816040039062, 155.06568908691406, 158.53988647460938, 25.3525447845459, 81.04905700683594, 21.288393020629883, 13.105953216552734, 13.123123168945312, 22.96908950805664, 13.127164840698242, 12.311966896057129, 8.22504997253418, 13.165610313415527, 18.93457794189453, 9.882019996643066, 29.657590866088867, 8.238725662231445, 6.597639083862305, 360.6662292480469, 57.82984924316406, 5.784577369689941, 4.958719253540039, 4.9593048095703125, 14.054410934448242, 23.976821899414062, 4.96156644821167, 7.443853855133057, 5.790388584136963, 4.9636077880859375, 57.974342346191406, 1254.41943359375, 14.065717697143555, 58.251060485839844, 14.10372543334961, 58.41606903076172, 58.50464630126953, 304.9686584472656, 58.69370651245117, 114.13091278076172, 44.87703323364258, 447.50775146484375, 23.463542938232422, 33.022029876708984, 1118.7064208984375, 26.08376121520996, 187.68118286132812, 33.09010696411133, 59.59039306640625, 224.66241455078125, 39.817161560058594, 131.5247039794922, 40.048927307128906, 151.40406799316406, 8.354763984680176, 9.269575119018555, 99.15034484863281, 4.629244327545166, 4.624871253967285, 99.82669830322266, 6.466637134552002, 5.5420308113098145, 12.006973266601562, 4.6154656410217285, 5.538036346435547, 6.459677696228027, 9.227805137634277, 4.613115310668945, 6.456888675689697, 6.455685138702393, 5.530399322509766, 5.529430866241455, 4.607381820678711, 4.607214450836182, 5.527660369873047, 6.445372104644775, 3.6814804077148438, 4.601387977600098, 98.4564208984375, 3.6798207759857178, 3.6798501014709473, 5.516014575958252, 3.675138473510742, 43.1656608581543, 25.72521209716797, 19.284339904785156, 13.777559280395508, 224.66241455078125, 23.82864761352539, 1118.7064208984375, 131.5247039794922, 15.577102661132812, 15.569130897521973, 10.102046966552734, 20.04140853881836, 20.038253784179688, 15.519182205200195, 9.170108795166016, 187.68118286132812, 26.225317001342773, 447.50775146484375, 12.766533851623535, 16.239900588989258, 42.322776794433594, 16.170164108276367, 304.9686584472656, 1254.41943359375, 59.59039306640625, 114.13091278076172, 40.048927307128906, 39.817161560058594, 360.6662292480469, 22.882408142089844, 44.87703323364258, 58.69370651245117], "loglift": [30.0, 29.0, 28.0, 27.0, 26.0, 25.0, 24.0, 23.0, 22.0, 21.0, 20.0, 19.0, 18.0, 17.0, 16.0, 15.0, 14.0, 13.0, 12.0, 11.0, 10.0, 9.0, 8.0, 7.0, 6.0, 5.0, 4.0, 3.0, 2.0, 1.0, 0.554099977016449, 0.5472999811172485, 0.5447999835014343, 0.5350000262260437, 0.5289999842643738, 0.521399974822998, 0.5199000239372253, 0.516700029373169, 0.5065000057220459, 0.5051000118255615, 0.5041000247001648, 0.5009999871253967, 0.484499990940094, 0.48100000619888306, 0.47749999165534973, 0.4747999906539917, 0.4715999960899353, 0.47119998931884766, 0.4629000127315521, 0.45719999074935913, 0.4490000009536743, 0.4465000033378601, 0.44530001282691956, 0.44440001249313354, 0.44279998540878296, 0.4422999918460846, 0.4406000077724457, 0.43939998745918274, 0.43799999356269836, 0.4374000132083893, 0.42879998683929443, 0.39719998836517334, 0.43630000948905945, 0.387800008058548, 0.414000004529953, 0.36320000886917114, 0.3495999872684479, 0.22220000624656677, 0.32010000944137573, 0.1664000004529953, 0.22699999809265137, -0.17430000007152557, 0.3257000148296356, 0.22689999639987946, -0.784600019454956, 0.288100004196167, -0.34380000829696655, 0.2062000036239624, 0.009100000374019146, -1.0719000101089478, -0.018300000578165054, -0.8626000285148621, -0.0934000015258789, 0.7250999808311462, 0.7210999727249146, 0.7110000252723694, 0.7085000276565552, 0.7024999856948853, 0.695900022983551, 0.6906999945640564, 0.6868000030517578, 0.6858999729156494, 0.6852999925613403, 0.6815000176429749, 0.6808000206947327, 0.6791999936103821, 0.6790000200271606, 0.6776000261306763, 0.6759999990463257, 0.6746000051498413, 0.6704999804496765, 0.6693000197410583, 0.6686000227928162, 0.6682999730110168, 0.6671000123023987, 0.6629999876022339, 0.659600019454956, 0.6588000059127808, 0.6577000021934509, 0.656499981880188, 0.6561999917030334, 0.6510999798774719, 0.6467000246047974, 0.64410001039505, 0.6463000178337097, 0.6428999900817871, 0.6442999839782715, 0.5997999906539917, 0.6273999810218811, 0.5184000134468079, 0.5436000227928162, 0.6261000037193298, 0.6219000220298767, 0.6432999968528748, 0.579800009727478, 0.578499972820282, 0.597100019454956, 0.6319000124931335, 0.3100999891757965, 0.5181000232696533, 0.18219999969005585, 0.5879999995231628, 0.4975000023841858, 0.26420000195503235, 0.4584999978542328, -0.3723999857902527, -0.9398999810218811, -0.011500000022351742, -0.2565000057220459, 0.10559999942779541, 0.02239999920129776, -1.2884999513626099, 0.24330000579357147, -0.38339999318122864, -0.637499988079071], "logprob": [30.0, 29.0, 28.0, 27.0, 26.0, 25.0, 24.0, 23.0, 22.0, 21.0, 20.0, 19.0, 18.0, 17.0, 16.0, 15.0, 14.0, 13.0, 12.0, 11.0, 10.0, 9.0, 8.0, 7.0, 6.0, 5.0, 4.0, 3.0, 2.0, 1.0, -3.6851000785827637, -3.5023999214172363, -3.682499885559082, -3.6702001094818115, -5.509200096130371, -4.354700088500977, -5.6930999755859375, -6.181399822235107, -6.190299987792969, -5.631899833679199, -6.192399978637695, -6.259500026702881, -6.679500102996826, -6.212500095367432, -5.85260009765625, -6.5055999755859375, -5.409800052642822, -6.691100120544434, -6.921599864959717, -2.9260001182556152, -4.764599800109863, -7.069499969482422, -7.224699974060059, -7.225500106811523, -6.185400009155273, -5.651700019836426, -7.228799819946289, -6.8242998123168945, -7.076900005340576, -7.231599807739258, -4.782400131225586, -1.7395000457763672, -6.191199779510498, -4.818600177764893, -6.210700035095215, -4.840400218963623, -4.852499961853027, -3.328700065612793, -4.878699779510498, -4.367400169372559, -5.240200042724609, -3.3417000770568848, -5.789999961853027, -5.547100067138672, -3.035799980163574, -5.721700191497803, -4.380199909210205, -5.565700054168701, -5.174499988555908, -4.928400039672852, -5.605100154876709, -5.254499912261963, -5.6743998527526855, -3.526099920272827, -6.427199840545654, -6.333399772644043, -3.9660000801086426, -7.036300182342529, -7.043799877166748, -3.9769999980926514, -6.717700004577637, -6.872900009155273, -6.100399971008301, -7.060299873352051, -6.878699779510498, -6.726399898529053, -6.369999885559082, -7.064700126647949, -6.730000019073486, -6.731599807739258, -6.890399932861328, -6.8917999267578125, -7.074900150299072, -7.075200080871582, -6.8942999839782715, -6.744800090789795, -7.308199882507324, -7.085999965667725, -4.023900032043457, -7.311800003051758, -7.311999797821045, -6.912399768829346, -7.322800159454346, -4.861999988555908, -5.377399921417236, -5.669000148773193, -6.003799915313721, -3.256700038909912, -5.472899913787842, -1.732800006866455, -3.848400115966797, -5.8993000984191895, -5.9039998054504395, -6.315100193023682, -5.693600177764893, -5.695000171661377, -5.932000160217285, -6.423299789428711, -3.726300001144409, -5.486299991607666, -2.985300064086914, -6.136300086975098, -5.986199855804443, -5.261600017547607, -6.0295000076293945, -3.92330002784729, -3.0766000747680664, -5.195199966430664, -4.790299892425537, -5.475399971008301, -5.564499855041504, -4.6717000007629395, -5.897500038146973, -5.850599765777588, -5.836299896240234]}, "token.table": {"Topic": [1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2], "Freq": [0.4993891417980194, 0.4993891417980194, 0.3942856788635254, 0.6074130535125732, 0.8978282809257507, 0.10562685877084732, 0.8531381487846375, 0.14218968152999878, 0.15556664764881134, 0.8296887278556824, 0.690776526927948, 0.31196358799934387, 0.7284225821495056, 0.2683662176132202, 0.8640719056129456, 0.1554894894361496, 0.8551921844482422, 0.43701693415641785, 0.5681220293045044, 0.9156144261360168, 0.0763012021780014, 0.8496459722518921, 0.12137799710035324, 0.1548064798116684, 0.9288389086723328, 0.15487335622310638, 0.9292401075363159, 0.27175235748291016, 0.8152570724487305, 0.8065646886825562, 0.20164117217063904, 0.16786517202854156, 0.8393258452415466, 0.1925903707742691, 0.8345583081245422, 0.9107449650764465, 0.1011938825249672, 0.11969219148159027, 0.9575375318527222, 0.2538646459579468, 0.7463977932929993, 0.19330915808677673, 0.837673008441925, 0.15463988482952118, 0.9278392791748047, 0.21677325665950775, 0.867093026638031, 0.2180999219417572, 0.8723996877670288, 0.27162986993789673, 0.8148895502090454, 0.21622224152088165, 0.8648889660835266, 0.07925810664892197, 0.9180730581283569, 0.9114655256271362, 0.07595545798540115, 0.19268898665905, 0.834985613822937, 0.15515008568763733, 0.9309004545211792, 0.15490221977233887, 0.929413378238678, 0.23498938977718353, 0.7832979559898376, 0.1913982778787613, 0.8101043701171875, 0.18129031360149384, 0.9064515829086304, 0.08328493684530258, 0.9161342978477478, 0.30921146273612976, 0.6802651882171631, 0.24630692601203918, 0.7389208078384399, 0.16216593980789185, 0.8571628332138062, 0.2669176459312439, 0.7626218795776367, 0.804573118686676, 0.20542292296886444, 0.10787981003522873, 0.8630384802818298, 0.18056942522525787, 0.9028471112251282, 0.14516359567642212, 0.8709815740585327, 0.9461341500282288, 0.050460487604141235, 0.9608830809593201, 0.04514215886592865, 0.8066598773002625, 0.2016649693250656, 0.4253028929233551, 0.5906984806060791, 0.10836812853813171, 0.8669450283050537, 0.805865466594696, 0.201466366648674, 0.21666286885738373, 0.8666514754295349, 0.8761563301086426, 0.1219964474439621, 0.8266772627830505, 0.17378556728363037, 0.8934397101402283, 0.08122178912162781, 0.946650505065918, 0.03944377228617668, 0.6571400761604309, 0.3417128622531891, 0.8643673658370972, 0.17287348210811615, 0.9142721891403198, 0.08707354217767715, 0.9394791126251221, 0.046973954886198044, 0.9377036690711975, 0.061691030859947205, 0.8538244962692261, 0.14230407774448395, 0.6965047121047974, 0.3028281331062317, 0.8508390188217163, 0.141806498169899, 0.8240193128585815, 0.18883776664733887, 0.96108078956604, 0.03779531270265579, 0.8452014923095703, 0.15524108707904816, 0.18081876635551453, 0.904093861579895, 0.8634998798370361, 0.17269998788833618, 0.7666921019554138, 0.23852641880512238, 0.5525255799293518, 0.4520663917064667, 0.695071816444397, 0.33242565393447876, 0.21705089509487152, 0.8682035803794861, 0.19797967374324799, 0.8909085392951965, 0.21704301238059998, 0.8681720495223999, 0.1101909652352333, 0.8915450572967529, 0.10085693746805191, 0.9077123999595642, 0.18085044622421265, 0.9042521715164185, 0.27175021171569824, 0.81525057554245, 0.19958676397800446, 0.7983470559120178, 0.914416491985321, 0.07620137184858322, 0.18090836703777313, 0.9045418500900269, 0.2720986008644104, 0.8162957429885864, 0.9657871723175049, 0.03262794390320778, 0.8510586619377136, 0.12157981097698212, 0.9141349196434021, 0.07617790997028351, 0.9094161987304688, 0.15156936645507812, 0.46703100204467773, 0.5340689420700073, 0.8758458495140076, 0.1251208335161209, 0.8766726851463318, 0.10115454345941544, 0.8060340881347656, 0.13433901965618134, 0.8646054267883301, 0.13833686709403992, 0.2356971651315689, 0.7679165601730347, 0.6951534152030945, 0.3049493730068207, 0.14219489693641663, 0.853169322013855, 0.1804392784833908, 0.9021963477134705, 0.8061969876289368, 0.2015492469072342, 0.7862623333930969, 0.20511192083358765, 0.21732573211193085, 0.8693029284477234, 0.19961819052696228, 0.7984727621078491, 0.7671476006507874, 0.21309654414653778, 0.5537805557250977, 0.4363119304180145], "Term": ["100daysofcode", "100daysofcode", "ai", "ai", "ai\u30a8\u30f3\u30b8\u30cb\u30a2", "ai\u30a8\u30f3\u30b8\u30cb\u30a2", "bigdata", "bigdata", "bragging", "bragging", "datascience", "datascience", "datascientist", "datascientist", "deep", "deeplearning", "deeplearning", "dena", "dena", "doe", "doe", "freelancestart", "freelancestart", "gcp", "gcp", "golang", "golang", "ibmdojo", "ibmdojo", "ibmspss", "ibmspss", "iot", "iot", "it", "it", "it\u7d4c\u55b6", "it\u7d4c\u55b6", "javascript", "javascript", "kaggle", "kaggle", "kaggleguide", "kaggleguide", "kansaiaipub", "kansaiaipub", "kernel", "kernel", "lightgbm", "lightgbm", "logisticregression", "logisticregression", "machine", "machine", "machinelearning", "machinelearning", "mercariprize", "mercariprize", "ml", "ml", "nodejs", "nodejs", "nodered", "nodered", "note", "note", "python", "python", "pytorch", "pytorch", "santander", "santander", "signate", "signate", "sql", "sql", "superintelligence", "superintelligence", "titanic", "titanic", "uber", "uber", "winning", "winning", "word2vec", "word2vec", "\u306f\u3066\u306a\u30d6\u30ed\u30b0", "\u306f\u3066\u306a\u30d6\u30ed\u30b0", "\u30a4\u30f3\u30bf\u30fc\u30f3", "\u30a4\u30f3\u30bf\u30fc\u30f3", "\u30a4\u30f3\u30bf\u30fc\u30f3\u30b7\u30c3\u30d7", "\u30a4\u30f3\u30bf\u30fc\u30f3\u30b7\u30c3\u30d7", "\u30a8\u30af\u30b9\u30d7\u30ed\u30e9\u30c8\u30ea\u30fc", "\u30a8\u30af\u30b9\u30d7\u30ed\u30e9\u30c8\u30ea\u30fc", "\u30a8\u30f3\u30b8\u30cb\u30a2", "\u30a8\u30f3\u30b8\u30cb\u30a2", "\u30a8\u30f3\u30b8\u30cb\u30a2\u3068\u7e4b\u304c\u308a\u305f\u3044", "\u30a8\u30f3\u30b8\u30cb\u30a2\u3068\u7e4b\u304c\u308a\u305f\u3044", "\u30a8\u30f3\u30b8\u30cb\u30a2\u8ee2\u8077", "\u30a8\u30f3\u30b8\u30cb\u30a2\u8ee2\u8077", "\u30c1\u30e5\u30fc\u30c8\u30ea\u30a2\u30eb", "\u30c1\u30e5\u30fc\u30c8\u30ea\u30a2\u30eb", "\u30c7\u30fc\u30bf\u30b5\u30a4\u30a8\u30f3\u30b9", "\u30c7\u30fc\u30bf\u30b5\u30a4\u30a8\u30f3\u30b9", "\u30c7\u30fc\u30bf\u30b5\u30a4\u30a8\u30f3\u30c6\u30a3\u30b9\u30c8", "\u30c7\u30fc\u30bf\u30b5\u30a4\u30a8\u30f3\u30c6\u30a3\u30b9\u30c8", "\u30c7\u30fc\u30bf\u30b5\u30a4\u30a8\u30f3\u30c6\u30a3\u30b9\u30c8\u3042\u308b\u3042\u308b", "\u30c7\u30fc\u30bf\u30b5\u30a4\u30a8\u30f3\u30c6\u30a3\u30b9\u30c8\u3042\u308b\u3042\u308b", "\u30c7\u30fc\u30bf\u30de\u30a4\u30cb\u30f3\u30b0", "\u30c7\u30fc\u30bf\u30de\u30a4\u30cb\u30f3\u30b0", "\u30c7\u30fc\u30bf\u5206\u6790", "\u30c7\u30fc\u30bf\u5206\u6790", "\u30c7\u30fc\u30bf\u6d3b\u7528", "\u30c7\u30fc\u30bf\u6d3b\u7528", "\u30d0\u30c3\u30af\u30aa\u30d5\u30a3\u30b9", "\u30d0\u30c3\u30af\u30aa\u30d5\u30a3\u30b9", "\u30d3\u30b8\u30cd\u30b9\u7d71\u8a08", "\u30d3\u30b8\u30cd\u30b9\u7d71\u8a08", "\u30d3\u30c3\u30b0\u30c7\u30fc\u30bf", "\u30d3\u30c3\u30b0\u30c7\u30fc\u30bf", "\u30d5\u30ea\u30fc\u30e9\u30f3\u30b9", "\u30d5\u30ea\u30fc\u30e9\u30f3\u30b9", "\u30d7\u30ed\u30b0\u30e9\u30df\u30f3\u30b0\u521d\u5fc3\u8005", "\u30d7\u30ed\u30b0\u30e9\u30df\u30f3\u30b0\u521d\u5fc3\u8005", "\u30d7\u30ed\u30b0\u30e9\u30df\u30f3\u30b0\u5b66\u7fd2", "\u30d7\u30ed\u30b0\u30e9\u30df\u30f3\u30b0\u5b66\u7fd2", "\u30de\u30af\u30ed\u7d4c\u6e08\u5b66", "\u30de\u30af\u30ed\u7d4c\u6e08\u5b66", "\u30de\u30fc\u30b1\u30c6\u30a3\u30f3\u30b0", "\u30de\u30fc\u30b1\u30c6\u30a3\u30f3\u30b0", "\u30df\u30af\u30ed\u7d4c\u6e08\u5b66", "\u30df\u30af\u30ed\u7d4c\u6e08\u5b66", "\u30e1\u30eb\u30ab\u30ea", "\u30e1\u30eb\u30ab\u30ea", "\u30ec\u30b3\u30e1\u30f3\u30c9", "\u30ec\u30b3\u30e1\u30f3\u30c9", "\u4ea4\u901a\u7d4c\u6e08", "\u4ea4\u901a\u7d4c\u6e08", "\u4eba\u5de5\u77e5\u80fd", "\u4eba\u5de5\u77e5\u80fd", "\u4eca\u65e5\u306e\u7a4d\u307f\u4e0a\u3052", "\u4eca\u65e5\u306e\u7a4d\u307f\u4e0a\u3052", "\u521d\u5fc3\u8005\u5411\u3051", "\u521d\u5fc3\u8005\u5411\u3051", "\u52c9\u5f37\u4f1a", "\u52c9\u5f37\u4f1a", "\u5730\u57df\u79d1\u5b66", "\u5730\u57df\u79d1\u5b66", "\u5916\u8cc7\u7cfb", "\u5916\u8cc7\u7cfb", "\u5916\u8cc7\u7cfb\u4f01\u696d", "\u5916\u8cc7\u7cfb\u4f01\u696d", "\u5927\u5b66\u767a", "\u5927\u5b66\u767a", "\u5927\u5b66\u9662\u4fee\u58eb", "\u5927\u5b66\u9662\u4fee\u58eb", "\u5927\u962a", "\u5927\u962a", "\u5b9f\u9a13\u8a08\u753b\u6cd5", "\u5b9f\u9a13\u8a08\u753b\u6cd5", "\u6280\u8853\u66f8\u5178", "\u6280\u8853\u66f8\u5178", "\u6295\u7968", "\u6295\u7968", "\u6642\u7d661000\u5186", "\u6642\u7d661000\u5186", "\u6771\u4eac\u90fd\u6e0b\u8c37\u533a", "\u6771\u4eac\u90fd\u6e0b\u8c37\u533a", "\u6771\u4eac\u90fd\u6e2f\u533a", "\u6771\u4eac\u90fd\u6e2f\u533a", "\u6848\u4ef6\u76f8\u5834", "\u6848\u4ef6\u76f8\u5834", "\u6a5f\u68b0\u5b66\u7fd2", "\u6a5f\u68b0\u5b66\u7fd2", "\u6a5f\u68b0\u5b66\u7fd2\u30a8\u30f3\u30b8\u30cb\u30a2", "\u6a5f\u68b0\u5b66\u7fd2\u30a8\u30f3\u30b8\u30cb\u30a2", "\u6c42\u4eba", "\u6c42\u4eba", "\u7b4b\u30c8\u30ec", "\u7b4b\u30c8\u30ec", "\u7d4c\u6e08\u5b66\u5f92", "\u7d4c\u6e08\u5b66\u5f92", "\u7d71\u8a08", "\u7d71\u8a08", "\u7d71\u8a08\u5b66", "\u7d71\u8a08\u5b66", "\u7d71\u8a08\u5b66\u5c02\u653b", "\u7d71\u8a08\u5b66\u5c02\u653b", "\u8133\u6ce2", "\u8133\u6ce2", "\u897f\u7530\u52d8\u4e00\u90ce", "\u897f\u7530\u52d8\u4e00\u90ce", "\u90fd\u5e02\u7d4c\u6e08", "\u90fd\u5e02\u7d4c\u6e08", "\u91cf\u5b50\u30b3\u30f3\u30d4\u30e5\u30fc\u30bf", "\u91cf\u5b50\u30b3\u30f3\u30d4\u30e5\u30fc\u30bf", "\u95a2\u897f", "\u95a2\u897f", "\u99c6\u3051\u51fa\u3057\u30a8\u30f3\u30b8\u30cb\u30a2", "\u99c6\u3051\u51fa\u3057\u30a8\u30f3\u30b8\u30cb\u30a2", "\u99c6\u3051\u51fa\u3057\u30a8\u30f3\u30b8\u30cb\u30a2\u3068\u7e4b\u304c\u308a\u305f\u3044", "\u99c6\u3051\u51fa\u3057\u30a8\u30f3\u30b8\u30cb\u30a2\u3068\u7e4b\u304c\u308a\u305f\u3044"]}, "R": 30, "lambda.step": 0.01, "plot.opts": {"xlab": "PC1", "ylab": "PC2"}, "topic.order": [1, 2]};
 9 | 
10 | function LDAvis_load_lib(url, callback){
11 |   var s = document.createElement('script');
12 |   s.src = url;
13 |   s.async = true;
14 |   s.onreadystatechange = s.onload = callback;
15 |   s.onerror = function(){console.warn("failed to load library " + url);};
16 |   document.getElementsByTagName("head")[0].appendChild(s);
17 | }
18 | 
19 | if(typeof(LDAvis) !== "undefined"){
20 |    // already loaded: just create the visualization
21 |    !function(LDAvis){
22 |        new LDAvis("#" + "ldavis_el9495029960344908182359", ldavis_el9495029960344908182359_data);
23 |    }(LDAvis);
24 | }else if(typeof define === "function" && define.amd){
25 |    // require.js is available: use it to load d3/LDAvis
26 |    require.config({paths: {d3: "https://cdnjs.cloudflare.com/ajax/libs/d3/3.5.5/d3.min"}});
27 |    require(["d3"], function(d3){
28 |       window.d3 = d3;
29 |       LDAvis_load_lib("https://cdn.rawgit.com/bmabey/pyLDAvis/files/ldavis.v1.0.0.js", function(){
30 |         new LDAvis("#" + "ldavis_el9495029960344908182359", ldavis_el9495029960344908182359_data);
31 |       });
32 |     });
33 | }else{
34 |     // require.js not available: dynamically load d3 & LDAvis
35 |     LDAvis_load_lib("https://cdnjs.cloudflare.com/ajax/libs/d3/3.5.5/d3.min.js", function(){
36 |          LDAvis_load_lib("https://cdn.rawgit.com/bmabey/pyLDAvis/files/ldavis.v1.0.0.js", function(){
37 |                  new LDAvis("#" + "ldavis_el9495029960344908182359", ldavis_el9495029960344908182359_data);
38 |             })
39 |          });
40 | }
41 | </script>


--------------------------------------------------------------------------------
/nlp/twitter_analytics_using_nlplot/merge_data.ipynb:
--------------------------------------------------------------------------------
   1 | {
   2 |  "cells": [
   3 |   {
   4 |    "cell_type": "code",
   5 |    "execution_count": 1,
   6 |    "metadata": {},
   7 |    "outputs": [],
   8 |    "source": [
   9 |     "import pandas as pd"
  10 |    ]
  11 |   },
  12 |   {
  13 |    "cell_type": "code",
  14 |    "execution_count": 13,
  15 |    "metadata": {},
  16 |    "outputs": [],
  17 |    "source": [
  18 |     "df1 = pd.read_csv('twitter_ai.csv')\n",
  19 |     "df2 = pd.read_csv('twitter_ds.csv')\n",
  20 |     "df3 = pd.read_csv('twitter_kaggle.csv')\n",
  21 |     "df4 = pd.read_csv('twitter_python.csv')"
  22 |    ]
  23 |   },
  24 |   {
  25 |    "cell_type": "code",
  26 |    "execution_count": 14,
  27 |    "metadata": {},
  28 |    "outputs": [
  29 |     {
  30 |      "data": {
  31 |       "text/html": [
  32 |        "<div>\n",
  33 |        "<style scoped>\n",
  34 |        "    .dataframe tbody tr th:only-of-type {\n",
  35 |        "        vertical-align: middle;\n",
  36 |        "    }\n",
  37 |        "\n",
  38 |        "    .dataframe tbody tr th {\n",
  39 |        "        vertical-align: top;\n",
  40 |        "    }\n",
  41 |        "\n",
  42 |        "    .dataframe thead th {\n",
  43 |        "        text-align: right;\n",
  44 |        "    }\n",
  45 |        "</style>\n",
  46 |        "<table border=\"1\" class=\"dataframe\">\n",
  47 |        "  <thead>\n",
  48 |        "    <tr style=\"text-align: right;\">\n",
  49 |        "      <th></th>\n",
  50 |        "      <th>searched_for</th>\n",
  51 |        "      <th>post_url</th>\n",
  52 |        "      <th>post</th>\n",
  53 |        "      <th>user</th>\n",
  54 |        "      <th>post_time</th>\n",
  55 |        "      <th>hashtags</th>\n",
  56 |        "      <th>hashtag_len</th>\n",
  57 |        "    </tr>\n",
  58 |        "  </thead>\n",
  59 |        "  <tbody>\n",
  60 |        "    <tr>\n",
  61 |        "      <th>0</th>\n",
  62 |        "      <td>#人工知能</td>\n",
  63 |        "      <td>https://twitter.com/benrishi1/status/125772625...</td>\n",
  64 |        "      <td>経営者が知るべき人工知能が生むビジネスチャンスを つかむための戦略とは？ \\nhttps:/...</td>\n",
  65 |        "      <td>人工知能、機械学習、ＩｏＴニュース</td>\n",
  66 |        "      <td>1.588700e+09</td>\n",
  67 |        "      <td>機械学習 ai iot 人工知能</td>\n",
  68 |        "      <td>4</td>\n",
  69 |        "    </tr>\n",
  70 |        "    <tr>\n",
  71 |        "      <th>1</th>\n",
  72 |        "      <td>#人工知能</td>\n",
  73 |        "      <td>https://twitter.com/ciwame_mizuo/status/124367...</td>\n",
  74 |        "      <td>AIで風景を作る\\niteration/epoch: 11000/2\\n#makeingla...</td>\n",
  75 |        "      <td>みずお</td>\n",
  76 |        "      <td>NaN</td>\n",
  77 |        "      <td>makeinglandscape deeplearning nowlearning ai g...</td>\n",
  78 |        "      <td>6</td>\n",
  79 |        "    </tr>\n",
  80 |        "    <tr>\n",
  81 |        "      <th>2</th>\n",
  82 |        "      <td>#人工知能</td>\n",
  83 |        "      <td>https://twitter.com/sachi_n1020/status/1257695...</td>\n",
  84 |        "      <td>主婦だけど、何か仕事をしたいと思ってませんか？\\nスマホ片手で在宅でできますよ〜\\n#副業 ...</td>\n",
  85 |        "      <td>naru@相互フォロー</td>\n",
  86 |        "      <td>1.588693e+09</td>\n",
  87 |        "      <td>働き方改革 副業探しています 集客 インターネット 社会問題 環境問題 相互フォロー ai ...</td>\n",
  88 |        "      <td>11</td>\n",
  89 |        "    </tr>\n",
  90 |        "    <tr>\n",
  91 |        "      <th>3</th>\n",
  92 |        "      <td>#人工知能</td>\n",
  93 |        "      <td>https://twitter.com/JohnnyFakaHioki/status/124...</td>\n",
  94 |        "      <td>シンギュラリティ後の世界が明るく楽しいものなら、その日を待つためだけに25年生きてもいいな。...</td>\n",
  95 |        "      <td>草木の妖精-ジョニー・フローラ -Johnny Flora-</td>\n",
  96 |        "      <td>NaN</td>\n",
  97 |        "      <td>シンギュラリティ 人工知能</td>\n",
  98 |        "      <td>2</td>\n",
  99 |        "    </tr>\n",
 100 |        "    <tr>\n",
 101 |        "      <th>4</th>\n",
 102 |        "      <td>#人工知能</td>\n",
 103 |        "      <td>https://twitter.com/kawachanaccount/status/125...</td>\n",
 104 |        "      <td>AIは恋する　#小説　#SF　#人工知能　#プログラマー\\nhttps://t.co/oQz...</td>\n",
 105 |        "      <td>KAWAMURA小説アカウント</td>\n",
 106 |        "      <td>1.588693e+09</td>\n",
 107 |        "      <td>小説 プログラマー sf 人工知能</td>\n",
 108 |        "      <td>4</td>\n",
 109 |        "    </tr>\n",
 110 |        "    <tr>\n",
 111 |        "      <th>...</th>\n",
 112 |        "      <td>...</td>\n",
 113 |        "      <td>...</td>\n",
 114 |        "      <td>...</td>\n",
 115 |        "      <td>...</td>\n",
 116 |        "      <td>...</td>\n",
 117 |        "      <td>...</td>\n",
 118 |        "      <td>...</td>\n",
 119 |        "    </tr>\n",
 120 |        "    <tr>\n",
 121 |        "      <th>6507</th>\n",
 122 |        "      <td>#人工知能</td>\n",
 123 |        "      <td>https://twitter.com/ciwame_mizuo/status/124368...</td>\n",
 124 |        "      <td>AIで風景を作る\\niteration/epoch: 12000/2\\n#makeingla...</td>\n",
 125 |        "      <td>みずお</td>\n",
 126 |        "      <td>NaN</td>\n",
 127 |        "      <td>makeinglandscape deeplearning nowlearning ai g...</td>\n",
 128 |        "      <td>6</td>\n",
 129 |        "    </tr>\n",
 130 |        "    <tr>\n",
 131 |        "      <th>6508</th>\n",
 132 |        "      <td>#人工知能</td>\n",
 133 |        "      <td>https://twitter.com/KyukyokuCom/status/1243682...</td>\n",
 134 |        "      <td>人工知能（AI）が米国、数百万人の職を奪う！「やりすぎ都市伝説で言ってた人類選別がはじまる？...</td>\n",
 135 |        "      <td>究極のまとめ.com</td>\n",
 136 |        "      <td>NaN</td>\n",
 137 |        "      <td>都市伝説 やりすぎ都市伝説 ai 人工知能</td>\n",
 138 |        "      <td>4</td>\n",
 139 |        "    </tr>\n",
 140 |        "    <tr>\n",
 141 |        "      <th>6509</th>\n",
 142 |        "      <td>#人工知能</td>\n",
 143 |        "      <td>https://twitter.com/InfoAI4/status/12436819956...</td>\n",
 144 |        "      <td>「なぜ」を理解するAIの構築を、あの人工知能の第一人者は目指している｜https://t.c...</td>\n",
 145 |        "      <td>Info_AI</td>\n",
 146 |        "      <td>NaN</td>\n",
 147 |        "      <td>ai 人工知能</td>\n",
 148 |        "      <td>2</td>\n",
 149 |        "    </tr>\n",
 150 |        "    <tr>\n",
 151 |        "      <th>6510</th>\n",
 152 |        "      <td>#人工知能</td>\n",
 153 |        "      <td>https://twitter.com/meza_janken/status/1243679...</td>\n",
 154 |        "      <td>【2戦目】めざましじゃんけん結果速報：\\nチョキ✌でした。グー✊が勝ちです。\\n今回の相手：...</td>\n",
 155 |        "      <td>めざましじゃんけん結果速報</td>\n",
 156 |        "      <td>NaN</td>\n",
 157 |        "      <td>めざましじゃんけん じゃんけん みきいえ ゆりやんレトリィバァ めざましどようび めざましテ...</td>\n",
 158 |        "      <td>9</td>\n",
 159 |        "    </tr>\n",
 160 |        "    <tr>\n",
 161 |        "      <th>6511</th>\n",
 162 |        "      <td>#人工知能</td>\n",
 163 |        "      <td>https://twitter.com/meza_janken/status/1243678...</td>\n",
 164 |        "      <td>学習中の人工知能なので、とても低い勝率です。\\n次回3月28日 【2戦目】のじゃんけん予想は...</td>\n",
 165 |        "      <td>めざましじゃんけん結果速報</td>\n",
 166 |        "      <td>NaN</td>\n",
 167 |        "      <td>めざましじゃんけん じゃんけん opencv keras raspberrypi rnn め...</td>\n",
 168 |        "      <td>11</td>\n",
 169 |        "    </tr>\n",
 170 |        "  </tbody>\n",
 171 |        "</table>\n",
 172 |        "<p>6512 rows × 7 columns</p>\n",
 173 |        "</div>"
 174 |       ],
 175 |       "text/plain": [
 176 |        "     searched_for                                           post_url  \\\n",
 177 |        "0           #人工知能  https://twitter.com/benrishi1/status/125772625...   \n",
 178 |        "1           #人工知能  https://twitter.com/ciwame_mizuo/status/124367...   \n",
 179 |        "2           #人工知能  https://twitter.com/sachi_n1020/status/1257695...   \n",
 180 |        "3           #人工知能  https://twitter.com/JohnnyFakaHioki/status/124...   \n",
 181 |        "4           #人工知能  https://twitter.com/kawachanaccount/status/125...   \n",
 182 |        "...           ...                                                ...   \n",
 183 |        "6507        #人工知能  https://twitter.com/ciwame_mizuo/status/124368...   \n",
 184 |        "6508        #人工知能  https://twitter.com/KyukyokuCom/status/1243682...   \n",
 185 |        "6509        #人工知能  https://twitter.com/InfoAI4/status/12436819956...   \n",
 186 |        "6510        #人工知能  https://twitter.com/meza_janken/status/1243679...   \n",
 187 |        "6511        #人工知能  https://twitter.com/meza_janken/status/1243678...   \n",
 188 |        "\n",
 189 |        "                                                   post  \\\n",
 190 |        "0     経営者が知るべき人工知能が生むビジネスチャンスを つかむための戦略とは？ \\nhttps:/...   \n",
 191 |        "1     AIで風景を作る\\niteration/epoch: 11000/2\\n#makeingla...   \n",
 192 |        "2     主婦だけど、何か仕事をしたいと思ってませんか？\\nスマホ片手で在宅でできますよ〜\\n#副業 ...   \n",
 193 |        "3     シンギュラリティ後の世界が明るく楽しいものなら、その日を待つためだけに25年生きてもいいな。...   \n",
 194 |        "4     AIは恋する　#小説　#SF　#人工知能　#プログラマー\\nhttps://t.co/oQz...   \n",
 195 |        "...                                                 ...   \n",
 196 |        "6507  AIで風景を作る\\niteration/epoch: 12000/2\\n#makeingla...   \n",
 197 |        "6508  人工知能（AI）が米国、数百万人の職を奪う！「やりすぎ都市伝説で言ってた人類選別がはじまる？...   \n",
 198 |        "6509  「なぜ」を理解するAIの構築を、あの人工知能の第一人者は目指している｜https://t.c...   \n",
 199 |        "6510  【2戦目】めざましじゃんけん結果速報：\\nチョキ✌でした。グー✊が勝ちです。\\n今回の相手：...   \n",
 200 |        "6511  学習中の人工知能なので、とても低い勝率です。\\n次回3月28日 【2戦目】のじゃんけん予想は...   \n",
 201 |        "\n",
 202 |        "                                user     post_time  \\\n",
 203 |        "0                  人工知能、機械学習、ＩｏＴニュース  1.588700e+09   \n",
 204 |        "1                                みずお           NaN   \n",
 205 |        "2                        naru@相互フォロー  1.588693e+09   \n",
 206 |        "3     草木の妖精-ジョニー・フローラ -Johnny Flora-           NaN   \n",
 207 |        "4                    KAWAMURA小説アカウント  1.588693e+09   \n",
 208 |        "...                              ...           ...   \n",
 209 |        "6507                             みずお           NaN   \n",
 210 |        "6508                      究極のまとめ.com           NaN   \n",
 211 |        "6509                         Info_AI           NaN   \n",
 212 |        "6510                   めざましじゃんけん結果速報           NaN   \n",
 213 |        "6511                   めざましじゃんけん結果速報           NaN   \n",
 214 |        "\n",
 215 |        "                                               hashtags  hashtag_len  \n",
 216 |        "0                                      機械学習 ai iot 人工知能            4  \n",
 217 |        "1     makeinglandscape deeplearning nowlearning ai g...            6  \n",
 218 |        "2     働き方改革 副業探しています 集客 インターネット 社会問題 環境問題 相互フォロー ai ...           11  \n",
 219 |        "3                                         シンギュラリティ 人工知能            2  \n",
 220 |        "4                                     小説 プログラマー sf 人工知能            4  \n",
 221 |        "...                                                 ...          ...  \n",
 222 |        "6507  makeinglandscape deeplearning nowlearning ai g...            6  \n",
 223 |        "6508                              都市伝説 やりすぎ都市伝説 ai 人工知能            4  \n",
 224 |        "6509                                            ai 人工知能            2  \n",
 225 |        "6510  めざましじゃんけん じゃんけん みきいえ ゆりやんレトリィバァ めざましどようび めざましテ...            9  \n",
 226 |        "6511  めざましじゃんけん じゃんけん opencv keras raspberrypi rnn め...           11  \n",
 227 |        "\n",
 228 |        "[6512 rows x 7 columns]"
 229 |       ]
 230 |      },
 231 |      "execution_count": 14,
 232 |      "metadata": {},
 233 |      "output_type": "execute_result"
 234 |     }
 235 |    ],
 236 |    "source": [
 237 |     "df1"
 238 |    ]
 239 |   },
 240 |   {
 241 |    "cell_type": "code",
 242 |    "execution_count": 15,
 243 |    "metadata": {},
 244 |    "outputs": [
 245 |     {
 246 |      "data": {
 247 |       "text/html": [
 248 |        "<div>\n",
 249 |        "<style scoped>\n",
 250 |        "    .dataframe tbody tr th:only-of-type {\n",
 251 |        "        vertical-align: middle;\n",
 252 |        "    }\n",
 253 |        "\n",
 254 |        "    .dataframe tbody tr th {\n",
 255 |        "        vertical-align: top;\n",
 256 |        "    }\n",
 257 |        "\n",
 258 |        "    .dataframe thead th {\n",
 259 |        "        text-align: right;\n",
 260 |        "    }\n",
 261 |        "</style>\n",
 262 |        "<table border=\"1\" class=\"dataframe\">\n",
 263 |        "  <thead>\n",
 264 |        "    <tr style=\"text-align: right;\">\n",
 265 |        "      <th></th>\n",
 266 |        "      <th>searched_for</th>\n",
 267 |        "      <th>post_url</th>\n",
 268 |        "      <th>post</th>\n",
 269 |        "      <th>user</th>\n",
 270 |        "      <th>post_time</th>\n",
 271 |        "      <th>hashtags</th>\n",
 272 |        "      <th>hashtag_len</th>\n",
 273 |        "    </tr>\n",
 274 |        "  </thead>\n",
 275 |        "  <tbody>\n",
 276 |        "    <tr>\n",
 277 |        "      <th>0</th>\n",
 278 |        "      <td>#データサイエンティスト</td>\n",
 279 |        "      <td>https://twitter.com/K03475916/status/125781058...</td>\n",
 280 |        "      <td>#今日の積み上げ\\n・Udemy中級編7.8\\n・DS養成講座30回31回課題\\n・prog...</td>\n",
 281 |        "      <td>K</td>\n",
 282 |        "      <td>1.588720e+09</td>\n",
 283 |        "      <td>筋トレ 今日の積み上げ 駆け出しエンジニアと繋がりたい データサイエンティスト</td>\n",
 284 |        "      <td>4</td>\n",
 285 |        "    </tr>\n",
 286 |        "    <tr>\n",
 287 |        "      <th>1</th>\n",
 288 |        "      <td>#データサイエンティスト</td>\n",
 289 |        "      <td>https://twitter.com/ponpoko_code/status/844690...</td>\n",
 290 |        "      <td>データ分析って給料高いな～。人材不足らしい。統計学、プログラミングに加えて人工知能も出来ると...</td>\n",
 291 |        "      <td>ぽんぽこ@プロぽこ-プログラミング</td>\n",
 292 |        "      <td>NaN</td>\n",
 293 |        "      <td>統計学 人工知能 ダイヤモンド データサイエンティスト プログラミング</td>\n",
 294 |        "      <td>5</td>\n",
 295 |        "    </tr>\n",
 296 |        "    <tr>\n",
 297 |        "      <th>2</th>\n",
 298 |        "      <td>#データサイエンティスト</td>\n",
 299 |        "      <td>https://twitter.com/sazan_dora/status/79743408...</td>\n",
 300 |        "      <td>データサイエンティストになりたい人向けまとめ - NAVER まとめ https://t.c...</td>\n",
 301 |        "      <td>サザンドラ</td>\n",
 302 |        "      <td>NaN</td>\n",
 303 |        "      <td>データマイニング データサイエンス データサイエンティスト</td>\n",
 304 |        "      <td>3</td>\n",
 305 |        "    </tr>\n",
 306 |        "    <tr>\n",
 307 |        "      <th>3</th>\n",
 308 |        "      <td>#データサイエンティスト</td>\n",
 309 |        "      <td>https://twitter.com/WXBC_jp/status/11302604362...</td>\n",
 310 |        "      <td>【#野球 ネタ⚾️】\\n\\n#ヤクルトスワローズ の #山田哲人 選手の成績データを、気温・...</td>\n",
 311 |        "      <td>気象ビジネス推進コンソーシアム（略称：WXBC,事務局：気象庁）</td>\n",
 312 |        "      <td>NaN</td>\n",
 313 |        "      <td>山田哲人 気象 データサイエンティスト ヤクルトスワローズ</td>\n",
 314 |        "      <td>4</td>\n",
 315 |        "    </tr>\n",
 316 |        "    <tr>\n",
 317 |        "      <th>4</th>\n",
 318 |        "      <td>#データサイエンティスト</td>\n",
 319 |        "      <td>https://twitter.com/hamahiroshi164/status/1257...</td>\n",
 320 |        "      <td>「データサイエンティストを目指す人のzoom飲み会」終わりました💡\\n\\n現場のリアルが知れ...</td>\n",
 321 |        "      <td>DSになる男ハマヒロシ30歳子煩悩</td>\n",
 322 |        "      <td>1.588689e+09</td>\n",
 323 |        "      <td>プログラミング初心者 データサイエンティスト</td>\n",
 324 |        "      <td>2</td>\n",
 325 |        "    </tr>\n",
 326 |        "    <tr>\n",
 327 |        "      <th>...</th>\n",
 328 |        "      <td>...</td>\n",
 329 |        "      <td>...</td>\n",
 330 |        "      <td>...</td>\n",
 331 |        "      <td>...</td>\n",
 332 |        "      <td>...</td>\n",
 333 |        "      <td>...</td>\n",
 334 |        "      <td>...</td>\n",
 335 |        "    </tr>\n",
 336 |        "    <tr>\n",
 337 |        "      <th>1484</th>\n",
 338 |        "      <td>#データサイエンティスト</td>\n",
 339 |        "      <td>https://twitter.com/Iggjj21/status/12162382360...</td>\n",
 340 |        "      <td>#今日の積み上げ \\n\\n✔️PYQでpandasの演習\\n→主に表の作成方法\\n✔️cou...</td>\n",
 341 |        "      <td>ゆう|新社会人エンジニア</td>\n",
 342 |        "      <td>NaN</td>\n",
 343 |        "      <td>駆け出しエンジニア python 今日の積み上げ 機械学習 データサイエンティスト ai 駆...</td>\n",
 344 |        "      <td>7</td>\n",
 345 |        "    </tr>\n",
 346 |        "    <tr>\n",
 347 |        "      <th>1485</th>\n",
 348 |        "      <td>#データサイエンティスト</td>\n",
 349 |        "      <td>https://twitter.com/fumi_bz/status/10116001000...</td>\n",
 350 |        "      <td>Agile HR Day にて。そもそもいないデータサイエンティスト人材‥っていう、スライド...</td>\n",
 351 |        "      <td>fumi@HR Tech商品企画</td>\n",
 352 |        "      <td>NaN</td>\n",
 353 |        "      <td>機械学習 hrtech ディープラーニング データサイエンティスト</td>\n",
 354 |        "      <td>4</td>\n",
 355 |        "    </tr>\n",
 356 |        "    <tr>\n",
 357 |        "      <th>1486</th>\n",
 358 |        "      <td>#データサイエンティスト</td>\n",
 359 |        "      <td>https://twitter.com/joe_i/status/1794720198705...</td>\n",
 360 |        "      <td>#データサイエンティスト 不足の問題は昨日も話題に上がってましたが、本当にそうですよねー。昨...</td>\n",
 361 |        "      <td>石山 城 / Joe ISHIYAMA</td>\n",
 362 |        "      <td>NaN</td>\n",
 363 |        "      <td>データサイエンティスト opencu</td>\n",
 364 |        "      <td>2</td>\n",
 365 |        "    </tr>\n",
 366 |        "    <tr>\n",
 367 |        "      <th>1487</th>\n",
 368 |        "      <td>#データサイエンティスト</td>\n",
 369 |        "      <td>https://twitter.com/intern_aogaku/status/79775...</td>\n",
 370 |        "      <td>統計学を学ぶ学生必見！\\n\\nIoT企業でデータサイエンティストの有給インターンシップ募集！...</td>\n",
 371 |        "      <td>青山学院大学 インターン就活おすすめ情報</td>\n",
 372 |        "      <td>NaN</td>\n",
 373 |        "      <td>インターンシップ インターン マーケティング データサイエンス データサイエンティスト 統計...</td>\n",
 374 |        "      <td>7</td>\n",
 375 |        "    </tr>\n",
 376 |        "    <tr>\n",
 377 |        "      <th>1488</th>\n",
 378 |        "      <td>#データサイエンティスト</td>\n",
 379 |        "      <td>https://twitter.com/shibaurakogyo_u/status/797...</td>\n",
 380 |        "      <td>統計学を学ぶ学生必見！\\n\\nIoT企業でデータサイエンティストの有給インターンシップ募集！...</td>\n",
 381 |        "      <td>芝浦工業大学 インターン就活おすすめ情報</td>\n",
 382 |        "      <td>NaN</td>\n",
 383 |        "      <td>インターンシップ インターン マーケティング データサイエンス データサイエンティスト 統計...</td>\n",
 384 |        "      <td>7</td>\n",
 385 |        "    </tr>\n",
 386 |        "  </tbody>\n",
 387 |        "</table>\n",
 388 |        "<p>1489 rows × 7 columns</p>\n",
 389 |        "</div>"
 390 |       ],
 391 |       "text/plain": [
 392 |        "      searched_for                                           post_url  \\\n",
 393 |        "0     #データサイエンティスト  https://twitter.com/K03475916/status/125781058...   \n",
 394 |        "1     #データサイエンティスト  https://twitter.com/ponpoko_code/status/844690...   \n",
 395 |        "2     #データサイエンティスト  https://twitter.com/sazan_dora/status/79743408...   \n",
 396 |        "3     #データサイエンティスト  https://twitter.com/WXBC_jp/status/11302604362...   \n",
 397 |        "4     #データサイエンティスト  https://twitter.com/hamahiroshi164/status/1257...   \n",
 398 |        "...            ...                                                ...   \n",
 399 |        "1484  #データサイエンティスト  https://twitter.com/Iggjj21/status/12162382360...   \n",
 400 |        "1485  #データサイエンティスト  https://twitter.com/fumi_bz/status/10116001000...   \n",
 401 |        "1486  #データサイエンティスト  https://twitter.com/joe_i/status/1794720198705...   \n",
 402 |        "1487  #データサイエンティスト  https://twitter.com/intern_aogaku/status/79775...   \n",
 403 |        "1488  #データサイエンティスト  https://twitter.com/shibaurakogyo_u/status/797...   \n",
 404 |        "\n",
 405 |        "                                                   post  \\\n",
 406 |        "0     #今日の積み上げ\\n・Udemy中級編7.8\\n・DS養成講座30回31回課題\\n・prog...   \n",
 407 |        "1     データ分析って給料高いな～。人材不足らしい。統計学、プログラミングに加えて人工知能も出来ると...   \n",
 408 |        "2     データサイエンティストになりたい人向けまとめ - NAVER まとめ https://t.c...   \n",
 409 |        "3     【#野球 ネタ⚾️】\\n\\n#ヤクルトスワローズ の #山田哲人 選手の成績データを、気温・...   \n",
 410 |        "4     「データサイエンティストを目指す人のzoom飲み会」終わりました💡\\n\\n現場のリアルが知れ...   \n",
 411 |        "...                                                 ...   \n",
 412 |        "1484  #今日の積み上げ \\n\\n✔️PYQでpandasの演習\\n→主に表の作成方法\\n✔️cou...   \n",
 413 |        "1485  Agile HR Day にて。そもそもいないデータサイエンティスト人材‥っていう、スライド...   \n",
 414 |        "1486  #データサイエンティスト 不足の問題は昨日も話題に上がってましたが、本当にそうですよねー。昨...   \n",
 415 |        "1487  統計学を学ぶ学生必見！\\n\\nIoT企業でデータサイエンティストの有給インターンシップ募集！...   \n",
 416 |        "1488  統計学を学ぶ学生必見！\\n\\nIoT企業でデータサイエンティストの有給インターンシップ募集！...   \n",
 417 |        "\n",
 418 |        "                                  user     post_time  \\\n",
 419 |        "0                                    K  1.588720e+09   \n",
 420 |        "1                    ぽんぽこ@プロぽこ-プログラミング           NaN   \n",
 421 |        "2                                サザンドラ           NaN   \n",
 422 |        "3     気象ビジネス推進コンソーシアム（略称：WXBC,事務局：気象庁）           NaN   \n",
 423 |        "4                    DSになる男ハマヒロシ30歳子煩悩  1.588689e+09   \n",
 424 |        "...                                ...           ...   \n",
 425 |        "1484                      ゆう|新社会人エンジニア           NaN   \n",
 426 |        "1485                  fumi@HR Tech商品企画           NaN   \n",
 427 |        "1486               石山 城 / Joe ISHIYAMA           NaN   \n",
 428 |        "1487              青山学院大学 インターン就活おすすめ情報           NaN   \n",
 429 |        "1488              芝浦工業大学 インターン就活おすすめ情報           NaN   \n",
 430 |        "\n",
 431 |        "                                               hashtags  hashtag_len  \n",
 432 |        "0               筋トレ 今日の積み上げ 駆け出しエンジニアと繋がりたい データサイエンティスト            4  \n",
 433 |        "1                   統計学 人工知能 ダイヤモンド データサイエンティスト プログラミング            5  \n",
 434 |        "2                         データマイニング データサイエンス データサイエンティスト            3  \n",
 435 |        "3                         山田哲人 気象 データサイエンティスト ヤクルトスワローズ            4  \n",
 436 |        "4                                プログラミング初心者 データサイエンティスト            2  \n",
 437 |        "...                                                 ...          ...  \n",
 438 |        "1484  駆け出しエンジニア python 今日の積み上げ 機械学習 データサイエンティスト ai 駆...            7  \n",
 439 |        "1485                  機械学習 hrtech ディープラーニング データサイエンティスト            4  \n",
 440 |        "1486                                 データサイエンティスト opencu            2  \n",
 441 |        "1487  インターンシップ インターン マーケティング データサイエンス データサイエンティスト 統計...            7  \n",
 442 |        "1488  インターンシップ インターン マーケティング データサイエンス データサイエンティスト 統計...            7  \n",
 443 |        "\n",
 444 |        "[1489 rows x 7 columns]"
 445 |       ]
 446 |      },
 447 |      "execution_count": 15,
 448 |      "metadata": {},
 449 |      "output_type": "execute_result"
 450 |     }
 451 |    ],
 452 |    "source": [
 453 |     "df2"
 454 |    ]
 455 |   },
 456 |   {
 457 |    "cell_type": "code",
 458 |    "execution_count": 16,
 459 |    "metadata": {},
 460 |    "outputs": [
 461 |     {
 462 |      "data": {
 463 |       "text/html": [
 464 |        "<div>\n",
 465 |        "<style scoped>\n",
 466 |        "    .dataframe tbody tr th:only-of-type {\n",
 467 |        "        vertical-align: middle;\n",
 468 |        "    }\n",
 469 |        "\n",
 470 |        "    .dataframe tbody tr th {\n",
 471 |        "        vertical-align: top;\n",
 472 |        "    }\n",
 473 |        "\n",
 474 |        "    .dataframe thead th {\n",
 475 |        "        text-align: right;\n",
 476 |        "    }\n",
 477 |        "</style>\n",
 478 |        "<table border=\"1\" class=\"dataframe\">\n",
 479 |        "  <thead>\n",
 480 |        "    <tr style=\"text-align: right;\">\n",
 481 |        "      <th></th>\n",
 482 |        "      <th>searched_for</th>\n",
 483 |        "      <th>post_url</th>\n",
 484 |        "      <th>post</th>\n",
 485 |        "      <th>user</th>\n",
 486 |        "      <th>post_time</th>\n",
 487 |        "      <th>hashtags</th>\n",
 488 |        "      <th>hashtag_len</th>\n",
 489 |        "    </tr>\n",
 490 |        "  </thead>\n",
 491 |        "  <tbody>\n",
 492 |        "    <tr>\n",
 493 |        "      <th>0</th>\n",
 494 |        "      <td>#kaggle</td>\n",
 495 |        "      <td>https://twitter.com/AbeShumpei/status/11002246...</td>\n",
 496 |        "      <td>はじめて出して見た。8000番と順位は低いけどこれからがんばるぞいDoing my part...</td>\n",
 497 |        "      <td>abe shumpei</td>\n",
 498 |        "      <td>NaN</td>\n",
 499 |        "      <td>kaggle machinelearning</td>\n",
 500 |        "      <td>2</td>\n",
 501 |        "    </tr>\n",
 502 |        "    <tr>\n",
 503 |        "      <th>1</th>\n",
 504 |        "      <td>#kaggle</td>\n",
 505 |        "      <td>https://twitter.com/soh_1121_/status/125767813...</td>\n",
 506 |        "      <td>◯ 実施内容\\n・ #Paiza 1h\\n・ #言語処理100本ノック 0.5h\\n・ #K...</td>\n",
 507 |        "      <td>Soh</td>\n",
 508 |        "      <td>1.588689e+09</td>\n",
 509 |        "      <td>言語処理100本ノック apg4b 個人開発 kaggle 今日の積み上げ 駆け出しエンジニ...</td>\n",
 510 |        "      <td>9</td>\n",
 511 |        "    </tr>\n",
 512 |        "    <tr>\n",
 513 |        "      <th>2</th>\n",
 514 |        "      <td>#kaggle</td>\n",
 515 |        "      <td>https://twitter.com/WlWH74jtP0zHxmj/status/125...</td>\n",
 516 |        "      <td>AIの目標はやっぱりKaggleかな\\nグランドマスターとか憧れすぎる\\nいろいろ挑戦してみ...</td>\n",
 517 |        "      <td>やますん@駆け出しエンジニア</td>\n",
 518 |        "      <td>1.588677e+09</td>\n",
 519 |        "      <td>プログラミング学習 ai kaggle</td>\n",
 520 |        "      <td>3</td>\n",
 521 |        "    </tr>\n",
 522 |        "    <tr>\n",
 523 |        "      <th>3</th>\n",
 524 |        "      <td>#kaggle</td>\n",
 525 |        "      <td>https://twitter.com/bonjinjpn/status/110005131...</td>\n",
 526 |        "      <td>#SIGNATE - Data Science Competition #ML #DL #A...</td>\n",
 527 |        "      <td>K2</td>\n",
 528 |        "      <td>NaN</td>\n",
 529 |        "      <td>dl signate kaggle ai ml</td>\n",
 530 |        "      <td>5</td>\n",
 531 |        "    </tr>\n",
 532 |        "    <tr>\n",
 533 |        "      <th>4</th>\n",
 534 |        "      <td>#kaggle</td>\n",
 535 |        "      <td>https://twitter.com/tkydub/status/109950639977...</td>\n",
 536 |        "      <td>届きました🙌 #kaggle #機械学習 #機械学習のための特徴量エンジニアリング</td>\n",
 537 |        "      <td>toki⛅</td>\n",
 538 |        "      <td>NaN</td>\n",
 539 |        "      <td>kaggle 機械学習のための特徴量エンジニアリング 機械学習</td>\n",
 540 |        "      <td>3</td>\n",
 541 |        "    </tr>\n",
 542 |        "    <tr>\n",
 543 |        "      <th>...</th>\n",
 544 |        "      <td>...</td>\n",
 545 |        "      <td>...</td>\n",
 546 |        "      <td>...</td>\n",
 547 |        "      <td>...</td>\n",
 548 |        "      <td>...</td>\n",
 549 |        "      <td>...</td>\n",
 550 |        "      <td>...</td>\n",
 551 |        "    </tr>\n",
 552 |        "    <tr>\n",
 553 |        "      <th>1219</th>\n",
 554 |        "      <td>#kaggle</td>\n",
 555 |        "      <td>https://twitter.com/Wataoka_Koki/status/110109...</td>\n",
 556 |        "      <td>kaggle二日目\\n\\nDNNのkernelを自分好みにアレンジしながら実装した。\\n\\n...</td>\n",
 557 |        "      <td>綿岡 晃輝</td>\n",
 558 |        "      <td>NaN</td>\n",
 559 |        "      <td>santander kaggle</td>\n",
 560 |        "      <td>2</td>\n",
 561 |        "    </tr>\n",
 562 |        "    <tr>\n",
 563 |        "      <th>1220</th>\n",
 564 |        "      <td>#kaggle</td>\n",
 565 |        "      <td>https://twitter.com/codexa_net/status/11010897...</td>\n",
 566 |        "      <td>【Kaggle初心者入門編】タイタニック号で生き残るのは誰？\\n\\n#Kaggle #入門\\...</td>\n",
 567 |        "      <td>codexa[コデクサ:人工知能特化WEBスクール]</td>\n",
 568 |        "      <td>NaN</td>\n",
 569 |        "      <td>入門 kaggle</td>\n",
 570 |        "      <td>2</td>\n",
 571 |        "    </tr>\n",
 572 |        "    <tr>\n",
 573 |        "      <th>1221</th>\n",
 574 |        "      <td>#kaggle</td>\n",
 575 |        "      <td>https://twitter.com/hntk03/status/110099597289...</td>\n",
 576 |        "      <td>Feature Engineering #featureengineering #kaggl...</td>\n",
 577 |        "      <td>hntk</td>\n",
 578 |        "      <td>NaN</td>\n",
 579 |        "      <td>featureengineering kaggle</td>\n",
 580 |        "      <td>2</td>\n",
 581 |        "    </tr>\n",
 582 |        "    <tr>\n",
 583 |        "      <th>1222</th>\n",
 584 |        "      <td>#kaggle</td>\n",
 585 |        "      <td>https://twitter.com/sa178kla/status/1100890178...</td>\n",
 586 |        "      <td>もっと頑張ろうー\\nCausing #superintelligence, one subm...</td>\n",
 587 |        "      <td>yo</td>\n",
 588 |        "      <td>NaN</td>\n",
 589 |        "      <td>superintelligence kaggle</td>\n",
 590 |        "      <td>2</td>\n",
 591 |        "    </tr>\n",
 592 |        "    <tr>\n",
 593 |        "      <th>1223</th>\n",
 594 |        "      <td>#kaggle</td>\n",
 595 |        "      <td>https://twitter.com/dichika/status/29512284824...</td>\n",
 596 |        "      <td>適当にgbmにつっこんだら0.76555で924位ダッタヨ #kaggle #titanic</td>\n",
 597 |        "      <td>棗太郎</td>\n",
 598 |        "      <td>NaN</td>\n",
 599 |        "      <td>titanic kaggle</td>\n",
 600 |        "      <td>2</td>\n",
 601 |        "    </tr>\n",
 602 |        "  </tbody>\n",
 603 |        "</table>\n",
 604 |        "<p>1224 rows × 7 columns</p>\n",
 605 |        "</div>"
 606 |       ],
 607 |       "text/plain": [
 608 |        "     searched_for                                           post_url  \\\n",
 609 |        "0         #kaggle  https://twitter.com/AbeShumpei/status/11002246...   \n",
 610 |        "1         #kaggle  https://twitter.com/soh_1121_/status/125767813...   \n",
 611 |        "2         #kaggle  https://twitter.com/WlWH74jtP0zHxmj/status/125...   \n",
 612 |        "3         #kaggle  https://twitter.com/bonjinjpn/status/110005131...   \n",
 613 |        "4         #kaggle  https://twitter.com/tkydub/status/109950639977...   \n",
 614 |        "...           ...                                                ...   \n",
 615 |        "1219      #kaggle  https://twitter.com/Wataoka_Koki/status/110109...   \n",
 616 |        "1220      #kaggle  https://twitter.com/codexa_net/status/11010897...   \n",
 617 |        "1221      #kaggle  https://twitter.com/hntk03/status/110099597289...   \n",
 618 |        "1222      #kaggle  https://twitter.com/sa178kla/status/1100890178...   \n",
 619 |        "1223      #kaggle  https://twitter.com/dichika/status/29512284824...   \n",
 620 |        "\n",
 621 |        "                                                   post  \\\n",
 622 |        "0     はじめて出して見た。8000番と順位は低いけどこれからがんばるぞいDoing my part...   \n",
 623 |        "1     ◯ 実施内容\\n・ #Paiza 1h\\n・ #言語処理100本ノック 0.5h\\n・ #K...   \n",
 624 |        "2     AIの目標はやっぱりKaggleかな\\nグランドマスターとか憧れすぎる\\nいろいろ挑戦してみ...   \n",
 625 |        "3     #SIGNATE - Data Science Competition #ML #DL #A...   \n",
 626 |        "4             届きました🙌 #kaggle #機械学習 #機械学習のための特徴量エンジニアリング   \n",
 627 |        "...                                                 ...   \n",
 628 |        "1219  kaggle二日目\\n\\nDNNのkernelを自分好みにアレンジしながら実装した。\\n\\n...   \n",
 629 |        "1220  【Kaggle初心者入門編】タイタニック号で生き残るのは誰？\\n\\n#Kaggle #入門\\...   \n",
 630 |        "1221  Feature Engineering #featureengineering #kaggl...   \n",
 631 |        "1222  もっと頑張ろうー\\nCausing #superintelligence, one subm...   \n",
 632 |        "1223     適当にgbmにつっこんだら0.76555で924位ダッタヨ #kaggle #titanic   \n",
 633 |        "\n",
 634 |        "                            user     post_time  \\\n",
 635 |        "0                    abe shumpei           NaN   \n",
 636 |        "1                            Soh  1.588689e+09   \n",
 637 |        "2                 やますん@駆け出しエンジニア  1.588677e+09   \n",
 638 |        "3                             K2           NaN   \n",
 639 |        "4                          toki⛅           NaN   \n",
 640 |        "...                          ...           ...   \n",
 641 |        "1219                       綿岡 晃輝           NaN   \n",
 642 |        "1220  codexa[コデクサ:人工知能特化WEBスクール]           NaN   \n",
 643 |        "1221                        hntk           NaN   \n",
 644 |        "1222                          yo           NaN   \n",
 645 |        "1223                         棗太郎           NaN   \n",
 646 |        "\n",
 647 |        "                                               hashtags  hashtag_len  \n",
 648 |        "0                                kaggle machinelearning            2  \n",
 649 |        "1     言語処理100本ノック apg4b 個人開発 kaggle 今日の積み上げ 駆け出しエンジニ...            9  \n",
 650 |        "2                                   プログラミング学習 ai kaggle            3  \n",
 651 |        "3                               dl signate kaggle ai ml            5  \n",
 652 |        "4                       kaggle 機械学習のための特徴量エンジニアリング 機械学習            3  \n",
 653 |        "...                                                 ...          ...  \n",
 654 |        "1219                                   santander kaggle            2  \n",
 655 |        "1220                                          入門 kaggle            2  \n",
 656 |        "1221                          featureengineering kaggle            2  \n",
 657 |        "1222                           superintelligence kaggle            2  \n",
 658 |        "1223                                     titanic kaggle            2  \n",
 659 |        "\n",
 660 |        "[1224 rows x 7 columns]"
 661 |       ]
 662 |      },
 663 |      "execution_count": 16,
 664 |      "metadata": {},
 665 |      "output_type": "execute_result"
 666 |     }
 667 |    ],
 668 |    "source": [
 669 |     "df3"
 670 |    ]
 671 |   },
 672 |   {
 673 |    "cell_type": "code",
 674 |    "execution_count": 17,
 675 |    "metadata": {},
 676 |    "outputs": [
 677 |     {
 678 |      "data": {
 679 |       "text/html": [
 680 |        "<div>\n",
 681 |        "<style scoped>\n",
 682 |        "    .dataframe tbody tr th:only-of-type {\n",
 683 |        "        vertical-align: middle;\n",
 684 |        "    }\n",
 685 |        "\n",
 686 |        "    .dataframe tbody tr th {\n",
 687 |        "        vertical-align: top;\n",
 688 |        "    }\n",
 689 |        "\n",
 690 |        "    .dataframe thead th {\n",
 691 |        "        text-align: right;\n",
 692 |        "    }\n",
 693 |        "</style>\n",
 694 |        "<table border=\"1\" class=\"dataframe\">\n",
 695 |        "  <thead>\n",
 696 |        "    <tr style=\"text-align: right;\">\n",
 697 |        "      <th></th>\n",
 698 |        "      <th>searched_for</th>\n",
 699 |        "      <th>post_url</th>\n",
 700 |        "      <th>post</th>\n",
 701 |        "      <th>user</th>\n",
 702 |        "      <th>post_time</th>\n",
 703 |        "      <th>hashtags</th>\n",
 704 |        "      <th>hashtag_len</th>\n",
 705 |        "    </tr>\n",
 706 |        "  </thead>\n",
 707 |        "  <tbody>\n",
 708 |        "    <tr>\n",
 709 |        "      <th>0</th>\n",
 710 |        "      <td>#python</td>\n",
 711 |        "      <td>https://twitter.com/joekadowaki/status/1245109...</td>\n",
 712 |        "      <td>｢仕事のムダ｣を省くための、コミュニケーションに関する2つのポイント\\nhttps://t....</td>\n",
 713 |        "      <td>じょー</td>\n",
 714 |        "      <td>NaN</td>\n",
 715 |        "      <td>python technology 駆け出しエンジニアと繋がりたい</td>\n",
 716 |        "      <td>3</td>\n",
 717 |        "    </tr>\n",
 718 |        "    <tr>\n",
 719 |        "      <th>1</th>\n",
 720 |        "      <td>#python</td>\n",
 721 |        "      <td>https://twitter.com/maronaru_sale_t/status/125...</td>\n",
 722 |        "      <td>LINEの半bot、保護botのソースや\\nPythonista3の使い方\\nソースの書き方...</td>\n",
 723 |        "      <td>U&amp;I iryuSale LINEbot販売</td>\n",
 724 |        "      <td>1.588720e+09</td>\n",
 725 |        "      <td>半bot プログラミング pythonista 保護bot linebot python p...</td>\n",
 726 |        "      <td>8</td>\n",
 727 |        "    </tr>\n",
 728 |        "    <tr>\n",
 729 |        "      <th>2</th>\n",
 730 |        "      <td>#python</td>\n",
 731 |        "      <td>https://twitter.com/joekadowaki/status/1245108...</td>\n",
 732 |        "      <td>「ビジネスメール詐欺の実態調査報告書」を公開　JPCERT/CC\\nhttps://t.co...</td>\n",
 733 |        "      <td>じょー</td>\n",
 734 |        "      <td>NaN</td>\n",
 735 |        "      <td>python technology 駆け出しエンジニアと繋がりたい</td>\n",
 736 |        "      <td>3</td>\n",
 737 |        "    </tr>\n",
 738 |        "    <tr>\n",
 739 |        "      <th>3</th>\n",
 740 |        "      <td>#python</td>\n",
 741 |        "      <td>https://twitter.com/sheep_0411/status/12578075...</td>\n",
 742 |        "      <td>日経平均\\n2020年05月01日の終値：19,619.35円\\n(前日比-2.84%)\\n...</td>\n",
 743 |        "      <td>シープ</td>\n",
 744 |        "      <td>1.588720e+09</td>\n",
 745 |        "      <td>heroku bot python 日経平均</td>\n",
 746 |        "      <td>4</td>\n",
 747 |        "    </tr>\n",
 748 |        "    <tr>\n",
 749 |        "      <th>4</th>\n",
 750 |        "      <td>#python</td>\n",
 751 |        "      <td>https://twitter.com/joekadowaki/status/1245108...</td>\n",
 752 |        "      <td>ライス大学研究チーム、GPUを使わずにディープラーニングを高速化するアルゴリズムを開発\\nh...</td>\n",
 753 |        "      <td>じょー</td>\n",
 754 |        "      <td>NaN</td>\n",
 755 |        "      <td>python technology 駆け出しエンジニアと繋がりたい</td>\n",
 756 |        "      <td>3</td>\n",
 757 |        "    </tr>\n",
 758 |        "    <tr>\n",
 759 |        "      <th>...</th>\n",
 760 |        "      <td>...</td>\n",
 761 |        "      <td>...</td>\n",
 762 |        "      <td>...</td>\n",
 763 |        "      <td>...</td>\n",
 764 |        "      <td>...</td>\n",
 765 |        "      <td>...</td>\n",
 766 |        "      <td>...</td>\n",
 767 |        "    </tr>\n",
 768 |        "    <tr>\n",
 769 |        "      <th>5270</th>\n",
 770 |        "      <td>#python</td>\n",
 771 |        "      <td>https://twitter.com/Kuno39962216/status/124511...</td>\n",
 772 |        "      <td>2020年4月1日学習\\n・Udemy 【世界で5万人が受講】実践 Pythonデータサイエ...</td>\n",
 773 |        "      <td>kuno&amp;pandapi</td>\n",
 774 |        "      <td>NaN</td>\n",
 775 |        "      <td>udemy python データサイエンス</td>\n",
 776 |        "      <td>3</td>\n",
 777 |        "    </tr>\n",
 778 |        "    <tr>\n",
 779 |        "      <th>5271</th>\n",
 780 |        "      <td>#python</td>\n",
 781 |        "      <td>https://twitter.com/BASEBALLY15/status/1245109...</td>\n",
 782 |        "      <td>#今日の積み上げ\\n今日も頑張りましょう😊\\n\\n▶️ #Python ブログ執筆\\n▶️ ...</td>\n",
 783 |        "      <td>ゆうき@Python＋C💻ブログで発信📝</td>\n",
 784 |        "      <td>NaN</td>\n",
 785 |        "      <td>今日の積み上げ python 駆け出しエンジニアと繋がりたい</td>\n",
 786 |        "      <td>3</td>\n",
 787 |        "    </tr>\n",
 788 |        "    <tr>\n",
 789 |        "      <th>5272</th>\n",
 790 |        "      <td>#python</td>\n",
 791 |        "      <td>https://twitter.com/joekadowaki/status/1245109...</td>\n",
 792 |        "      <td>リモートワークで疲弊する人へ｜この際、生産性は忘れよう\\nhttps://t.co/mJnU...</td>\n",
 793 |        "      <td>じょー</td>\n",
 794 |        "      <td>NaN</td>\n",
 795 |        "      <td>python technology 駆け出しエンジニアと繋がりたい</td>\n",
 796 |        "      <td>3</td>\n",
 797 |        "    </tr>\n",
 798 |        "    <tr>\n",
 799 |        "      <th>5273</th>\n",
 800 |        "      <td>#python</td>\n",
 801 |        "      <td>https://twitter.com/joekadowaki/status/1245109...</td>\n",
 802 |        "      <td>地頭のいい人≠アイデアマン。｢問題解決｣への最短距離のつくり方\\nhttps://t.co/...</td>\n",
 803 |        "      <td>じょー</td>\n",
 804 |        "      <td>NaN</td>\n",
 805 |        "      <td>python technology 駆け出しエンジニアと繋がりたい</td>\n",
 806 |        "      <td>3</td>\n",
 807 |        "    </tr>\n",
 808 |        "    <tr>\n",
 809 |        "      <th>5274</th>\n",
 810 |        "      <td>#python</td>\n",
 811 |        "      <td>https://twitter.com/joekadowaki/status/1245109...</td>\n",
 812 |        "      <td>オンライン会議を生かす、スムーズな進め方と注意点\\nhttps://t.co/w88CTnb...</td>\n",
 813 |        "      <td>じょー</td>\n",
 814 |        "      <td>NaN</td>\n",
 815 |        "      <td>python technology 駆け出しエンジニアと繋がりたい</td>\n",
 816 |        "      <td>3</td>\n",
 817 |        "    </tr>\n",
 818 |        "  </tbody>\n",
 819 |        "</table>\n",
 820 |        "<p>5275 rows × 7 columns</p>\n",
 821 |        "</div>"
 822 |       ],
 823 |       "text/plain": [
 824 |        "     searched_for                                           post_url  \\\n",
 825 |        "0         #python  https://twitter.com/joekadowaki/status/1245109...   \n",
 826 |        "1         #python  https://twitter.com/maronaru_sale_t/status/125...   \n",
 827 |        "2         #python  https://twitter.com/joekadowaki/status/1245108...   \n",
 828 |        "3         #python  https://twitter.com/sheep_0411/status/12578075...   \n",
 829 |        "4         #python  https://twitter.com/joekadowaki/status/1245108...   \n",
 830 |        "...           ...                                                ...   \n",
 831 |        "5270      #python  https://twitter.com/Kuno39962216/status/124511...   \n",
 832 |        "5271      #python  https://twitter.com/BASEBALLY15/status/1245109...   \n",
 833 |        "5272      #python  https://twitter.com/joekadowaki/status/1245109...   \n",
 834 |        "5273      #python  https://twitter.com/joekadowaki/status/1245109...   \n",
 835 |        "5274      #python  https://twitter.com/joekadowaki/status/1245109...   \n",
 836 |        "\n",
 837 |        "                                                   post  \\\n",
 838 |        "0     ｢仕事のムダ｣を省くための、コミュニケーションに関する2つのポイント\\nhttps://t....   \n",
 839 |        "1     LINEの半bot、保護botのソースや\\nPythonista3の使い方\\nソースの書き方...   \n",
 840 |        "2     「ビジネスメール詐欺の実態調査報告書」を公開　JPCERT/CC\\nhttps://t.co...   \n",
 841 |        "3     日経平均\\n2020年05月01日の終値：19,619.35円\\n(前日比-2.84%)\\n...   \n",
 842 |        "4     ライス大学研究チーム、GPUを使わずにディープラーニングを高速化するアルゴリズムを開発\\nh...   \n",
 843 |        "...                                                 ...   \n",
 844 |        "5270  2020年4月1日学習\\n・Udemy 【世界で5万人が受講】実践 Pythonデータサイエ...   \n",
 845 |        "5271  #今日の積み上げ\\n今日も頑張りましょう😊\\n\\n▶️ #Python ブログ執筆\\n▶️ ...   \n",
 846 |        "5272  リモートワークで疲弊する人へ｜この際、生産性は忘れよう\\nhttps://t.co/mJnU...   \n",
 847 |        "5273  地頭のいい人≠アイデアマン。｢問題解決｣への最短距離のつくり方\\nhttps://t.co/...   \n",
 848 |        "5274  オンライン会議を生かす、スムーズな進め方と注意点\\nhttps://t.co/w88CTnb...   \n",
 849 |        "\n",
 850 |        "                        user     post_time  \\\n",
 851 |        "0                        じょー           NaN   \n",
 852 |        "1     U&I iryuSale LINEbot販売  1.588720e+09   \n",
 853 |        "2                        じょー           NaN   \n",
 854 |        "3                        シープ  1.588720e+09   \n",
 855 |        "4                        じょー           NaN   \n",
 856 |        "...                      ...           ...   \n",
 857 |        "5270            kuno&pandapi           NaN   \n",
 858 |        "5271    ゆうき@Python＋C💻ブログで発信📝           NaN   \n",
 859 |        "5272                     じょー           NaN   \n",
 860 |        "5273                     じょー           NaN   \n",
 861 |        "5274                     じょー           NaN   \n",
 862 |        "\n",
 863 |        "                                               hashtags  hashtag_len  \n",
 864 |        "0                     python technology 駆け出しエンジニアと繋がりたい            3  \n",
 865 |        "1     半bot プログラミング pythonista 保護bot linebot python p...            8  \n",
 866 |        "2                     python technology 駆け出しエンジニアと繋がりたい            3  \n",
 867 |        "3                                heroku bot python 日経平均            4  \n",
 868 |        "4                     python technology 駆け出しエンジニアと繋がりたい            3  \n",
 869 |        "...                                                 ...          ...  \n",
 870 |        "5270                              udemy python データサイエンス            3  \n",
 871 |        "5271                     今日の積み上げ python 駆け出しエンジニアと繋がりたい            3  \n",
 872 |        "5272                  python technology 駆け出しエンジニアと繋がりたい            3  \n",
 873 |        "5273                  python technology 駆け出しエンジニアと繋がりたい            3  \n",
 874 |        "5274                  python technology 駆け出しエンジニアと繋がりたい            3  \n",
 875 |        "\n",
 876 |        "[5275 rows x 7 columns]"
 877 |       ]
 878 |      },
 879 |      "execution_count": 17,
 880 |      "metadata": {},
 881 |      "output_type": "execute_result"
 882 |     }
 883 |    ],
 884 |    "source": [
 885 |     "df4"
 886 |    ]
 887 |   },
 888 |   {
 889 |    "cell_type": "code",
 890 |    "execution_count": 23,
 891 |    "metadata": {},
 892 |    "outputs": [],
 893 |    "source": [
 894 |     "cols = ['searched_for', 'hashtags', 'hashtag_len']\n",
 895 |     "df1 = df1[cols]\n",
 896 |     "df2 = df2[cols]\n",
 897 |     "df3 = df3[cols]\n",
 898 |     "df4 = df4[cols]"
 899 |    ]
 900 |   },
 901 |   {
 902 |    "cell_type": "code",
 903 |    "execution_count": 24,
 904 |    "metadata": {},
 905 |    "outputs": [],
 906 |    "source": [
 907 |     "df = pd.concat([df1, df2], axis=0)\n",
 908 |     "df = pd.concat([df, df3], axis=0)\n",
 909 |     "df = pd.concat([df, df4], axis=0)"
 910 |    ]
 911 |   },
 912 |   {
 913 |    "cell_type": "code",
 914 |    "execution_count": 28,
 915 |    "metadata": {},
 916 |    "outputs": [
 917 |     {
 918 |      "data": {
 919 |       "text/html": [
 920 |        "<div>\n",
 921 |        "<style scoped>\n",
 922 |        "    .dataframe tbody tr th:only-of-type {\n",
 923 |        "        vertical-align: middle;\n",
 924 |        "    }\n",
 925 |        "\n",
 926 |        "    .dataframe tbody tr th {\n",
 927 |        "        vertical-align: top;\n",
 928 |        "    }\n",
 929 |        "\n",
 930 |        "    .dataframe thead th {\n",
 931 |        "        text-align: right;\n",
 932 |        "    }\n",
 933 |        "</style>\n",
 934 |        "<table border=\"1\" class=\"dataframe\">\n",
 935 |        "  <thead>\n",
 936 |        "    <tr style=\"text-align: right;\">\n",
 937 |        "      <th></th>\n",
 938 |        "      <th>searched_for</th>\n",
 939 |        "      <th>hashtags</th>\n",
 940 |        "      <th>hashtag_len</th>\n",
 941 |        "    </tr>\n",
 942 |        "  </thead>\n",
 943 |        "  <tbody>\n",
 944 |        "    <tr>\n",
 945 |        "      <th>5643</th>\n",
 946 |        "      <td>#人工知能</td>\n",
 947 |        "      <td>トルコ ドローン 神風ドローン 顔認証 ai drone 人工知能</td>\n",
 948 |        "      <td>7</td>\n",
 949 |        "    </tr>\n",
 950 |        "    <tr>\n",
 951 |        "      <th>2944</th>\n",
 952 |        "      <td>#python</td>\n",
 953 |        "      <td>駆け出しエンジニアとつながりたい python プログラミング初心者</td>\n",
 954 |        "      <td>3</td>\n",
 955 |        "    </tr>\n",
 956 |        "    <tr>\n",
 957 |        "      <th>210</th>\n",
 958 |        "      <td>#kaggle</td>\n",
 959 |        "      <td>kaggle 機械学習 データサイエンティスト</td>\n",
 960 |        "      <td>3</td>\n",
 961 |        "    </tr>\n",
 962 |        "    <tr>\n",
 963 |        "      <th>2115</th>\n",
 964 |        "      <td>#python</td>\n",
 965 |        "      <td>駆け出しエンジニアと繋がりたい プログラミング python プログラミング学習 プログラミ...</td>\n",
 966 |        "      <td>5</td>\n",
 967 |        "    </tr>\n",
 968 |        "    <tr>\n",
 969 |        "      <th>1275</th>\n",
 970 |        "      <td>#データサイエンティスト</td>\n",
 971 |        "      <td>統計学 統計学専攻 データサイエンティスト 統計 外資系 外資系企業</td>\n",
 972 |        "      <td>6</td>\n",
 973 |        "    </tr>\n",
 974 |        "    <tr>\n",
 975 |        "      <th>...</th>\n",
 976 |        "      <td>...</td>\n",
 977 |        "      <td>...</td>\n",
 978 |        "      <td>...</td>\n",
 979 |        "    </tr>\n",
 980 |        "    <tr>\n",
 981 |        "      <th>1666</th>\n",
 982 |        "      <td>#python</td>\n",
 983 |        "      <td>python 機械学習 回帰分析</td>\n",
 984 |        "      <td>3</td>\n",
 985 |        "    </tr>\n",
 986 |        "    <tr>\n",
 987 |        "      <th>6165</th>\n",
 988 |        "      <td>#人工知能</td>\n",
 989 |        "      <td>makeinglandscape deeplearning nowlearning ai g...</td>\n",
 990 |        "      <td>6</td>\n",
 991 |        "    </tr>\n",
 992 |        "    <tr>\n",
 993 |        "      <th>5210</th>\n",
 994 |        "      <td>#python</td>\n",
 995 |        "      <td>オホーツク fswebcam python イマソラ 北海道 photo raspberrypi</td>\n",
 996 |        "      <td>7</td>\n",
 997 |        "    </tr>\n",
 998 |        "    <tr>\n",
 999 |        "      <th>873</th>\n",
1000 |        "      <td>#人工知能</td>\n",
1001 |        "      <td>ai 人工知能</td>\n",
1002 |        "      <td>2</td>\n",
1003 |        "    </tr>\n",
1004 |        "    <tr>\n",
1005 |        "      <th>3881</th>\n",
1006 |        "      <td>#人工知能</td>\n",
1007 |        "      <td>セルフブランディング ai ルーチンワーク 人工知能</td>\n",
1008 |        "      <td>4</td>\n",
1009 |        "    </tr>\n",
1010 |        "  </tbody>\n",
1011 |        "</table>\n",
1012 |        "<p>100 rows × 3 columns</p>\n",
1013 |        "</div>"
1014 |       ],
1015 |       "text/plain": [
1016 |        "      searched_for                                           hashtags  \\\n",
1017 |        "5643         #人工知能                  トルコ ドローン 神風ドローン 顔認証 ai drone 人工知能   \n",
1018 |        "2944       #python                 駆け出しエンジニアとつながりたい python プログラミング初心者   \n",
1019 |        "210        #kaggle                            kaggle 機械学習 データサイエンティスト   \n",
1020 |        "2115       #python  駆け出しエンジニアと繋がりたい プログラミング python プログラミング学習 プログラミ...   \n",
1021 |        "1275  #データサイエンティスト                 統計学 統計学専攻 データサイエンティスト 統計 外資系 外資系企業   \n",
1022 |        "...            ...                                                ...   \n",
1023 |        "1666       #python                                   python 機械学習 回帰分析   \n",
1024 |        "6165         #人工知能  makeinglandscape deeplearning nowlearning ai g...   \n",
1025 |        "5210       #python   オホーツク fswebcam python イマソラ 北海道 photo raspberrypi   \n",
1026 |        "873          #人工知能                                            ai 人工知能   \n",
1027 |        "3881         #人工知能                         セルフブランディング ai ルーチンワーク 人工知能   \n",
1028 |        "\n",
1029 |        "      hashtag_len  \n",
1030 |        "5643            7  \n",
1031 |        "2944            3  \n",
1032 |        "210             3  \n",
1033 |        "2115            5  \n",
1034 |        "1275            6  \n",
1035 |        "...           ...  \n",
1036 |        "1666            3  \n",
1037 |        "6165            6  \n",
1038 |        "5210            7  \n",
1039 |        "873             2  \n",
1040 |        "3881            4  \n",
1041 |        "\n",
1042 |        "[100 rows x 3 columns]"
1043 |       ]
1044 |      },
1045 |      "execution_count": 28,
1046 |      "metadata": {},
1047 |      "output_type": "execute_result"
1048 |     }
1049 |    ],
1050 |    "source": [
1051 |     "df.sample(100)"
1052 |    ]
1053 |   },
1054 |   {
1055 |    "cell_type": "code",
1056 |    "execution_count": 26,
1057 |    "metadata": {},
1058 |    "outputs": [],
1059 |    "source": [
1060 |     "df.to_csv('twitter_post.csv', index=False)"
1061 |    ]
1062 |   },
1063 |   {
1064 |    "cell_type": "code",
1065 |    "execution_count": null,
1066 |    "metadata": {},
1067 |    "outputs": [],
1068 |    "source": []
1069 |   }
1070 |  ],
1071 |  "metadata": {
1072 |   "kernelspec": {
1073 |    "display_name": "Python 3",
1074 |    "language": "python",
1075 |    "name": "python3"
1076 |   },
1077 |   "language_info": {
1078 |    "codemirror_mode": {
1079 |     "name": "ipython",
1080 |     "version": 3
1081 |    },
1082 |    "file_extension": ".py",
1083 |    "mimetype": "text/x-python",
1084 |    "name": "python",
1085 |    "nbconvert_exporter": "python",
1086 |    "pygments_lexer": "ipython3",
1087 |    "version": "3.7.2"
1088 |   }
1089 |  },
1090 |  "nbformat": 4,
1091 |  "nbformat_minor": 4
1092 | }
1093 | 


--------------------------------------------------------------------------------
/nlp/twitter_analytics_using_nlplot/wordcloud.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/takapy0210/geek_blog/e36604f01d26f4d14bdacc6bb2995c929d49fdfa/nlp/twitter_analytics_using_nlplot/wordcloud.png


--------------------------------------------------------------------------------
/other/hatenablog_css/design.css:
--------------------------------------------------------------------------------
  1 | /* <system section="theme" selected="8599973812270629022"> */
  2 | @import "https://blog.hatena.ne.jp/-/theme/8599973812270629022.css";
  3 | 
  4 | /* ブログタイトル文字サイズ変更 */
  5 | @media screen and (max-width: 640px){
  6 |     #blog-title #title {
  7 |         font-size: 20px !important;
  8 |     }
  9 | }
 10 | 
 11 | /* タイトル下のブログ説明部分 (設定 > 基本設定 > ブログの説明) */
 12 | h2#blog-description {
 13 |     font-size: 12px !important;  /* 文字サイズ変更 */
 14 |     margin: 1px;  /* 上下左右に余白追加 */
 15 | }
 16 | 
 17 | /* 【タブレット、PC限定】 */
 18 | @media screen and (min-width:641px) {
 19 |     h2#blog-description {
 20 |         font-size: 18px !important;  /* 文字サイズ変更 */
 21 |         margin: 5px;  /* 上下左右に余白追加 */
 22 |     }
 23 | }
 24 | 
 25 | /* </system> */
 26 | 
 27 | /* ### ヘッダーの背景色 ### */
 28 | #blog-title{
 29 |   background: #f8f8ff !important;
 30 | }
 31 | /* ### ブログタイトルの文字色 ### */
 32 | #title a{
 33 |   color: #カラーコード !important;
 34 | }
 35 | /* ### ブログ説明の文字色 ### */
 36 | #blog-description{
 37 |   color: #カラーコード !important;
 38 | }
 39 | 
 40 | /*
 41 | 枠 (div) の設定 (画面幅、境界線、背景色)
 42 | -------------------------------------------------------*/
 43 | /* 【タブレット、PC限定】 */
 44 | @media screen and (min-width:641px) {
 45 |     /* 左右の余白を削除 */
 46 |     #container {
 47 |         width: 80%;  /* 本文エリアとサイドバー含めて画面いっぱいに広げる */
 48 |     }
 49 | 
 50 |     /* 本文エリア全体 */
 51 |     #main {
 52 |         background-color: #ffffff;  /* 本文エリアの背景色 */
 53 |         /*border: 1px solid #bde6f2;*/  /* 本文エリアの枠線 */
 54 |         border-radius: 5px; /* 角を丸くする */
 55 |         float: left;  /* サイドバーをfloat leftにするため */
 56 |         margin: 30px 2% 0 8%;
 57 |         padding: 30px;  /* 本文エリアの文字と枠線の間の余白 */
 58 |         width: 50%; /* 画面幅50% */
 59 |     }
 60 | 
 61 |     /* サイドバー */
 62 |     #box2 {
 63 |         float: left;  /* 本文エリアの方に詰める */
 64 |         margin: 30px 3% 0 2%;
 65 |         width: 22%; /* 画面幅22% 画面拡大しても崩れにくいよう余裕持たせてます */
 66 |     }
 67 | }
 68 | 
 69 | /*
 70 | 基本的なフォント設定 (見出しの設定は、「記事エリアの設定」で行う)
 71 | -------------------------------------------------------*/
 72 | /* 全体のフォントファミリー指定 */
 73 | /* ★ WEBフォントの追加設定 */
 74 | .entry-content, .entry-title, body {
 75 |     font-family: 'Noto Sans', 'Noto Sans JP', 'Hiragino Kaku Gothic ProN', メイリオ, Meiryo, sans-serif;
 76 |     /*letter-spacing: 0.0005em;*/ /* 字間を0.05字分空けて読みやすくする */
 77 | }
 78 | 
 79 | /*
 80 | 見出しの設定
 81 | -------------------------------------------------------*/
 82 | /* 記事タイトルのフォント */
 83 | h1.entry-title a {
 84 |     font-size: 15px;
 85 | }
 86 | 
 87 | /* 【タブレット、PC限定】 */
 88 | @media screen and (min-width:641px) {
 89 |     h1.entry-title a {
 90 |     font-size: 22px;
 91 |     }
 92 | }
 93 | 
 94 | /* 見出し1の設定 */
 95 | .entry-content h1 {
 96 |     padding: 0.6em 0.6em;/*上下 左右の余白*/
 97 |     border-left: solid 2.5px #ffa8a8;/*左線*/
 98 |     font-size: 22px;
 99 |     background: #f9fcff;/*背景色*/
100 |     /*padding: 10px 20px 15px 20px;*/
101 | }
102 | 
103 | /* 見出し2の設定 */
104 | .entry-content h2 {
105 |     padding: 0.2em 0.4em;/*上下 左右の余白*/
106 |     color: #494949;/*文字色*/
107 |     background: transparent;/*背景透明に*/
108 |     border-bottom: solid 1.5px #d3d3d3;
109 |     font-size: 20px;
110 | }
111 | 
112 | /* 見出し3の設定 */
113 | .entry-content h3 {
114 |     padding: 0.2em 0.2em;/*上下 左右の余白*/
115 |     color: #494949;/*文字色*/
116 |     font-size: 18px;
117 | }
118 | 
119 | /*
120 | 強調文字列部分の設定 (マークダウンでいう右記の部分： ** 文字列 **)
121 | -------------------------------------------------------*/
122 | /* 蛍光ペンの設定 */
123 | /* (補足) rgbaの4番目の引数は透明度を表す。0で透明、1で完全に塗りつぶす。transparentは一部ブラウザで黒と解釈されるので使わない */
124 | /* (補足) 60%の数値を両方増やすと蛍光ペンが細くなる。両方減らすと太くなる */
125 | /* (補足) 前半を20%、後半を80%とすると、上から20%の位置を透明、80%の位置を色付きとし、間はグラデーションになる */
126 | /* ■蛍光ペンのデザイン：https://naifix.com/strong-css-sample/ */
127 | .entry-content strong {
128 |     background: linear-gradient(rgba(246, 210, 139, 0) 60%, rgba(246, 210, 139, 1) 60%);  
129 |     border-radius: 2px; /* 角を丸める */
130 | }
131 | 
132 | 
133 | /* 行間の設定 */
134 | /*.entry-content p {margin:0.1}*/
135 | .entry-content p{ 
136 | line-height: 1.8em; /* 行間の幅調整*/
137 | letter-spacing:0.4pt; /* 文字の間隔調整*/
138 | /*font-size:15px;*/
139 | }  
140 | 
141 | /*
142 | 目次の設定
143 | -------------------------------------------------------*/
144 | /* 見出し1に対応する目次の余白調整、および自動採番用の変数セット */
145 | ul.table-of-contents > li {
146 |     margin-top: 0.1em;
147 |     list-style-type: none;
148 |     counter-increment: mokuji-1; /* mokuji-1という変数に1を足す */
149 |     counter-reset: mokuji-2; /* mokuji-2という変数の値を0に戻す */
150 |     line-height:132%;
151 | }
152 | 
153 | /* 見出し1に対応する目次の自動採番 */
154 | ul.table-of-contents > li::before{
155 |     content: counter(mokuji-1) ". "; /* 文字列挿入。"1. " のような形式 */
156 | }
157 | 
158 | /* 見出し2に対応する目次の余白調整、および自動採番用の変数セット */
159 | ul.table-of-contents ul > li {
160 |     list-style-type: none;
161 |     margin-top: 0;
162 |     counter-increment: mokuji-2;
163 |     line-height:132%;
164 | }
165 | 
166 | /* 見出し2に対応する目次の自動採番 */
167 | ul.table-of-contents ul > li::before {
168 |     content: counter(mokuji-1) "." counter(mokuji-2) ". "; /* 文字列挿入。"1.1. " のような形式 */
169 | }
170 | 
171 | /* 見出し3以降に対応する目次を非表示にする */
172 | ul.table-of-contents ul ul { 
173 |     display: none;
174 |     line-height:132%;
175 | }
176 | 
177 | .entry-content .table-of-contents {
178 |     /*margin: 2em 2em;*/ /*目次上下の余白*/
179 |     padding: 3em 0 2em 2em; /*目次下内部余白 上,右,下,左*/
180 |     /*margin: 0 0 0 3.5em;*/ /*左側余白*/
181 |     /*padding: 0.01em 0 0 0 !important;*/ /*行間余白*/
182 |     /*border: 1px solid #ddd;*/ /*枠線のスタイル*/
183 |     /*background-color: #fff;*/ /*目次内背景色*/
184 |     /*font-size: 0.95em;*/ /*文字サイズ*/
185 |     /*font-weight: normal;*/ /*文字太さ*/
186 |     border-radius: 5px; /*角を丸める*/
187 | }
188 | 
189 | ul.table-of-contents > li a:link{
190 |   color:#ad8383; /*色はここを変更*/
191 | 　text-decoration: none;
192 | }
193 | 
194 | .entry-content .table-of-contents a:link{
195 | 　color:#ad8383; /*色はここを変更*/
196 | 　text-decoration: none;
197 | }
198 | 
199 | ul.table-of-contents > li a:visited{
200 |   color:#8c6a6a; /*色はここを変更*/
201 | }
202 | 
203 | .entry-content .table-of-contents a:visited{
204 | 　color: #8c6a6a; /*色はここを変更*/
205 | }
206 | 
207 | .entry-content .table-of-contents a:hover{
208 | 　text-decoration:underline; /*下線をつける*/
209 | }
210 | 
211 | /*
212 | ソースコードのシンタックスハイライト (Syntax Highlighting) の書式
213 | -------------------------------------------------------*/
214 | /* 文字サイズ変更 */
215 | .entry-content pre.code {
216 |    font-size:90%;
217 |    line-height:150%;
218 | }
219 | 
220 | /* コードの背景色変更 */
221 | .entry-content pre.code {
222 |     background-color: #3F3F3F;
223 |     color: #DCDCDC;
224 | }
225 | /*
226 | pre.code ol{
227 |   margin-top: 0;
228 |   margin-bottom: 0;
229 | }
230 | pre.code .code-list{
231 |   border-left: 1px solid #999999; *縦線*
232 |   padding-left:6px;
233 | }
234 | pre.code .code-list:nth-child(2n+1) {
235 |     background-color: #424242; *奇数行の背景色*
236 | }
237 | */
238 | .synSpecial { color: #cc9393; }
239 | .synType { color: #E3CEAB; }
240 | .synComment { color: #7A987A; }
241 | .synPreProc { color: #8c8cb4; }
242 | .synIdentifier { color: #6e96be; }
243 | .synConstant { color: #cc9393; }
244 | .synStatement { color: #efc986; }
245 | 
246 | 
247 | /*
248 | 追尾する目次
249 | -------------------------------------------------------*/
250 | #stoc-module {
251 |   backface-visibility: hidden;
252 | }
253 | #stoc-module.tracking {
254 |   margin-bottom: 0;
255 | }
256 | #stoc-module.fixed {
257 |   position: fixed;
258 | }
259 | #stoc-module.absolute {
260 |   position: absolute;
261 | }
262 | #stoc-module.sticky {
263 |   position: -webkit-sticky;
264 |   position: sticky;
265 | }
266 | #stoc-module.fade-in {
267 |   animation: fadeIn 300ms;
268 | }
269 | @keyframes fadeIn {
270 |   0% {opacity: 0}
271 |   100% {opacity: 1}
272 | }
273 | 
274 | #stoc {
275 |   overflow-y: auto;
276 | }
277 | #stoc.shadow {
278 |   /* Shadows */
279 |   background:
280 |     radial-gradient(farthest-side at top, rgba(0,0,0,.17), transparent) top / 100% 11px,
281 |     radial-gradient(farthest-side at bottom, rgba(0,0,0,.17), transparent) bottom / 100% 11px;
282 |   background-repeat: no-repeat;
283 |   background-attachment: scroll;
284 | }
285 | #stoc ol {
286 |   margin: 0;
287 |   padding: 0 0 0 1em;
288 |   list-style-type: none;
289 | }
290 | #stoc > ol {
291 |   padding-left: 0;
292 | }
293 | #stoc.shadow > ol {
294 |   /* Shadow covers */
295 |   background:
296 |     linear-gradient(#fff 30%, transparent) top / 100% 40px,
297 |     linear-gradient(transparent, #fff 70%) bottom / 100% 40px;
298 |   background-repeat: no-repeat;
299 |   background-attachment: local;
300 | }
301 | #stoc a {
302 |   padding: 2px 2px 2px 6px;
303 |   display: block;
304 |   text-decoration: none;
305 | }
306 | #stoc:not(.touch) a:hover {
307 |   background-color: rgba(0,0,0,.04);
308 |   text-decoration: underline;
309 | }
310 | #stoc .active {
311 |   background-color: rgba(0,0,0,.04);
312 | }
313 | 
314 | #stoc::-webkit-scrollbar {
315 |   width: 8px;
316 |   background: #ececec;
317 | }
318 | #stoc::-webkit-scrollbar-button {
319 |   display: none;
320 | }
321 | #stoc::-webkit-scrollbar-thumb {
322 |   background: #b1b1b1;
323 | }
324 | 
325 | 
326 | /*
327 | Categoryをタイル表示に変更（Innocent）
328 | うまく動かない
329 | -------------------------------------------------------*/
330 | /*
331 | .hatena-module-category .hatena-urllist {
332 |  margin: 0 0 -6px;
333 |  padding: 0;
334 | }
335 | .hatena-module-category .hatena-urllist li::before {
336 |  content: none;
337 | }
338 | .hatena-module-category .hatena-urllist li {
339 |  border-top: 0;
340 |  display: block;
341 |  float: left;
342 |  margin: 0 6px 6px 0;
343 |  padding: 0;
344 | }
345 | .hatena-module-category .hatena-urllist li a {
346 |  border: 1px solid #e6e6e6;
347 |  border-radius: 2px;
348 |  display: block;
349 |  font-size: 0.8667em;
350 |  line-height: 32px;
351 |  padding: 0 12px;
352 | }
353 | .hatena-module-category .hatena-urllist li a:hover {
354 |  background-color: #f6f6f6;
355 |  color: #333;
356 | }
357 | */


--------------------------------------------------------------------------------
/recommendation/graph/ml-latest-small/README.txt:
--------------------------------------------------------------------------------
  1 | Summary
  2 | =======
  3 | 
  4 | This dataset (ml-latest-small) describes 5-star rating and free-text tagging activity from [MovieLens](http://movielens.org), a movie recommendation service. It contains 100836 ratings and 3683 tag applications across 9742 movies. These data were created by 610 users between March 29, 1996 and September 24, 2018. This dataset was generated on September 26, 2018.
  5 | 
  6 | Users were selected at random for inclusion. All selected users had rated at least 20 movies. No demographic information is included. Each user is represented by an id, and no other information is provided.
  7 | 
  8 | The data are contained in the files `links.csv`, `movies.csv`, `ratings.csv` and `tags.csv`. More details about the contents and use of all these files follows.
  9 | 
 10 | This is a *development* dataset. As such, it may change over time and is not an appropriate dataset for shared research results. See available *benchmark* datasets if that is your intent.
 11 | 
 12 | This and other GroupLens data sets are publicly available for download at <http://grouplens.org/datasets/>.
 13 | 
 14 | 
 15 | Usage License
 16 | =============
 17 | 
 18 | Neither the University of Minnesota nor any of the researchers involved can guarantee the correctness of the data, its suitability for any particular purpose, or the validity of results based on the use of the data set. The data set may be used for any research purposes under the following conditions:
 19 | 
 20 | * The user may not state or imply any endorsement from the University of Minnesota or the GroupLens Research Group.
 21 | * The user must acknowledge the use of the data set in publications resulting from the use of the data set (see below for citation information).
 22 | * The user may redistribute the data set, including transformations, so long as it is distributed under these same license conditions.
 23 | * The user may not use this information for any commercial or revenue-bearing purposes without first obtaining permission from a faculty member of the GroupLens Research Project at the University of Minnesota.
 24 | * The executable software scripts are provided "as is" without warranty of any kind, either expressed or implied, including, but not limited to, the implied warranties of merchantability and fitness for a particular purpose. The entire risk as to the quality and performance of them is with you. Should the program prove defective, you assume the cost of all necessary servicing, repair or correction.
 25 | 
 26 | In no event shall the University of Minnesota, its affiliates or employees be liable to you for any damages arising out of the use or inability to use these programs (including but not limited to loss of data or data being rendered inaccurate).
 27 | 
 28 | If you have any further questions or comments, please email <grouplens-info@umn.edu>
 29 | 
 30 | 
 31 | Citation
 32 | ========
 33 | 
 34 | To acknowledge use of the dataset in publications, please cite the following paper:
 35 | 
 36 | > F. Maxwell Harper and Joseph A. Konstan. 2015. The MovieLens Datasets: History and Context. ACM Transactions on Interactive Intelligent Systems (TiiS) 5, 4: 19:1–19:19. <https://doi.org/10.1145/2827872>
 37 | 
 38 | 
 39 | Further Information About GroupLens
 40 | ===================================
 41 | 
 42 | GroupLens is a research group in the Department of Computer Science and Engineering at the University of Minnesota. Since its inception in 1992, GroupLens's research projects have explored a variety of fields including:
 43 | 
 44 | * recommender systems
 45 | * online communities
 46 | * mobile and ubiquitious technologies
 47 | * digital libraries
 48 | * local geographic information systems
 49 | 
 50 | GroupLens Research operates a movie recommender based on collaborative filtering, MovieLens, which is the source of these data. We encourage you to visit <http://movielens.org> to try it out! If you have exciting ideas for experimental work to conduct on MovieLens, send us an email at <grouplens-info@cs.umn.edu> - we are always interested in working with external collaborators.
 51 | 
 52 | 
 53 | Content and Use of Files
 54 | ========================
 55 | 
 56 | Formatting and Encoding
 57 | -----------------------
 58 | 
 59 | The dataset files are written as [comma-separated values](http://en.wikipedia.org/wiki/Comma-separated_values) files with a single header row. Columns that contain commas (`,`) are escaped using double-quotes (`"`). These files are encoded as UTF-8. If accented characters in movie titles or tag values (e.g. Misérables, Les (1995)) display incorrectly, make sure that any program reading the data, such as a text editor, terminal, or script, is configured for UTF-8.
 60 | 
 61 | 
 62 | User Ids
 63 | --------
 64 | 
 65 | MovieLens users were selected at random for inclusion. Their ids have been anonymized. User ids are consistent between `ratings.csv` and `tags.csv` (i.e., the same id refers to the same user across the two files).
 66 | 
 67 | 
 68 | Movie Ids
 69 | ---------
 70 | 
 71 | Only movies with at least one rating or tag are included in the dataset. These movie ids are consistent with those used on the MovieLens web site (e.g., id `1` corresponds to the URL <https://movielens.org/movies/1>). Movie ids are consistent between `ratings.csv`, `tags.csv`, `movies.csv`, and `links.csv` (i.e., the same id refers to the same movie across these four data files).
 72 | 
 73 | 
 74 | Ratings Data File Structure (ratings.csv)
 75 | -----------------------------------------
 76 | 
 77 | All ratings are contained in the file `ratings.csv`. Each line of this file after the header row represents one rating of one movie by one user, and has the following format:
 78 | 
 79 |     userId,movieId,rating,timestamp
 80 | 
 81 | The lines within this file are ordered first by userId, then, within user, by movieId.
 82 | 
 83 | Ratings are made on a 5-star scale, with half-star increments (0.5 stars - 5.0 stars).
 84 | 
 85 | Timestamps represent seconds since midnight Coordinated Universal Time (UTC) of January 1, 1970.
 86 | 
 87 | 
 88 | Tags Data File Structure (tags.csv)
 89 | -----------------------------------
 90 | 
 91 | All tags are contained in the file `tags.csv`. Each line of this file after the header row represents one tag applied to one movie by one user, and has the following format:
 92 | 
 93 |     userId,movieId,tag,timestamp
 94 | 
 95 | The lines within this file are ordered first by userId, then, within user, by movieId.
 96 | 
 97 | Tags are user-generated metadata about movies. Each tag is typically a single word or short phrase. The meaning, value, and purpose of a particular tag is determined by each user.
 98 | 
 99 | Timestamps represent seconds since midnight Coordinated Universal Time (UTC) of January 1, 1970.
100 | 
101 | 
102 | Movies Data File Structure (movies.csv)
103 | ---------------------------------------
104 | 
105 | Movie information is contained in the file `movies.csv`. Each line of this file after the header row represents one movie, and has the following format:
106 | 
107 |     movieId,title,genres
108 | 
109 | Movie titles are entered manually or imported from <https://www.themoviedb.org/>, and include the year of release in parentheses. Errors and inconsistencies may exist in these titles.
110 | 
111 | Genres are a pipe-separated list, and are selected from the following:
112 | 
113 | * Action
114 | * Adventure
115 | * Animation
116 | * Children's
117 | * Comedy
118 | * Crime
119 | * Documentary
120 | * Drama
121 | * Fantasy
122 | * Film-Noir
123 | * Horror
124 | * Musical
125 | * Mystery
126 | * Romance
127 | * Sci-Fi
128 | * Thriller
129 | * War
130 | * Western
131 | * (no genres listed)
132 | 
133 | 
134 | Links Data File Structure (links.csv)
135 | ---------------------------------------
136 | 
137 | Identifiers that can be used to link to other sources of movie data are contained in the file `links.csv`. Each line of this file after the header row represents one movie, and has the following format:
138 | 
139 |     movieId,imdbId,tmdbId
140 | 
141 | movieId is an identifier for movies used by <https://movielens.org>. E.g., the movie Toy Story has the link <https://movielens.org/movies/1>.
142 | 
143 | imdbId is an identifier for movies used by <http://www.imdb.com>. E.g., the movie Toy Story has the link <http://www.imdb.com/title/tt0114709/>.
144 | 
145 | tmdbId is an identifier for movies used by <https://www.themoviedb.org>. E.g., the movie Toy Story has the link <https://www.themoviedb.org/movie/862>.
146 | 
147 | Use of the resources listed above is subject to the terms of each provider.
148 | 
149 | 
150 | Cross-Validation
151 | ----------------
152 | 
153 | Prior versions of the MovieLens dataset included either pre-computed cross-folds or scripts to perform this computation. We no longer bundle either of these features with the dataset, since most modern toolkits provide this as a built-in feature. If you wish to learn about standard approaches to cross-fold computation in the context of recommender systems evaluation, see [LensKit](http://lenskit.org) for tools, documentation, and open-source code examples.
154 | 


--------------------------------------------------------------------------------
/recommendation/matrix_factorization/data/ml-25m/README.txt:
--------------------------------------------------------------------------------
  1 | Summary
  2 | =======
  3 | 
  4 | This dataset (ml-25m) describes 5-star rating and free-text tagging activity from [MovieLens](http://movielens.org), a movie recommendation service. It contains 25000095 ratings and 1093360 tag applications across 62423 movies. These data were created by 162541 users between January 09, 1995 and November 21, 2019. This dataset was generated on November 21, 2019.
  5 | 
  6 | Users were selected at random for inclusion. All selected users had rated at least 20 movies. No demographic information is included. Each user is represented by an id, and no other information is provided.
  7 | 
  8 | The data are contained in the files `genome-scores.csv`, `genome-tags.csv`, `links.csv`, `movies.csv`, `ratings.csv` and `tags.csv`. More details about the contents and use of all these files follows.
  9 | 
 10 | This and other GroupLens data sets are publicly available for download at <http://grouplens.org/datasets/>.
 11 | 
 12 | 
 13 | Usage License
 14 | =============
 15 | 
 16 | Neither the University of Minnesota nor any of the researchers involved can guarantee the correctness of the data, its suitability for any particular purpose, or the validity of results based on the use of the data set. The data set may be used for any research purposes under the following conditions:
 17 | 
 18 | * The user may not state or imply any endorsement from the University of Minnesota or the GroupLens Research Group.
 19 | * The user must acknowledge the use of the data set in publications resulting from the use of the data set (see below for citation information).
 20 | * The user may not redistribute the data without separate permission.
 21 | * The user may not use this information for any commercial or revenue-bearing purposes without first obtaining permission from a faculty member of the GroupLens Research Project at the University of Minnesota.
 22 | * The executable software scripts are provided "as is" without warranty of any kind, either expressed or implied, including, but not limited to, the implied warranties of merchantability and fitness for a particular purpose. The entire risk as to the quality and performance of them is with you. Should the program prove defective, you assume the cost of all necessary servicing, repair or correction.
 23 | 
 24 | In no event shall the University of Minnesota, its affiliates or employees be liable to you for any damages arising out of the use or inability to use these programs (including but not limited to loss of data or data being rendered inaccurate).
 25 | 
 26 | If you have any further questions or comments, please email <grouplens-info@umn.edu>
 27 | 
 28 | 
 29 | Citation
 30 | ========
 31 | 
 32 | To acknowledge use of the dataset in publications, please cite the following paper:
 33 | 
 34 | > F. Maxwell Harper and Joseph A. Konstan. 2015. The MovieLens Datasets: History and Context. ACM Transactions on Interactive Intelligent Systems (TiiS) 5, 4: 19:1–19:19. <https://doi.org/10.1145/2827872>
 35 | 
 36 | 
 37 | Further Information About GroupLens
 38 | ===================================
 39 | 
 40 | GroupLens is a research group in the Department of Computer Science and Engineering at the University of Minnesota. Since its inception in 1992, GroupLens's research projects have explored a variety of fields including:
 41 | 
 42 | * recommender systems
 43 | * online communities
 44 | * mobile and ubiquitious technologies
 45 | * digital libraries
 46 | * local geographic information systems
 47 | 
 48 | GroupLens Research operates a movie recommender based on collaborative filtering, MovieLens, which is the source of these data. We encourage you to visit <http://movielens.org> to try it out! If you have exciting ideas for experimental work to conduct on MovieLens, send us an email at <grouplens-info@cs.umn.edu> - we are always interested in working with external collaborators.
 49 | 
 50 | 
 51 | Content and Use of Files
 52 | ========================
 53 | 
 54 | Verifying the Dataset Contents
 55 | ------------------------------
 56 | 
 57 | We encourage you to verify that the dataset you have on your computer is identical to the ones hosted at [grouplens.org](http://grouplens.org).  This is an important step if you downloaded the dataset from a location other than [grouplens.org](http://grouplens.org), or if you wish to publish research results based on analysis of the MovieLens dataset.
 58 | 
 59 | We provide a [MD5 checksum](http://en.wikipedia.org/wiki/Md5sum) with the same name as the downloadable `.zip` file, but with a `.md5` file extension. To verify the dataset:
 60 | 
 61 |     # on linux
 62 |     md5sum ml-25m.zip; cat ml-25m.zip.md5
 63 | 
 64 |     # on OSX
 65 |     md5 ml-25m.zip; cat ml-25m.zip.md5
 66 | 
 67 |     # windows users can download a tool from Microsoft (or elsewhere) that verifies MD5 checksums
 68 | 
 69 | Check that the two lines of output contain the same hash value.
 70 | 
 71 | 
 72 | Formatting and Encoding
 73 | -----------------------
 74 | 
 75 | The dataset files are written as [comma-separated values](http://en.wikipedia.org/wiki/Comma-separated_values) files with a single header row. Columns that contain commas (`,`) are escaped using double-quotes (`"`). These files are encoded as UTF-8. If accented characters in movie titles or tag values (e.g. Misérables, Les (1995)) display incorrectly, make sure that any program reading the data, such as a text editor, terminal, or script, is configured for UTF-8.
 76 | 
 77 | 
 78 | User Ids
 79 | --------
 80 | 
 81 | MovieLens users were selected at random for inclusion. Their ids have been anonymized. User ids are consistent between `ratings.csv` and `tags.csv` (i.e., the same id refers to the same user across the two files).
 82 | 
 83 | 
 84 | Movie Ids
 85 | ---------
 86 | 
 87 | Only movies with at least one rating or tag are included in the dataset. These movie ids are consistent with those used on the MovieLens web site (e.g., id `1` corresponds to the URL <https://movielens.org/movies/1>). Movie ids are consistent between `ratings.csv`, `tags.csv`, `movies.csv`, and `links.csv` (i.e., the same id refers to the same movie across these four data files).
 88 | 
 89 | 
 90 | Ratings Data File Structure (ratings.csv)
 91 | -----------------------------------------
 92 | 
 93 | All ratings are contained in the file `ratings.csv`. Each line of this file after the header row represents one rating of one movie by one user, and has the following format:
 94 | 
 95 |     userId,movieId,rating,timestamp
 96 | 
 97 | The lines within this file are ordered first by userId, then, within user, by movieId.
 98 | 
 99 | Ratings are made on a 5-star scale, with half-star increments (0.5 stars - 5.0 stars).
100 | 
101 | Timestamps represent seconds since midnight Coordinated Universal Time (UTC) of January 1, 1970.
102 | 
103 | 
104 | Tags Data File Structure (tags.csv)
105 | -----------------------------------
106 | 
107 | All tags are contained in the file `tags.csv`. Each line of this file after the header row represents one tag applied to one movie by one user, and has the following format:
108 | 
109 |     userId,movieId,tag,timestamp
110 | 
111 | The lines within this file are ordered first by userId, then, within user, by movieId.
112 | 
113 | Tags are user-generated metadata about movies. Each tag is typically a single word or short phrase. The meaning, value, and purpose of a particular tag is determined by each user.
114 | 
115 | Timestamps represent seconds since midnight Coordinated Universal Time (UTC) of January 1, 1970.
116 | 
117 | 
118 | Movies Data File Structure (movies.csv)
119 | ---------------------------------------
120 | 
121 | Movie information is contained in the file `movies.csv`. Each line of this file after the header row represents one movie, and has the following format:
122 | 
123 |     movieId,title,genres
124 | 
125 | Movie titles are entered manually or imported from <https://www.themoviedb.org/>, and include the year of release in parentheses. Errors and inconsistencies may exist in these titles.
126 | 
127 | Genres are a pipe-separated list, and are selected from the following:
128 | 
129 | * Action
130 | * Adventure
131 | * Animation
132 | * Children's
133 | * Comedy
134 | * Crime
135 | * Documentary
136 | * Drama
137 | * Fantasy
138 | * Film-Noir
139 | * Horror
140 | * Musical
141 | * Mystery
142 | * Romance
143 | * Sci-Fi
144 | * Thriller
145 | * War
146 | * Western
147 | * (no genres listed)
148 | 
149 | 
150 | Links Data File Structure (links.csv)
151 | ---------------------------------------
152 | 
153 | Identifiers that can be used to link to other sources of movie data are contained in the file `links.csv`. Each line of this file after the header row represents one movie, and has the following format:
154 | 
155 |     movieId,imdbId,tmdbId
156 | 
157 | movieId is an identifier for movies used by <https://movielens.org>. E.g., the movie Toy Story has the link <https://movielens.org/movies/1>.
158 | 
159 | imdbId is an identifier for movies used by <http://www.imdb.com>. E.g., the movie Toy Story has the link <http://www.imdb.com/title/tt0114709/>.
160 | 
161 | tmdbId is an identifier for movies used by <https://www.themoviedb.org>. E.g., the movie Toy Story has the link <https://www.themoviedb.org/movie/862>.
162 | 
163 | Use of the resources listed above is subject to the terms of each provider.
164 | 
165 | 
166 | Tag Genome (genome-scores.csv and genome-tags.csv)
167 | -------------------------------------------------
168 | 
169 | This data set includes a current copy of the Tag Genome.
170 | 
171 | [genome-paper]: http://files.grouplens.org/papers/tag_genome.pdf
172 | 
173 | The tag genome is a data structure that contains tag relevance scores for movies.  The structure is a dense matrix: each movie in the genome has a value for *every* tag in the genome.
174 | 
175 | As described in [this article][genome-paper], the tag genome encodes how strongly movies exhibit particular properties represented by tags (atmospheric, thought-provoking, realistic, etc.). The tag genome was computed using a machine learning algorithm on user-contributed content including tags, ratings, and textual reviews.
176 | 
177 | The genome is split into two files.  The file `genome-scores.csv` contains movie-tag relevance data in the following format:
178 | 
179 |     movieId,tagId,relevance
180 | 
181 | The second file, `genome-tags.csv`, provides the tag descriptions for the tag IDs in the genome file, in the following format:
182 | 
183 |     tagId,tag
184 | 
185 | The `tagId` values are generated when the data set is exported, so they may vary from version to version of the MovieLens data sets.
186 | 
187 | Please include the following citation if referencing tag genome data:
188 | 
189 | > Jesse Vig, Shilad Sen, and John Riedl. 2012. The Tag Genome: Encoding Community Knowledge to Support Novel Interaction. ACM Trans. Interact. Intell. Syst. 2, 3: 13:1–13:44. <https://doi.org/10.1145/2362394.2362395>
190 | 
191 | 
192 | Cross-Validation
193 | ----------------
194 | 
195 | Prior versions of the MovieLens dataset included either pre-computed cross-folds or scripts to perform this computation. We no longer bundle either of these features with the dataset, since most modern toolkits provide this as a built-in feature. If you wish to learn about standard approaches to cross-fold computation in the context of recommender systems evaluation, see [LensKit](http://lenskit.org) for tools, documentation, and open-source code examples.
196 | 


--------------------------------------------------------------------------------
/streamlit/sample.py:
--------------------------------------------------------------------------------
 1 | import streamlit as st
 2 | import pandas as pd
 3 | import numpy as np
 4 | 
 5 | st.title('streamlitのサンプルだお')
 6 | 
 7 | DATE_COLUMN = 'date/time'
 8 | DATA_URL = ('https://s3-us-west-2.amazonaws.com/'
 9 |          'streamlit-demo-data/uber-raw-data-sep14.csv.gz')
10 | 
11 | 
12 | @st.cache
13 | def load_data(nrows):
14 |     data = pd.read_csv(DATA_URL, nrows=nrows)
15 |     lowercase = lambda x: str(x).lower()
16 |     data.rename(lowercase, axis='columns', inplace=True)
17 |     data[DATE_COLUMN] = pd.to_datetime(data[DATE_COLUMN])
18 |     return data
19 | 
20 | # Create a text element and let the reader know the data is loading.
21 | data_load_state = st.text('Loading data...')
22 | # Load 10,000 rows of data into the dataframe.
23 | data = load_data(10000)
24 | # Notify the reader that the data was successfully loaded.
25 | data_load_state.text('Loading data...done!')
26 | 
27 | if st.checkbox('Show raw data'):
28 |     st.subheader('Raw data')
29 |     st.write(data)
30 | 
31 | 
32 | 
33 | st.subheader('Number of pickups by hour')
34 | hist_values = np.histogram(data[DATE_COLUMN].dt.hour, bins=24, range=(0,24))[0]
35 | st.bar_chart(hist_values)
36 | 
37 | 
38 | 
39 | # Some number in the range 0-23
40 | hour_to_filter = st.slider('hour', 0, 23, 17)
41 | filtered_data = data[data[DATE_COLUMN].dt.hour == hour_to_filter]
42 | 
43 | st.write(hour_to_filter)
44 | 
45 | st.text('This is some text.')
46 | 
47 | #ボタン処理
48 | if st.button('ボタンの処理も作れる'):
49 |     #ボタン押された
50 |     st.write('Why hello there')
51 | else:
52 |     st.write('Goodbye')
53 | 
54 | #テキスト入力欄も作れるよ
55 | st.text_area('labelだお', value="")


--------------------------------------------------------------------------------