├── .travis.yml
├── LICENSE
├── README.md
├── composer.json
├── composer.lock
├── lib
└── TextRank
│ ├── Config.php
│ ├── DefaultEvents.php
│ ├── POS
│ └── English
│ │ ├── Tagger.php
│ │ ├── generate.php
│ │ ├── lexicon.php
│ │ └── lexicon.txt
│ ├── Stopword.php
│ ├── Stopword
│ ├── Stopword.php
│ ├── czech-stopwords.txt
│ ├── danish-stopwords.txt
│ ├── dutch-stopwords.txt
│ ├── english-stopwords.txt
│ ├── finnish-stopwords.txt
│ ├── french-stopwords.txt
│ ├── generate.php
│ ├── german-stopwords.txt
│ ├── hungarian-stopwords.txt
│ ├── italian-stopwords.txt
│ ├── norwegian-stopwords.txt
│ ├── polish-stopwords.txt
│ ├── portuguese-stopwords.txt
│ ├── russian-stopwords.txt
│ ├── spanish-stopwords.txt
│ ├── swedish-stopwords.txt
│ └── turkish-stopwords.txt
│ ├── Summary.php
│ ├── SummaryPageRank.php
│ ├── TextRank.php
│ └── language-profile.php
├── phpunit.xml
└── tests
├── QuickTest.php
├── bootstrap.php
└── fixtures
├── english1.expected
├── english1.summary
├── english1.txt
├── italian.expected
├── italian.summary
├── italian.txt
├── spanish1.expected
├── spanish1.summary
└── spanish1.txt
/.travis.yml:
--------------------------------------------------------------------------------
1 | language: php
2 | script: phpunit tests
3 |
4 | php:
5 | - 5.4
6 | - 5.5
7 |
8 | before_script:
9 | - php -i
10 | - curl -sS https://getcomposer.org/installer | php
11 | - php composer.phar install
12 |
--------------------------------------------------------------------------------
/LICENSE:
--------------------------------------------------------------------------------
1 | Copyright (c) 2013, César D. Rodas
2 | All rights reserved.
3 |
4 | Redistribution and use in source and binary forms, with or without modification,
5 | are permitted provided that the following conditions are met:
6 |
7 | * Redistributions of source code must retain the above copyright notice, this
8 | list of conditions and the following disclaimer.
9 |
10 | * Redistributions in binary form must reproduce the above copyright notice, this
11 | list of conditions and the following disclaimer in the documentation and/or
12 | other materials provided with the distribution.
13 |
14 | * Neither the name of the {organization} nor the names of its
15 | contributors may be used to endorse or promote products derived from
16 | this software without specific prior written permission.
17 |
18 | THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" AND
19 | ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED
20 | WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
21 | DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR CONTRIBUTORS BE LIABLE FOR
22 | ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES
23 | (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES;
24 | LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON
25 | ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
26 | (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
27 | SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
28 |
--------------------------------------------------------------------------------
/README.md:
--------------------------------------------------------------------------------
1 | TextRank [![Build Status](https://travis-ci.org/crodas/TextRank.png)](https://travis-ci.org/crodas/TextRank)
2 | ========
3 |
4 | Extract relevant keywords from a given text.
5 |
6 |
7 | How to use it
8 | -------------
9 |
10 | In order to use the class, you must instantiate a `Config` object.
11 |
12 |
13 | ```php
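14 | <?php
15 |
16 | require "vendor/autoload.php";
17 |
18 | use crodas\TextRank\Config;
19 | use crodas\TextRank\TextRank;
20 |
21 | $config = new Config;
22 |
23 | $textrank = new TextRank($config);
24 | $keywords = $textrank->getKeywords($some_long_text);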
25 |
26 | var_dump($keywords);
27 |
28 | ```
29 |
30 | It is possible to get better results by adding some information about the language (a `stopword` list, and a `stemmer` installed with `pecl install stem`).
31 |
32 |
33 | ```php
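34 | <?php
35 |
36 | require "vendor/autoload.php";
37 |
38 | use crodas\TextRank\Config;
39 | use crodas\TextRank\TextRank;
40 | use crodas\TextRank\Stopword;
41 |
42 | $config = new Config;
43 | $config->addListener(new Stopword);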
44 |
45 | $textrank = new TextRank($config);
46 | $keywords = $textrank->getKeywords($some_long_text);
47 |
48 | var_dump($keywords);
49 |
50 | ```
51 | By doing this it will detect the language of the text and will remove common words (from the stopword list). If `ext-stem` is available the results will be even better.
52 |
53 |
54 | Summarize large texts
55 | ---------------------
56 |
57 | This class is also capable of summarizing long texts
58 |
59 | ```php
60 | $config = new \crodas\TextRank\Config;
61 | $config->addListener(new \crodas\TextRank\Stopword);
62 | $analyzer = new \crodas\TextRank\Summary($config);
63 | $summary = $analyzer->getSummary($text);
64 | ```
65 |
66 | `$summary` is at most 5% of the sentences of the text.
67 |
--------------------------------------------------------------------------------
/composer.json:
--------------------------------------------------------------------------------
1 | {
2 | "name": "crodas/text-rank",
3 | "description": "Extract relevant keywords from a given text",
4 | "require": {
5 | "ext-mbstring": "*",
6 | "crodas/languagedetector": "~0.1"
7 | },
8 | "suggest": {
9 | "ext-stem": "Improves keywords selection"
10 | },
11 | "authors": [
12 | {
13 | "name": "César D. Rodas",
14 | "email": "crodas@php.net"
15 | }
16 | ],
17 | "minimum-stability": "dev",
18 | "autoload": {
19 | "classmap":["lib/"]
20 | }
21 | }
22 |
--------------------------------------------------------------------------------
/composer.lock:
--------------------------------------------------------------------------------
1 | {
2 | "_readme": [
3 | "This file locks the dependencies of your project to a known state",
4 | "Read more about it at http://getcomposer.org/doc/01-basic-usage.md#composer-lock-the-lock-file"
5 | ],
6 | "hash": "8d372775f7c62aeef298600677e8e4ed",
7 | "packages": [
8 | {
9 | "name": "crodas/languagedetector",
10 | "version": "v0.1.1",
11 | "source": {
12 | "type": "git",
13 | "url": "https://github.com/crodas/LanguageDetector.git",
14 | "reference": "07aa8bb806cb71fe4e4352c12232a5c74bf416ed"
15 | },
16 | "dist": {
17 | "type": "zip",
18 | "url": "https://api.github.com/repos/crodas/LanguageDetector/zipball/07aa8bb806cb71fe4e4352c12232a5c74bf416ed",
19 | "reference": "07aa8bb806cb71fe4e4352c12232a5c74bf416ed",
20 | "shasum": ""
21 | },
22 | "require-dev": {
23 | "crodas/autoloader": "~0.1"
24 | },
25 | "type": "library",
26 | "autoload": {
27 | "psr-0": {
28 | "LanguageDetector": "lib/"
29 | }
30 | },
31 | "notification-url": "https://packagist.org/downloads/",
32 | "license": [
33 | "BSD-4-Clause"
34 | ],
35 | "authors": [
36 | {
37 | "name": "César D. Rodas",
38 | "email": "crodas@php.net"
39 | }
40 | ],
41 | "description": "simple library to classify texts",
42 | "time": "2013-11-06 01:26:03"
43 | }
44 | ],
45 | "packages-dev": [
46 |
47 | ],
48 | "aliases": [
49 |
50 | ],
51 | "minimum-stability": "dev",
52 | "stability-flags": [
53 |
54 | ],
55 | "platform": {
56 | "ext-mbstring": "*"
57 | },
58 | "platform-dev": [
59 |
60 | ]
61 | }
62 |
--------------------------------------------------------------------------------
/lib/TextRank/Config.php:
--------------------------------------------------------------------------------
1 | |
35 | +---------------------------------------------------------------------------------+
36 | */
37 | namespace crodas\TextRank;
38 |
/**
 * Event registry used to customise each processing step.
 *
 * Handlers come from two sources, consulted in this order by trigger():
 *  1. closures registered with on(), in registration order;
 *  2. listener objects, most recently added first, with the DefaultEvents
 *     instance created by the constructor always last.
 */
class Config
{
    /** @var array event name => list of closures registered through on() */
    protected $events = array();

    /** @var array listener objects whose public methods are named after events */
    protected $listeners = array();

    /**
     * Installs DefaultEvents as the last-resort listener.
     */
    public function __construct()
    {
        $this->listeners[] = new DefaultEvents;
    }

    /**
     * Registers a closure for an event.
     *
     * The closures are stored in $events, the same property trigger() reads.
     * The type hint is fully qualified so that it names the built-in Closure
     * class rather than a class inside this namespace.
     *
     * @param string   $event    event name, e.g. "get_words"
     * @param \Closure $callback receives the event data, returns the result
     *
     * @return $this
     */
    public function on($event, \Closure $callback)
    {
        if (empty($this->events[$event])) {
            $this->events[$event] = [];
        }
        $this->events[$event][] = $callback;
        return $this;
    }

    /**
     * Adds a listener object that takes precedence over the ones already added.
     *
     * @param object $object any object exposing public methods named after events
     *
     * @return $this
     */
    public function addListener($object)
    {
        array_unshift($this->listeners, $object);
        return $this;
    }

    /**
     * Runs the handlers of an event until one of them produces a result.
     *
     * A handler that returns an empty value (as defined by empty()) is treated
     * as having declined, and the next handler is tried.
     *
     * @param string $ev   event name
     * @param mixed  $data payload passed to each handler
     *
     * @return mixed the first non-empty handler result
     *
     * @throws \RuntimeException when no handler returned a non-empty value
     */
    public function trigger($ev, $data)
    {
        if (!empty($this->events[$ev])) {
            foreach ($this->events[$ev] as $callback) {
                $output = $callback($data);
                if (!empty($output)) {
                    return $output;
                }
            }
        }

        foreach ($this->listeners as $object) {
            $callback = array($object, $ev);
            if (is_callable($callback)) {
                $output = $object->$ev($data);
                if (!empty($output)) {
                    return $output;
                }
            }
        }

        throw new \RuntimeException("There was no handler for {$ev}");
    }
}
88 |
--------------------------------------------------------------------------------
/lib/TextRank/DefaultEvents.php:
--------------------------------------------------------------------------------
1 | |
35 | +---------------------------------------------------------------------------------+
36 | */
37 | namespace crodas\TextRank;
38 |
/**
 * Language-agnostic default handlers for the TextRank events.
 *
 * Each public method is named after the event it handles.
 */
class DefaultEvents
{
    /**
     * Lower-cases every keyword.
     *
     * @param array $keywords list of words
     *
     * @return array the same keys, with lower-cased values
     */
    public function normalize_keywords(array $keywords)
    {
        return array_map(function ($keyword) {
            return mb_strtolower($keyword);
        }, $keywords);
    }

    /**
     * Drops words that cannot be keywords.
     *
     * Rejected: empty strings and numeric strings. Kept: words whose first
     * character is unchanged by upper-casing (capitalised words, and words
     * starting with a digit or symbol) and words longer than three
     * characters. The first character is taken with mb_substr() so that a
     * multibyte initial such as "É" is compared as a whole character.
     *
     * @param array $keywords list of words
     *
     * @return array the surviving words, original keys preserved
     */
    public function filter_keywords(array $keywords)
    {
        return array_filter($keywords, function ($keyword) {
            if ($keyword === '' || is_numeric($keyword)) {
                return false;
            }

            $initial = mb_substr($keyword, 0, 1);
            if ($initial === mb_strtoupper($initial)) {
                return true;
            }

            return mb_strlen($keyword) > 3;
        });
    }

    /**
     * Splits a text on runs of newlines and on a full stop followed by a
     * non-word character.
     *
     * Captured delimiters are part of the result once trimmed, so a "."
     * separator appears as its own element.
     *
     * @param string $text
     *
     * @return array list of non-empty trimmed pieces
     *
     * @throws \RuntimeException when the text cannot be split
     */
    public function get_sentences($text)
    {
        return self::splitText('/(\n+)|(\\.\W)/', $text);
    }

    /**
     * Splits a text into words on whitespace and on the punctuation attached
     * to it, as well as on leading and trailing punctuation.
     *
     * Captured delimiters are part of the result once trimmed, so
     * punctuation shows up as separate elements.
     *
     * @param string $text
     *
     * @return array list of non-empty trimmed pieces
     *
     * @throws \RuntimeException when the text cannot be split
     */
    public function get_words($text)
    {
        return self::splitText('/(?:(^\p{P}+)|(\p{P}*\s+\p{P}*)|(\p{P}+$))/', $text);
    }

    /**
     * Runs preg_split() in UTF-8 mode and cleans up the pieces.
     *
     * Without the "u" modifier the pattern is applied byte by byte, which can
     * cut a multibyte character in half when one of its bytes looks like
     * punctuation. Text that is not valid UTF-8 makes the UTF-8 attempt fail,
     * in which case the byte-wise pattern is used instead.
     *
     * @param string $pattern delimited pattern without modifiers
     * @param string $text
     *
     * @return array
     *
     * @throws \RuntimeException when both attempts fail
     */
    private static function splitText($pattern, $text)
    {
        $flags = PREG_SPLIT_NO_EMPTY | PREG_SPLIT_DELIM_CAPTURE;

        $pieces  = preg_split($pattern . 'u', $text, -1, $flags);
        $unicode = $pieces !== false;
        if (!$unicode) {
            $pieces = preg_split($pattern, $text, -1, $flags);
        }
        if ($pieces === false) {
            throw new \RuntimeException('Unable to split the text (PCRE error ' . preg_last_error() . ')');
        }

        $clean = array();
        foreach ($pieces as $piece) {
            $piece = trim($piece);
            if ($unicode) {
                // trim() only knows ASCII whitespace; in UTF-8 mode \s can
                // also capture characters such as a no-break space.
                $piece = preg_replace('/^\s+|\s+$/u', '', $piece);
            }
            // Same truthiness test as array_filter() without a callback.
            if ((bool) $piece) {
                $clean[] = $piece;
            }
        }

        return $clean;
    }
}
75 |
--------------------------------------------------------------------------------
/lib/TextRank/POS/English/Tagger.php:
--------------------------------------------------------------------------------
1 | |
35 | +---------------------------------------------------------------------------------+
36 | */
37 | namespace crodas\TextRank\POS\English;
38 |
39 |
40 | /**
41 | * POS Tagger borrowed from
42 | * http://phpir.com/part-of-speech-tagging
43 | */
class Tagger
{
    /**
     * Returns the tokens tagged as noun, adjective, proper noun or plural
     * noun (NN, JJ, NNP, NNS), keeping the keys of the input array.
     *
     * @param array $words list of tokens
     *
     * @return array key => token
     */
    public static function get(Array $words)
    {
        $selected = [];
        foreach (self::tag($words) as $key => $entry) {
            switch ($entry['tag']) {
                case 'NN':
                case 'JJ':
                case 'NNP':
                case 'NNS':
                    $selected[$key] = $entry['token'];
                    break;
            }
        }

        return $selected;
    }

    /**
     * Tags every token with a part-of-speech code.
     *
     * Each token starts as 'NN', takes the first tag listed for it in
     * lexicon.php when present, and then goes through a fixed sequence of
     * correction rules. The rules are order-sensitive: later ones see the
     * tag written by earlier ones.
     *
     * @param array $words list of tokens
     *
     * @return array key => ['token' => original token, 'tag' => tag]
     */
    public static function tag(Array $words)
    {
        static $dict;
        if (empty($dict)) {
            $dict = require __DIR__ . '/lexicon.php';
        }

        $nounTags = ['NN', 'NNS'];
        $tagged   = [];
        $previous = null; // entry of the preceding token, null for the first one

        foreach ($words as $key => $word) {
            $tag = 'NN';

            // Rules look at the token without trailing full stops; the
            // returned entry keeps the token exactly as received.
            $bare = $word;
            if (substr($bare, -1) == '.') {
                $bare = preg_replace('/\.+$/', '', $bare);
            }

            // Lexicon lookup
            if (!empty($dict[$bare])) {
                $tag = $dict[$bare][0];
            }

            // A verb right after a determiner becomes a noun
            if ($previous !== null
                && $previous['tag'] == 'DT'
                && in_array($tag, array('VBD', 'VBP', 'VB'))) {
                $tag = 'NN';
            }

            // A noun containing a '.' becomes a number
            if ($tag[0] == 'N' && strpos($bare, '.') !== false) {
                $tag = 'CD';
            }

            // A noun ending in 'ed' becomes a past participle
            if ($tag[0] == 'N' && substr($bare, -2) == 'ed') {
                $tag = 'VBN';
            }

            // Anything ending in 'ly' is an adverb
            if (substr($bare, -2) == 'ly') {
                $tag = 'RB';
            }

            // A common noun ending in 'al' becomes an adjective
            if (in_array($tag, $nounTags) && substr($bare, -2) == 'al') {
                $tag = 'JJ';
            }

            // A noun preceded by 'would' becomes a verb
            if ($previous !== null && $tag == 'NN' && $previous['token'] == 'would') {
                $tag = 'VB';
            }

            // A noun ending in 's' becomes plural
            if ($tag == 'NN' && substr($bare, -1) == 's') {
                $tag = 'NNS';
            }

            // A common noun ending in 'ing' becomes a gerund
            if (in_array($tag, $nounTags) && substr($bare, -3) == 'ing') {
                $tag = 'VBG';
            }

            // Noun after noun: use a verb tag when the lexicon lists one
            if ($previous !== null
                && in_array($tag, $nounTags)
                && in_array($previous['tag'], $nounTags)
                && isset($dict[$bare])) {
                if (in_array('VBN', $dict[$bare])) {
                    $tag = 'VBN';
                } elseif (in_array('VBZ', $dict[$bare])) {
                    $tag = 'VBZ';
                }
            }

            $previous     = ['token' => $word, 'tag' => $tag];
            $tagged[$key] = $previous;
        }

        return $tagged;
    }
}
156 |
--------------------------------------------------------------------------------
/lib/TextRank/POS/English/generate.php:
--------------------------------------------------------------------------------
1 | |
35 | +---------------------------------------------------------------------------------+
36 | */
37 | namespace crodas\TextRank;
38 |
39 | use LanguageDetector\Detect;
40 |
41 | /**
42 | * Data files have been borrowed from
43 | * https://github.com/ekorn/Keywords
44 | */
/**
 * Listener that detects the language of the text and uses it to remove
 * stopwords, to stem keywords when a matching stem_<language>() function is
 * callable, and to keep only the tokens selected by a part-of-speech tagger
 * when a Tagger class exists for that language.
 *
 * The language and its stopword list are set by get_words(), so the other
 * handlers only become language-aware after get_words() has run.
 */
class Stopword extends DefaultEvents
{
    /** @var array|null stopword => 1 map for the detected language */
    protected $stopword;

    /** @var string|null language detected by the last get_words() call */
    protected $lang;

    /**
     * Lower-cases the keywords and stems them when possible.
     *
     * @param array $keywords list of words
     *
     * @return array the same keys, with normalised values
     */
    public function normalize_keywords(Array $keywords)
    {
        $normalized = parent::normalize_keywords($keywords);
        $stemmer    = "stem_{$this->lang}";

        if (!is_callable($stemmer)) {
            return $normalized;
        }

        return array_map(function ($keyword) use ($stemmer) {
            return $stemmer($keyword);
        }, $normalized);
    }

    /**
     * Applies the default filter, then the language tagger when one exists,
     * then removes the stopwords of the detected language.
     *
     * @param array $keywords list of words
     *
     * @return array the surviving words, original keys preserved
     */
    public function filter_keywords(Array $keywords)
    {
        $keywords = parent::filter_keywords($keywords);

        // No language yet means no tagger to look for; this also avoids
        // handing null to ucfirst().
        if ($this->lang !== null) {
            $tagger = __NAMESPACE__ . '\POS\\' . ucfirst($this->lang) . '\Tagger';
            if (class_exists($tagger)) {
                $keywords = $tagger::get($keywords);
            }
        }

        $stopwords = $this->stopword;

        return array_filter($keywords, function ($word) use ($stopwords) {
            return empty($stopwords[mb_strtolower($word)]);
        });
    }

    /**
     * Returns the language detector, loaded once per process from
     * language-profile.php.
     */
    protected function getClassifier()
    {
        static $detect;
        if (empty($detect)) {
            $detect = Detect::initByPath(__DIR__ . '/language-profile.php');
        }
        return $detect;
    }

    /**
     * Returns the stopword lists of every language, loaded once per process
     * from Stopword/Stopword.php.
     */
    protected function getStopwords()
    {
        static $stopwords;
        if (empty($stopwords)) {
            $stopwords = require __DIR__ . '/Stopword/Stopword.php';
        }
        return $stopwords;
    }

    /**
     * Detects the language of the text, remembers it together with its
     * stopword list, and splits the text with the default tokenizer.
     *
     * @param string $text
     *
     * @return array list of words
     *
     * @throws \RuntimeException when the language cannot be detected or has
     *                           no stopword list
     */
    public function get_words($text)
    {
        $detect    = $this->getClassifier();
        $stopwords = $this->getStopwords();
        $lang      = $detect->detect($text);

        if (!is_string($lang)) {
            throw new \RuntimeException("Cannot detect the language of the text");
        }
        if (empty($stopwords[$lang])) {
            throw new \RuntimeException("We dont have an stop word for {$lang}, please add it in " . __DIR__ . "/Stopword/{$lang}-stopwords.txt and run generate.php");
        }

        $this->stopword = $stopwords[$lang];
        $this->lang     = $lang;

        return parent::get_words($text);
    }
}
115 |
--------------------------------------------------------------------------------
/lib/TextRank/Stopword/Stopword.php:
--------------------------------------------------------------------------------
1 |
3 | array (
4 | 'dnes' => 1,
5 | 'cz' => 1,
6 | 'timto' => 1,
7 | 'budes' => 1,
8 | 'budem' => 1,
9 | 'byli' => 1,
10 | 'jses' => 1,
11 | 'muj' => 1,
12 | 'svym' => 1,
13 | 'ta' => 1,
14 | 'tomto' => 1,
15 | 'tohle' => 1,
16 | 'tuto' => 1,
17 | 'tyto' => 1,
18 | 'jej' => 1,
19 | 'zda' => 1,
20 | 'proc' => 1,
21 | 'mate' => 1,
22 | 'tato' => 1,
23 | 'kam' => 1,
24 | 'tohoto' => 1,
25 | 'kdo' => 1,
26 | 'kteri' => 1,
27 | 'mi' => 1,
28 | 'nam' => 1,
29 | 'tom' => 1,
30 | 'tomuto' => 1,
31 | 'mit' => 1,
32 | 'nic' => 1,
33 | 'proto' => 1,
34 | 'kterou' => 1,
35 | 'byla' => 1,
36 | 'toho' => 1,
37 | 'protoze' => 1,
38 | 'asi' => 1,
39 | 'ho' => 1,
40 | 'nasi' => 1,
41 | 'napiste' => 1,
42 | 're' => 1,
43 | 'coz' => 1,
44 | 'tim' => 1,
45 | 'takze' => 1,
46 | 'svych' => 1,
47 | 'jeji' => 1,
48 | 'svymi' => 1,
49 | 'jste' => 1,
50 | 'aj' => 1,
51 | 'tu' => 1,
52 | 'tedy' => 1,
53 | 'teto bylo' => 1,
54 | 'kde' => 1,
55 | 'ke' => 1,
56 | 'prave' => 1,
57 | 'ji' => 1,
58 | 'nad' => 1,
59 | 'nejsou' => 1,
60 | 'ci' => 1,
61 | 'pod' => 1,
62 | 'tema' => 1,
63 | 'mezi' => 1,
64 | 'pres' => 1,
65 | 'ty' => 1,
66 | 'pak' => 1,
67 | 'vam' => 1,
68 | 'ani' => 1,
69 | 'kdyz' => 1,
70 | 'vsak' => 1,
71 | 'ne' => 1,
72 | 'jsem' => 1,
73 | 'tento' => 1,
74 | 'clanku' => 1,
75 | 'clanky' => 1,
76 | 'aby' => 1,
77 | 'jsme' => 1,
78 | 'pred' => 1,
79 | 'pta' => 1,
80 | 'jejich' => 1,
81 | 'byl' => 1,
82 | 'jeste' => 1,
83 | 'az' => 1,
84 | 'bez' => 1,
85 | 'take' => 1,
86 | 'pouze' => 1,
87 | 'prvni' => 1,
88 | 'vase' => 1,
89 | 'ktera' => 1,
90 | 'nas' => 1,
91 | 'novy' => 1,
92 | 'tipy' => 1,
93 | 'pokud' => 1,
94 | 'muze' => 1,
95 | 'design' => 1,
96 | 'strana' => 1,
97 | 'jeho' => 1,
98 | 'sve' => 1,
99 | 'jine' => 1,
100 | 'zpravy' => 1,
101 | 'nove' => 1,
102 | 'neni vas' => 1,
103 | 'jen' => 1,
104 | 'podle' => 1,
105 | 'zde' => 1,
106 | 'clanek' => 1,
107 | 'uz' => 1,
108 | 'email' => 1,
109 | 'byt' => 1,
110 | 'vice' => 1,
111 | 'bude' => 1,
112 | 'jiz' => 1,
113 | 'nez' => 1,
114 | 'ktery' => 1,
115 | 'by' => 1,
116 | 'ktere' => 1,
117 | 'co' => 1,
118 | 'nebo' => 1,
119 | 'ten' => 1,
120 | 'tak' => 1,
121 | 'ma' => 1,
122 | 'pri' => 1,
123 | 'od' => 1,
124 | 'po' => 1,
125 | 'jsou' => 1,
126 | 'jak' => 1,
127 | 'dalsi' => 1,
128 | 'ale' => 1,
129 | 'si' => 1,
130 | 've' => 1,
131 | 'to' => 1,
132 | 'jako' => 1,
133 | 'za' => 1,
134 | 'zpet' => 1,
135 | 'ze' => 1,
136 | 'do' => 1,
137 | 'pro' => 1,
138 | 'je' => 1,
139 | 'na' => 1,
140 | ),
141 | 'danish' =>
142 | array (
143 | 'af' => 1,
144 | 'alle' => 1,
145 | 'andet' => 1,
146 | 'andre' => 1,
147 | 'at' => 1,
148 | 'begge' => 1,
149 | 'da' => 1,
150 | 'de' => 1,
151 | 'den' => 1,
152 | 'denne' => 1,
153 | 'der' => 1,
154 | 'deres' => 1,
155 | 'det' => 1,
156 | 'dette' => 1,
157 | 'dig' => 1,
158 | 'din' => 1,
159 | 'dog' => 1,
160 | 'du' => 1,
161 | 'ej' => 1,
162 | 'eller' => 1,
163 | 'en' => 1,
164 | 'end' => 1,
165 | 'ene' => 1,
166 | 'eneste' => 1,
167 | 'enhver' => 1,
168 | 'et' => 1,
169 | 'fem' => 1,
170 | 'fire' => 1,
171 | 'flere' => 1,
172 | 'fleste' => 1,
173 | 'for' => 1,
174 | 'fordi' => 1,
175 | 'forrige' => 1,
176 | 'fra' => 1,
177 | 'få' => 1,
178 | 'før' => 1,
179 | 'god' => 1,
180 | 'han' => 1,
181 | 'hans' => 1,
182 | 'har' => 1,
183 | 'hendes' => 1,
184 | 'her' => 1,
185 | 'hun' => 1,
186 | 'hvad' => 1,
187 | 'hvem' => 1,
188 | 'hver' => 1,
189 | 'hvilken' => 1,
190 | 'hvis' => 1,
191 | 'hvor' => 1,
192 | 'hvordan' => 1,
193 | 'hvorfor' => 1,
194 | 'hvornår' => 1,
195 | 'i' => 1,
196 | 'ikke' => 1,
197 | 'ind' => 1,
198 | 'ingen' => 1,
199 | 'intet' => 1,
200 | 'jeg' => 1,
201 | 'jeres' => 1,
202 | 'kan' => 1,
203 | 'kom' => 1,
204 | 'kommer' => 1,
205 | 'lav' => 1,
206 | 'lidt' => 1,
207 | 'lille' => 1,
208 | 'man' => 1,
209 | 'mand' => 1,
210 | 'mange' => 1,
211 | 'med' => 1,
212 | 'meget' => 1,
213 | 'men' => 1,
214 | 'mens' => 1,
215 | 'mere' => 1,
216 | 'mig' => 1,
217 | 'ned' => 1,
218 | 'ni' => 1,
219 | 'nogen' => 1,
220 | 'noget' => 1,
221 | 'ny' => 1,
222 | 'nyt' => 1,
223 | 'nær' => 1,
224 | 'næste' => 1,
225 | 'næsten' => 1,
226 | 'og' => 1,
227 | 'op' => 1,
228 | 'otte' => 1,
229 | 'over' => 1,
230 | 'på' => 1,
231 | 'se' => 1,
232 | 'seks' => 1,
233 | 'ses' => 1,
234 | 'som' => 1,
235 | 'stor' => 1,
236 | 'store' => 1,
237 | 'syv' => 1,
238 | 'ti' => 1,
239 | 'til' => 1,
240 | 'to' => 1,
241 | 'tre' => 1,
242 | 'ud' => 1,
243 | 'var' => 1,
244 | ),
245 | 'dutch' =>
246 | array (
247 | 'aan' => 1,
248 | 'af' => 1,
249 | 'al' => 1,
250 | 'als' => 1,
251 | 'bij' => 1,
252 | 'dan' => 1,
253 | 'dat' => 1,
254 | 'die' => 1,
255 | 'dit' => 1,
256 | 'een' => 1,
257 | 'en' => 1,
258 | 'er' => 1,
259 | 'had' => 1,
260 | 'heb' => 1,
261 | 'hem' => 1,
262 | 'het' => 1,
263 | 'hij' => 1,
264 | 'hoe' => 1,
265 | 'hun' => 1,
266 | 'ik' => 1,
267 | 'in' => 1,
268 | 'is' => 1,
269 | 'je' => 1,
270 | 'kan' => 1,
271 | 'me' => 1,
272 | 'men' => 1,
273 | 'met' => 1,
274 | 'mij' => 1,
275 | 'nog' => 1,
276 | 'nu' => 1,
277 | 'of' => 1,
278 | 'ons' => 1,
279 | 'ook' => 1,
280 | 'te' => 1,
281 | 'tot' => 1,
282 | 'uit' => 1,
283 | 'van' => 1,
284 | 'was' => 1,
285 | 'wat' => 1,
286 | 'we' => 1,
287 | 'wel' => 1,
288 | 'wij' => 1,
289 | 'zal' => 1,
290 | 'ze' => 1,
291 | 'zei' => 1,
292 | 'zij' => 1,
293 | 'zo' => 1,
294 | 'zou' => 1,
295 | ),
296 | 'english' =>
297 | array (
298 | 'a' => 1,
299 | 'about' => 1,
300 | 'above' => 1,
301 | 'after' => 1,
302 | 'again' => 1,
303 | 'against' => 1,
304 | 'all' => 1,
305 | 'am' => 1,
306 | 'an' => 1,
307 | 'and' => 1,
308 | 'any' => 1,
309 | 'are' => 1,
310 | 'aren\'t' => 1,
311 | 'as' => 1,
312 | 'at' => 1,
313 | 'be' => 1,
314 | 'because' => 1,
315 | 'been' => 1,
316 | 'before' => 1,
317 | 'being' => 1,
318 | 'below' => 1,
319 | 'between' => 1,
320 | 'both' => 1,
321 | 'but' => 1,
322 | 'by' => 1,
323 | 'can\'t' => 1,
324 | 'cannot' => 1,
325 | 'could' => 1,
326 | 'couldn\'t' => 1,
327 | 'did' => 1,
328 | 'didn\'t' => 1,
329 | 'do' => 1,
330 | 'does' => 1,
331 | 'doesn\'t' => 1,
332 | 'doing' => 1,
333 | 'don\'t' => 1,
334 | 'down' => 1,
335 | 'during' => 1,
336 | 'each' => 1,
337 | 'e.g.' => 1,
338 | 'few' => 1,
339 | 'for' => 1,
340 | 'from' => 1,
341 | 'further' => 1,
342 | 'had' => 1,
343 | 'hadn\'t' => 1,
344 | 'has' => 1,
345 | 'hasn\'t' => 1,
346 | 'have' => 1,
347 | 'haven\'t' => 1,
348 | 'having' => 1,
349 | 'he' => 1,
350 | 'he\'d' => 1,
351 | 'he\'ll' => 1,
352 | 'he\'s' => 1,
353 | 'her' => 1,
354 | 'here' => 1,
355 | 'here\'s' => 1,
356 | 'hers' => 1,
357 | 'herself' => 1,
358 | 'him' => 1,
359 | 'himself' => 1,
360 | 'his' => 1,
361 | 'how' => 1,
362 | 'how\'s' => 1,
363 | 'i' => 1,
364 | 'i\'d' => 1,
365 | 'i\'ll' => 1,
366 | 'i\'m' => 1,
367 | 'i\'ve' => 1,
368 | 'if' => 1,
369 | 'in' => 1,
370 | 'into' => 1,
371 | 'is' => 1,
372 | 'isn\'t' => 1,
373 | 'it' => 1,
374 | 'it\'s' => 1,
375 | 'its' => 1,
376 | 'itself' => 1,
377 | 'let\'s' => 1,
378 | 'me' => 1,
379 | 'more' => 1,
380 | 'most' => 1,
381 | 'mustn\'t' => 1,
382 | 'my' => 1,
383 | 'myself' => 1,
384 | 'no' => 1,
385 | 'nor' => 1,
386 | 'not' => 1,
387 | 'of' => 1,
388 | 'off' => 1,
389 | 'on' => 1,
390 | 'once' => 1,
391 | 'only' => 1,
392 | 'or' => 1,
393 | 'other' => 1,
394 | 'ought' => 1,
395 | 'our' => 1,
396 | 'ours' => 1,
397 | ' ourselves' => 1,
398 | 'out' => 1,
399 | 'over' => 1,
400 | 'own' => 1,
401 | 'same' => 1,
402 | 'shan\'t' => 1,
403 | 'she' => 1,
404 | 'she\'d' => 1,
405 | 'she\'ll' => 1,
406 | 'she\'s' => 1,
407 | 'should' => 1,
408 | 'shouldn\'t' => 1,
409 | 'so' => 1,
410 | 'some' => 1,
411 | 'such' => 1,
412 | 'than' => 1,
413 | 'that' => 1,
414 | 'that\'s' => 1,
415 | 'the' => 1,
416 | 'their' => 1,
417 | 'theirs' => 1,
418 | 'them' => 1,
419 | 'themselves' => 1,
420 | 'then' => 1,
421 | 'there' => 1,
422 | 'there\'s' => 1,
423 | 'these' => 1,
424 | 'they' => 1,
425 | 'they\'d' => 1,
426 | 'they\'ll' => 1,
427 | 'they\'re' => 1,
428 | 'they\'ve' => 1,
429 | 'this' => 1,
430 | 'those' => 1,
431 | 'through' => 1,
432 | 'to' => 1,
433 | 'too' => 1,
434 | 'under' => 1,
435 | 'until' => 1,
436 | 'up' => 1,
437 | 'very' => 1,
438 | 'was' => 1,
439 | 'wasn\'t' => 1,
440 | 'we' => 1,
441 | 'we\'d' => 1,
442 | 'we\'ll' => 1,
443 | 'we\'re' => 1,
444 | 'we\'ve' => 1,
445 | 'were' => 1,
446 | 'weren\'t' => 1,
447 | 'what' => 1,
448 | 'what\'s' => 1,
449 | 'when' => 1,
450 | 'when\'s' => 1,
451 | 'where' => 1,
452 | 'where\'s' => 1,
453 | 'which' => 1,
454 | 'while' => 1,
455 | 'who' => 1,
456 | 'who\'s' => 1,
457 | 'whom' => 1,
458 | 'why' => 1,
459 | 'why\'s' => 1,
460 | 'with' => 1,
461 | 'won\'t' => 1,
462 | 'would' => 1,
463 | 'wouldn\'t' => 1,
464 | 'you' => 1,
465 | 'you\'d' => 1,
466 | 'you\'ll' => 1,
467 | 'you\'re' => 1,
468 | 'you\'ve' => 1,
469 | 'your' => 1,
470 | 'yours' => 1,
471 | 'yourself' => 1,
472 | 'yourselves' => 1,
473 | ),
474 | 'finnish' =>
475 | array (
476 | 'aiemmin' => 1,
477 | 'aika' => 1,
478 | 'aikaa' => 1,
479 | 'aikaan' => 1,
480 | 'aikaisemmin' => 1,
481 | 'aikaisin' => 1,
482 | 'aikajen' => 1,
483 | 'aikana' => 1,
484 | 'aikoina' => 1,
485 | 'aikoo' => 1,
486 | 'aikovat' => 1,
487 | 'aina' => 1,
488 | 'ainakaan' => 1,
489 | 'ainakin' => 1,
490 | 'ainoa' => 1,
491 | 'ainoat' => 1,
492 | 'aiomme' => 1,
493 | 'aion' => 1,
494 | 'aiotte' => 1,
495 | 'aist' => 1,
496 | 'aivan' => 1,
497 | 'ajan' => 1,
498 | 'älä' => 1,
499 | 'alas' => 1,
500 | 'alemmas' => 1,
501 | 'älköön' => 1,
502 | 'alkuisin' => 1,
503 | 'alkuun' => 1,
504 | 'alla' => 1,
505 | 'alle' => 1,
506 | 'aloitamme' => 1,
507 | 'aloitan' => 1,
508 | 'aloitat' => 1,
509 | 'aloitatte' => 1,
510 | 'aloitattivat' => 1,
511 | 'aloitettava' => 1,
512 | 'aloitettevaksi' => 1,
513 | 'aloitettu' => 1,
514 | 'aloitimme' => 1,
515 | 'aloitin' => 1,
516 | 'aloitit' => 1,
517 | 'aloititte' => 1,
518 | 'aloittaa' => 1,
519 | 'aloittamatta' => 1,
520 | 'aloitti' => 1,
521 | 'aloittivat' => 1,
522 | 'alta' => 1,
523 | 'aluksi' => 1,
524 | 'alussa' => 1,
525 | 'alusta' => 1,
526 | 'annettavaksi' => 1,
527 | 'annetteva' => 1,
528 | 'annettu' => 1,
529 | 'antaa' => 1,
530 | 'antamatta' => 1,
531 | 'antoi' => 1,
532 | 'aoua' => 1,
533 | 'apu' => 1,
534 | 'asia' => 1,
535 | 'asiaa' => 1,
536 | 'asian' => 1,
537 | 'asiasta' => 1,
538 | 'asiat' => 1,
539 | 'asioiden' => 1,
540 | 'asioihin' => 1,
541 | 'asioita' => 1,
542 | 'asti' => 1,
543 | 'avuksi' => 1,
544 | 'avulla' => 1,
545 | 'avun' => 1,
546 | 'avutta' => 1,
547 | 'edellä' => 1,
548 | 'edelle' => 1,
549 | 'edelleen' => 1,
550 | 'edeltä' => 1,
551 | 'edemmäs' => 1,
552 | 'edes' => 1,
553 | 'edessä' => 1,
554 | 'edestä' => 1,
555 | 'ehkä' => 1,
556 | 'ei' => 1,
557 | 'eikä' => 1,
558 | 'eilen' => 1,
559 | 'eivät' => 1,
560 | 'eli' => 1,
561 | 'ellei' => 1,
562 | 'elleivät' => 1,
563 | 'ellemme' => 1,
564 | 'ellen' => 1,
565 | 'ellet' => 1,
566 | 'ellette' => 1,
567 | 'emme' => 1,
568 | 'en' => 1,
569 | 'enää' => 1,
570 | 'enemmän' => 1,
571 | 'eniten' => 1,
572 | 'ennen' => 1,
573 | 'ensi' => 1,
574 | 'ensimmäinen' => 1,
575 | 'ensimmäiseksi' => 1,
576 | 'ensimmäisen' => 1,
577 | 'ensimmäisenä' => 1,
578 | 'ensimmäiset' => 1,
579 | 'ensimmäisiä' => 1,
580 | 'ensimmäisiksi' => 1,
581 | 'ensimmäisinä' => 1,
582 | 'ensimmäistä' => 1,
583 | 'ensin' => 1,
584 | 'entinen' => 1,
585 | 'entisen' => 1,
586 | 'entisiä' => 1,
587 | 'entistä' => 1,
588 | 'entisten' => 1,
589 | 'eräät' => 1,
590 | 'eräiden' => 1,
591 | 'eräs' => 1,
592 | 'eri' => 1,
593 | 'erittäin' => 1,
594 | 'erityisesti' => 1,
595 | 'esi' => 1,
596 | 'esiin' => 1,
597 | 'esillä' => 1,
598 | 'esimerkiksi' => 1,
599 | 'et' => 1,
600 | 'eteen' => 1,
601 | 'etenkin' => 1,
602 | 'että' => 1,
603 | 'ette' => 1,
604 | 'ettei' => 1,
605 | 'halua' => 1,
606 | 'haluaa' => 1,
607 | 'haluamatta' => 1,
608 | 'haluamme' => 1,
609 | 'haluan' => 1,
610 | 'haluat' => 1,
611 | 'haluatte' => 1,
612 | 'haluavat' => 1,
613 | 'halunnut' => 1,
614 | 'halusi' => 1,
615 | 'halusimme' => 1,
616 | 'halusin' => 1,
617 | 'halusit' => 1,
618 | 'halusitte' => 1,
619 | 'halusivat' => 1,
620 | 'halutessa' => 1,
621 | 'haluton' => 1,
622 | 'hän' => 1,
623 | 'häneen' => 1,
624 | 'hänellä' => 1,
625 | 'hänelle' => 1,
626 | 'häneltä' => 1,
627 | 'hänen' => 1,
628 | 'hänessä' => 1,
629 | 'hänestä' => 1,
630 | 'hänet' => 1,
631 | 'he' => 1,
632 | 'hei' => 1,
633 | 'heidän' => 1,
634 | 'heihin' => 1,
635 | 'heille' => 1,
636 | 'heiltä' => 1,
637 | 'heissä' => 1,
638 | 'heistä' => 1,
639 | 'heitä' => 1,
640 | 'helposti' => 1,
641 | 'heti' => 1,
642 | 'hetkellä' => 1,
643 | 'hieman' => 1,
644 | 'huolimatta' => 1,
645 | 'huomenna' => 1,
646 | 'hyvä' => 1,
647 | 'hyvää' => 1,
648 | 'hyvät' => 1,
649 | 'hyviä' => 1,
650 | 'hyvien' => 1,
651 | 'hyviin' => 1,
652 | 'hyviksi' => 1,
653 | 'hyville' => 1,
654 | 'hyviltä' => 1,
655 | 'hyvin' => 1,
656 | 'hyvinä' => 1,
657 | 'hyvissä' => 1,
658 | 'hyvistä' => 1,
659 | 'ihan' => 1,
660 | 'ilman' => 1,
661 | 'ilmeisesti' => 1,
662 | 'itse' => 1,
663 | 'itseään' => 1,
664 | 'itsensä' => 1,
665 | 'ja' => 1,
666 | 'jää' => 1,
667 | 'jälkeen' => 1,
668 | 'jälleen' => 1,
669 | 'jo' => 1,
670 | 'johon' => 1,
671 | 'joiden' => 1,
672 | 'joihin' => 1,
673 | 'joiksi' => 1,
674 | 'joilla' => 1,
675 | 'joille' => 1,
676 | 'joilta' => 1,
677 | 'joissa' => 1,
678 | 'joista' => 1,
679 | 'joita' => 1,
680 | 'joka' => 1,
681 | 'jokainen' => 1,
682 | 'jokin' => 1,
683 | 'joko' => 1,
684 | 'joku' => 1,
685 | 'jolla' => 1,
686 | 'jolle' => 1,
687 | 'jolloin' => 1,
688 | 'jolta' => 1,
689 | 'jompikumpi' => 1,
690 | 'jonka' => 1,
691 | 'jonkin' => 1,
692 | 'jonne' => 1,
693 | 'joo' => 1,
694 | 'jopa' => 1,
695 | 'jos' => 1,
696 | 'joskus' => 1,
697 | 'jossa' => 1,
698 | 'josta' => 1,
699 | 'jota' => 1,
700 | 'jotain' => 1,
701 | 'joten' => 1,
702 | 'jotenkin' => 1,
703 | 'jotenkuten' => 1,
704 | 'jotka' => 1,
705 | 'jotta' => 1,
706 | 'jouduimme' => 1,
707 | 'jouduin' => 1,
708 | 'jouduit' => 1,
709 | 'jouduitte' => 1,
710 | 'joudumme' => 1,
711 | 'joudun' => 1,
712 | 'joudutte' => 1,
713 | 'joukkoon' => 1,
714 | 'joukossa' => 1,
715 | 'joukosta' => 1,
716 | 'joutua' => 1,
717 | 'joutui' => 1,
718 | 'joutuivat' => 1,
719 | 'joutumaan' => 1,
720 | 'joutuu' => 1,
721 | 'joutuvat' => 1,
722 | 'juuri' => 1,
723 | 'kahdeksan' => 1,
724 | 'kahdeksannen' => 1,
725 | 'kahdella' => 1,
726 | ' kahdelle' => 1,
727 | 'kahdelta' => 1,
728 | 'kahden' => 1,
729 | 'kahdessa' => 1,
730 | 'kahdesta' => 1,
731 | 'kahta' => 1,
732 | 'kahteen' => 1,
733 | 'kai' => 1,
734 | 'kaiken' => 1,
735 | 'kaikille' => 1,
736 | 'kaikilta' => 1,
737 | 'kaikkea' => 1,
738 | 'kaikki' => 1,
739 | 'kaikkia' => 1,
740 | 'kaikkiaan' => 1,
741 | 'kaikkialla' => 1,
742 | 'kaikkialle' => 1,
743 | 'kaikkialta' => 1,
744 | 'kaikkien' => 1,
745 | 'kaikkin' => 1,
746 | 'kaksi' => 1,
747 | 'kannalta' => 1,
748 | 'kannattaa' => 1,
749 | 'kanssa' => 1,
750 | 'kanssaan' => 1,
751 | 'kanssamme' => 1,
752 | 'kanssani' => 1,
753 | 'kanssanne' => 1,
754 | 'kanssasi' => 1,
755 | 'kauan' => 1,
756 | 'kauemmas' => 1,
757 | 'kautta' => 1,
758 | 'kehen' => 1,
759 | 'keiden' => 1,
760 | 'keihin' => 1,
761 | 'keiksi' => 1,
762 | 'keillä' => 1,
763 | 'keille' => 1,
764 | 'keiltä' => 1,
765 | 'keinä' => 1,
766 | 'keissä' => 1,
767 | 'keistä' => 1,
768 | 'keitä' => 1,
769 | 'keittä' => 1,
770 | 'keitten' => 1,
771 | 'keneen' => 1,
772 | 'keneksi' => 1,
773 | 'kenellä' => 1,
774 | 'kenelle' => 1,
775 | 'keneltä' => 1,
776 | 'kenen' => 1,
777 | 'kenenä' => 1,
778 | 'kenessä' => 1,
779 | 'kenestä' => 1,
780 | 'kenet' => 1,
781 | 'kenettä' => 1,
782 | 'kennessästä' => 1,
783 | 'kerran' => 1,
784 | 'kerta' => 1,
785 | 'kertaa' => 1,
786 | 'kesken' => 1,
787 | 'keskimäärin' => 1,
788 | 'ketä' => 1,
789 | 'ketkä' => 1,
790 | 'kiitos' => 1,
791 | 'kohti' => 1,
792 | 'koko' => 1,
793 | 'kokonaan' => 1,
794 | 'kolmas' => 1,
795 | 'kolme' => 1,
796 | 'kolmen' => 1,
797 | 'kolmesti' => 1,
798 | 'koska' => 1,
799 | 'koskaan' => 1,
800 | 'kovin' => 1,
801 | 'kuin' => 1,
802 | 'kuinka' => 1,
803 | 'kuitenkaan' => 1,
804 | 'kuitenkin' => 1,
805 | 'kuka' => 1,
806 | 'kukaan' => 1,
807 | 'kukin' => 1,
808 | 'kumpainen' => 1,
809 | 'kumpainenkaan' => 1,
810 | 'kumpi' => 1,
811 | 'kumpikaan' => 1,
812 | 'kumpikin' => 1,
813 | 'kun' => 1,
814 | 'kuten' => 1,
815 | 'kuuden' => 1,
816 | 'kuusi' => 1,
817 | 'kuutta' => 1,
818 | 'kyllä' => 1,
819 | 'kymmenen' => 1,
820 | 'kyse' => 1,
821 | 'lähekkäin' => 1,
822 | 'lähellä' => 1,
823 | 'lähelle' => 1,
824 | 'läheltä' => 1,
825 | 'lähemmäs' => 1,
826 | 'lähes' => 1,
827 | 'lähinnä' => 1,
828 | 'lähtien' => 1,
829 | 'läpi' => 1,
830 | 'liian' => 1,
831 | 'liki' => 1,
832 | 'lisää' => 1,
833 | 'lisäksi' => 1,
834 | 'luo' => 1,
835 | 'mahdollisimman' => 1,
836 | 'mahdollista' => 1,
837 | 'me' => 1,
838 | 'meidän' => 1,
839 | 'meillä' => 1,
840 | 'meille' => 1,
841 | 'melkein' => 1,
842 | 'melko' => 1,
843 | 'menee' => 1,
844 | 'meneet' => 1,
845 | 'menemme' => 1,
846 | 'menen' => 1,
847 | 'menet' => 1,
848 | 'menette' => 1,
849 | 'menevät' => 1,
850 | 'meni' => 1,
851 | 'menimme' => 1,
852 | 'menin' => 1,
853 | 'menit' => 1,
854 | 'menivät' => 1,
855 | 'mennessä' => 1,
856 | 'mennyt' => 1,
857 | 'menossa' => 1,
858 | 'mihin' => 1,
859 | 'mikä' => 1,
860 | 'mikään' => 1,
861 | 'mikäli' => 1,
862 | 'mikin' => 1,
863 | 'miksi' => 1,
864 | 'milloin' => 1,
865 | 'minä' => 1,
866 | 'minne' => 1,
867 | 'minun' => 1,
868 | 'minut' => 1,
869 | 'missä' => 1,
870 | 'mistä' => 1,
871 | 'mitä' => 1,
872 | 'mitään' => 1,
873 | 'miten' => 1,
874 | 'moi' => 1,
875 | 'molemmat' => 1,
876 | 'mones' => 1,
877 | 'monesti' => 1,
878 | 'monet' => 1,
879 | 'moni' => 1,
880 | 'moniaalla' => 1,
881 | 'moniaalle' => 1,
882 | 'moniaalta' => 1,
883 | 'monta' => 1,
884 | 'muassa' => 1,
885 | 'muiden' => 1,
886 | 'muita' => 1,
887 | 'muka' => 1,
888 | 'mukaan' => 1,
889 | 'mukaansa' => 1,
890 | 'mukana' => 1,
891 | 'mutta' => 1,
892 | 'muu' => 1,
893 | 'muualla' => 1,
894 | 'muualle' => 1,
895 | 'muualta' => 1,
896 | 'muuanne' => 1,
897 | 'muulloin' => 1,
898 | 'muun' => 1,
899 | 'muut' => 1,
900 | 'muuta' => 1,
901 | 'muutama' => 1,
902 | 'muutaman' => 1,
903 | 'muuten' => 1,
904 | 'myöhemmin' => 1,
905 | 'myös' => 1,
906 | 'myöskään' => 1,
907 | 'myöskin' => 1,
908 | 'myötä' => 1,
909 | 'näiden' => 1,
910 | 'näin' => 1,
911 | 'näissä' => 1,
912 | 'näissähin' => 1,
913 | 'näissälle' => 1,
914 | 'näissältä' => 1,
915 | 'näissästä' => 1,
916 | 'näitä' => 1,
917 | 'nämä' => 1,
918 | 'ne' => 1,
919 | 'neljä' => 1,
920 | 'neljää' => 1,
921 | 'neljän' => 1,
922 | 'niiden' => 1,
923 | 'niin' => 1,
924 | 'niistä' => 1,
925 | 'niitä' => 1,
926 | 'noin' => 1,
927 | 'nopeammin' => 1,
928 | 'nopeasti' => 1,
929 | 'nopeiten' => 1,
930 | 'nro' => 1,
931 | 'nuo' => 1,
932 | 'nyt' => 1,
933 | 'ohi' => 1,
934 | 'oikein' => 1,
935 | 'ole' => 1,
936 | 'olemme' => 1,
937 | 'olen' => 1,
938 | 'olet' => 1,
939 | 'olette' => 1,
940 | 'oleva' => 1,
941 | 'olevan' => 1,
942 | 'olevat' => 1,
943 | 'oli' => 1,
944 | 'olimme' => 1,
945 | 'olin' => 1,
946 | 'olisi' => 1,
947 | 'olisimme' => 1,
948 | 'olisin' => 1,
949 | 'olisit' => 1,
950 | 'olisitte' => 1,
951 | 'olisivat' => 1,
952 | 'olit' => 1,
953 | 'olitte' => 1,
954 | 'olivat' => 1,
955 | 'olla' => 1,
956 | 'olleet' => 1,
957 | 'olli' => 1,
958 | 'ollut' => 1,
959 | 'oma' => 1,
960 | 'omaa' => 1,
961 | 'omaan' => 1,
962 | 'omaksi' => 1,
963 | 'omalle' => 1,
964 | 'omalta' => 1,
965 | 'oman' => 1,
966 | 'omassa' => 1,
967 | 'omat' => 1,
968 | 'omia' => 1,
969 | 'omien' => 1,
970 | 'omiin' => 1,
971 | 'omiksi' => 1,
972 | 'omille' => 1,
973 | 'omilta' => 1,
974 | 'omissa' => 1,
975 | 'omista' => 1,
976 | 'on' => 1,
977 | 'onkin' => 1,
978 | 'onko' => 1,
979 | 'ovat' => 1,
980 | 'päälle' => 1,
981 | 'paikoittain' => 1,
982 | 'paitsi' => 1,
983 | 'pakosti' => 1,
984 | 'paljon' => 1,
985 | 'paremmin' => 1,
986 | 'parempi' => 1,
987 | 'parhaillaan' => 1,
988 | 'parhaiten' => 1,
989 | 'peräti' => 1,
990 | 'perusteella' => 1,
991 | 'pian' => 1,
992 | 'pieneen' => 1,
993 | 'pieneksi' => 1,
994 | 'pienellä' => 1,
995 | 'pienelle' => 1,
996 | 'pieneltä' => 1,
997 | 'pienempi' => 1,
998 | 'pienestä' => 1,
999 | 'pieni' => 1,
1000 | 'pienin' => 1,
1001 | 'puolesta' => 1,
1002 | 'puolestaan' => 1,
1003 | 'runsaasti' => 1,
1004 | 'saakka' => 1,
1005 | 'sadam' => 1,
1006 | 'sama' => 1,
1007 | 'samaa' => 1,
1008 | 'samaan' => 1,
1009 | 'samalla' => 1,
1010 | 'samallalta' => 1,
1011 | 'samallassa' => 1,
1012 | 'samallasta' => 1,
1013 | 'saman' => 1,
1014 | 'samat' => 1,
1015 | 'samoin' => 1,
1016 | 'sata' => 1,
1017 | 'sataa' => 1,
1018 | 'satojen' => 1,
1019 | 'se' => 1,
1020 | 'seitsemän' => 1,
1021 | 'sekä' => 1,
1022 | 'sen' => 1,
1023 | 'seuraavat' => 1,
1024 | 'siellä' => 1,
1025 | 'sieltä' => 1,
1026 | 'siihen' => 1,
1027 | 'siinä' => 1,
1028 | 'siis' => 1,
1029 | 'siitä' => 1,
1030 | 'sijaan' => 1,
1031 | 'siksi' => 1,
1032 | 'sillä' => 1,
1033 | 'silloin' => 1,
1034 | 'silti' => 1,
1035 | 'sinä' => 1,
1036 | 'sinne' => 1,
1037 | 'sinua' => 1,
1038 | 'sinulle' => 1,
1039 | 'sinulta' => 1,
1040 | 'sinun' => 1,
1041 | 'sinussa' => 1,
1042 | 'sinusta' => 1,
1043 | 'sinut' => 1,
1044 | 'sisäkkäin' => 1,
1045 | 'sisällä' => 1,
1046 | 'sitä' => 1,
1047 | 'siten' => 1,
1048 | 'sitten' => 1,
1049 | 'suoraan' => 1,
1050 | 'suuntaan' => 1,
1051 | 'suuren' => 1,
1052 | 'suuret' => 1,
1053 | 'suuri' => 1,
1054 | 'suuria' => 1,
1055 | 'suurin' => 1,
1056 | 'suurten' => 1,
1057 | 'taa' => 1,
1058 | 'täällä' => 1,
1059 | 'täältä' => 1,
1060 | 'taas' => 1,
1061 | 'taemmas' => 1,
1062 | 'tähän' => 1,
1063 | 'tahansa' => 1,
1064 | 'tai' => 1,
1065 | 'takaa' => 1,
1066 | 'takaisin' => 1,
1067 | 'takana' => 1,
1068 | 'takia' => 1,
1069 | 'tällä' => 1,
1070 | 'tällöin' => 1,
1071 | 'tämä' => 1,
1072 | 'tämän' => 1,
1073 | 'tänä' => 1,
1074 | 'tänään' => 1,
1075 | 'tänne' => 1,
1076 | 'tapauksessa' => 1,
1077 | 'tässä' => 1,
1078 | 'tästä' => 1,
1079 | 'tätä' => 1,
1080 | 'täten' => 1,
1081 | 'tavalla' => 1,
1082 | 'tavoitteena' => 1,
1083 | 'täysin' => 1,
1084 | 'täytyvät' => 1,
1085 | 'täytyy' => 1,
1086 | 'te' => 1,
1087 | 'tietysti' => 1,
1088 | 'todella' => 1,
1089 | 'toinen' => 1,
1090 | 'toisaalla' => 1,
1091 | 'toisaalle' => 1,
1092 | 'toisaalta' => 1,
1093 | 'toiseen' => 1,
1094 | 'toiseksi' => 1,
1095 | 'toisella' => 1,
1096 | 'toiselle' => 1,
1097 | 'toiselta' => 1,
1098 | 'toisemme' => 1,
1099 | 'toisen' => 1,
1100 | 'toisensa' => 1,
1101 | 'toisessa' => 1,
1102 | 'toisesta' => 1,
1103 | 'toista' => 1,
1104 | 'toistaiseksi' => 1,
1105 | 'toki' => 1,
1106 | 'tosin' => 1,
1107 | 'tuhannen' => 1,
1108 | 'tuhat' => 1,
1109 | 'tule' => 1,
1110 | 'tulee' => 1,
1111 | 'tulemme' => 1,
1112 | 'tulen' => 1,
1113 | 'tulet' => 1,
1114 | 'tulette' => 1,
1115 | 'tulevat' => 1,
1116 | 'tulimme' => 1,
1117 | 'tulin' => 1,
1118 | 'tulisi' => 1,
1119 | 'tulisimme' => 1,
1120 | 'tulisin' => 1,
1121 | 'tulisit' => 1,
1122 | 'tulisitte' => 1,
1123 | 'tulisivat' => 1,
1124 | 'tulit' => 1,
1125 | 'tulitte' => 1,
1126 | 'tulivat' => 1,
1127 | 'tulla' => 1,
1128 | 'tulleet' => 1,
1129 | 'tullut' => 1,
1130 | 'tuntuu' => 1,
1131 | 'tuo' => 1,
1132 | 'tuolla' => 1,
1133 | 'tuolloin' => 1,
1134 | 'tuolta' => 1,
1135 | 'tuonne' => 1,
1136 | 'tuskin' => 1,
1137 | 'tykö' => 1,
1138 | 'usea' => 1,
1139 | 'useasti' => 1,
1140 | 'useimmiten' => 1,
1141 | 'usein' => 1,
1142 | 'useita' => 1,
1143 | 'uudeksi' => 1,
1144 | 'uudelleen' => 1,
1145 | 'uuden' => 1,
1146 | 'uudet' => 1,
1147 | 'uusi' => 1,
1148 | 'uusia' => 1,
1149 | 'uusien' => 1,
1150 | 'uusinta' => 1,
1151 | 'uuteen' => 1,
1152 | 'uutta' => 1,
1153 | 'vaan' => 1,
1154 | 'vähän' => 1,
1155 | 'vähemmän' => 1,
1156 | 'vähintään' => 1,
1157 | 'vähiten' => 1,
1158 | 'vai' => 1,
1159 | 'vaiheessa' => 1,
1160 | 'vaikea' => 1,
1161 | 'vaikean' => 1,
1162 | 'vaikeat' => 1,
1163 | 'vaikeilla' => 1,
1164 | 'vaikeille' => 1,
1165 | 'vaikeilta' => 1,
1166 | 'vaikeissa' => 1,
1167 | 'vaikeista' => 1,
1168 | 'vaikka' => 1,
1169 | 'vain' => 1,
1170 | 'välillä' => 1,
1171 | 'varmasti' => 1,
1172 | 'varsin' => 1,
1173 | 'varsinkin' => 1,
1174 | 'varten' => 1,
1175 | 'vasta' => 1,
1176 | 'vastaan' => 1,
1177 | 'vastakkain' => 1,
1178 | 'verran' => 1,
1179 | 'vielä' => 1,
1180 | 'vierekkäin' => 1,
1181 | 'vieri' => 1,
1182 | 'viiden' => 1,
1183 | 'viime' => 1,
1184 | 'viimeinen' => 1,
1185 | 'viimeisen' => 1,
1186 | 'viimeksi' => 1,
1187 | 'viisi' => 1,
1188 | 'voi' => 1,
1189 | 'voidaan' => 1,
1190 | 'voimme' => 1,
1191 | 'voin' => 1,
1192 | 'voisi' => 1,
1193 | 'voit' => 1,
1194 | 'voitte' => 1,
1195 | 'voivat' => 1,
1196 | 'vuoden' => 1,
1197 | 'vuoksi' => 1,
1198 | 'vuosi' => 1,
1199 | 'vuosien' => 1,
1200 | 'vuosina' => 1,
1201 | 'vuotta' => 1,
1202 | 'yhä' => 1,
1203 | 'yhdeksän' => 1,
1204 | 'yhden' => 1,
1205 | 'yhdessä' => 1,
1206 | 'yhtä' => 1,
1207 | 'yhtäällä' => 1,
1208 | 'yhtäälle' => 1,
1209 | 'yhtäältä' => 1,
1210 | 'yhtään' => 1,
1211 | 'yhteen' => 1,
1212 | 'yhteensä' => 1,
1213 | 'yhteydessä' => 1,
1214 | 'yhteyteen' => 1,
1215 | 'yksi' => 1,
1216 | 'yksin' => 1,
1217 | 'yksittäin' => 1,
1218 | 'yleensä' => 1,
1219 | 'ylemmäs' => 1,
1220 | 'yli' => 1,
1221 | 'ylös' => 1,
1222 | 'ympäri' => 1,
1223 | ),
1224 | 'french' =>
1225 | array (
1226 | 'alors' => 1,
1227 | 'au' => 1,
1228 | 'aucuns' => 1,
1229 | 'aussi' => 1,
1230 | 'autre' => 1,
1231 | 'avant' => 1,
1232 | 'avec' => 1,
1233 | 'avoir' => 1,
1234 | 'bon' => 1,
1235 | 'car' => 1,
1236 | 'ce' => 1,
1237 | 'cela' => 1,
1238 | 'ces' => 1,
1239 | 'ceux' => 1,
1240 | 'chaque' => 1,
1241 | 'ci' => 1,
1242 | 'comme' => 1,
1243 | 'comment' => 1,
1244 | 'dans' => 1,
1245 | 'des' => 1,
1246 | 'du' => 1,
1247 | 'dedans' => 1,
1248 | 'dehors' => 1,
1249 | 'depuis' => 1,
1250 | 'deux' => 1,
1251 | 'devrait' => 1,
1252 | 'doit' => 1,
1253 | 'donc' => 1,
1254 | 'dos' => 1,
1255 | 'droite' => 1,
1256 | 'début' => 1,
1257 | 'elle' => 1,
1258 | 'elles' => 1,
1259 | 'en' => 1,
1260 | 'encore' => 1,
1261 | 'essai' => 1,
1262 | 'est' => 1,
1263 | 'et' => 1,
1264 | 'eu' => 1,
1265 | 'fait' => 1,
1266 | 'faites' => 1,
1267 | 'fois' => 1,
1268 | 'font' => 1,
1269 | 'force' => 1,
1270 | 'haut' => 1,
1271 | 'hors' => 1,
1272 | 'ici' => 1,
1273 | 'il' => 1,
1274 | 'ils' => 1,
1275 | 'je' => 1, 'juste' => 1,
1276 | 'la' => 1,
1277 | 'le' => 1,
1278 | 'les' => 1,
1279 | 'leur' => 1,
1280 | 'là' => 1,
1281 | 'ma' => 1,
1282 | 'maintenant' => 1,
1283 | 'mais' => 1,
1284 | 'mes' => 1,
1285 | 'mine' => 1,
1286 | 'moins' => 1,
1287 | 'mon' => 1,
1288 | 'mot' => 1,
1289 | 'même' => 1,
1290 | 'ni' => 1,
1291 | 'nommés' => 1,
1292 | 'notre' => 1,
1293 | 'nous' => 1,
1294 | 'nouveaux' => 1,
1295 | 'ou' => 1,
1296 | 'où' => 1,
1297 | 'par' => 1,
1298 | 'parce' => 1,
1299 | 'parole' => 1,
1300 | 'pas' => 1,
1301 | 'personnes' => 1,
1302 | 'peut' => 1,
1303 | 'peu' => 1,
1304 | 'pièce' => 1,
1305 | 'plupart' => 1,
1306 | 'pour' => 1,
1307 | 'pourquoi' => 1,
1308 | 'quand' => 1,
1309 | 'que' => 1,
1310 | 'quel' => 1,
1311 | 'quelle' => 1,
1312 | 'quelles' => 1,
1313 | 'quels' => 1,
1314 | 'qui' => 1,
1315 | 'sa' => 1,
1316 | 'sans' => 1,
1317 | 'ses' => 1,
1318 | 'seulement' => 1,
1319 | 'si' => 1,
1320 | 'sien' => 1,
1321 | 'son' => 1,
1322 | 'sont' => 1,
1323 | 'sous' => 1,
1324 | 'soyez' => 1,
1325 | 'sujet' => 1,
1326 | 'sur' => 1,
1327 | 'ta' => 1,
1328 | 'tandis' => 1,
1329 | 'tellement' => 1,
1330 | 'tels' => 1,
1331 | 'tes' => 1,
1332 | 'ton' => 1,
1333 | 'tous' => 1,
1334 | 'tout' => 1,
1335 | 'trop' => 1,
1336 | 'très' => 1,
1337 | 'tu' => 1,
1338 | 'valeur' => 1,
1339 | 'voie' => 1,
1340 | 'voient' => 1,
1341 | 'vont' => 1,
1342 | 'votre' => 1,
1343 | 'vous' => 1,
1344 | 'vu' => 1,
1345 | 'ça' => 1,
1346 | 'étaient' => 1,
1347 | 'état' => 1,
1348 | 'étions' => 1,
1349 | 'été' => 1,
1350 | 'être' => 1,
1351 | ),
1352 | 'german' =>
1353 | array (
1354 | 'ab' => 1,
1355 | 'bei' => 1,
1356 | 'da' => 1,
1357 | 'deshalb' => 1,
1358 | 'ein' => 1,
1359 | 'für' => 1,
1360 | 'haben' => 1,
1361 | 'hier' => 1,
1362 | 'ich' => 1,
1363 | 'ja' => 1,
1364 | 'kann' => 1,
1365 | 'machen' => 1,
1366 | 'muesste' => 1,
1367 | 'nach' => 1,
1368 | 'oder' => 1,
1369 | 'seid' => 1,
1370 | 'sonst' => 1,
1371 | 'und' => 1,
1372 | 'vom' => 1,
1373 | 'wann' => 1,
1374 | 'wenn' => 1,
1375 | 'wie' => 1,
1376 | 'zu' => 1,
1377 | 'bin' => 1,
1378 | 'eines' => 1,
1379 | 'hat' => 1,
1380 | 'manche' => 1,
1381 | 'solches' => 1,
1382 | 'an' => 1,
1383 | 'anderm' => 1,
1384 | 'bis' => 1,
1385 | 'das' => 1,
1386 | 'deinem' => 1,
1387 | 'demselben' => 1,
1388 | 'dir' => 1,
1389 | 'doch' => 1,
1390 | 'einig' => 1,
1391 | 'er' => 1,
1392 | 'eurer' => 1,
1393 | 'hatte' => 1,
1394 | 'ihnen' => 1,
1395 | 'ihre' => 1,
1396 | 'ins' => 1,
1397 | 'jenen' => 1,
1398 | 'keinen' => 1,
1399 | 'manchem' => 1,
1400 | 'meinen' => 1,
1401 | 'nichts' => 1,
1402 | 'seine' => 1,
1403 | 'soll' => 1,
1404 | 'unserm' => 1,
1405 | 'welche' => 1,
1406 | 'werden' => 1,
1407 | 'wollte' => 1,
1408 | 'während' => 1,
1409 | 'alle' => 1,
1410 | 'allem' => 1,
1411 | 'allen' => 1,
1412 | 'aller' => 1,
1413 | 'alles' => 1,
1414 | 'als' => 1,
1415 | 'also' => 1,
1416 | 'am' => 1,
1417 | 'ander' => 1,
1418 | 'andere' => 1,
1419 | 'anderem' => 1,
1420 | 'anderen' => 1,
1421 | 'anderer' => 1,
1422 | 'anderes' => 1,
1423 | 'andern' => 1,
1424 | 'anders' => 1,
1425 | 'auch' => 1,
1426 | 'auf' => 1,
1427 | 'aus' => 1,
1428 | 'bist' => 1,
1429 | 'bsp.' => 1,
1430 | 'daher' => 1,
1431 | 'damit' => 1,
1432 | 'dann' => 1,
1433 | 'dasselbe' => 1,
1434 | 'dazu' => 1,
1435 | 'daß' => 1,
1436 | 'dein' => 1,
1437 | 'deine' => 1,
1438 | 'deinen' => 1,
1439 | 'deiner' => 1,
1440 | 'deines' => 1,
1441 | 'dem' => 1,
1442 | 'den' => 1,
1443 | 'denn' => 1,
1444 | 'denselben' => 1,
1445 | 'der' => 1,
1446 | 'derer' => 1,
1447 | 'derselbe' => 1,
1448 | 'derselben' => 1,
1449 | 'des' => 1,
1450 | 'desselben' => 1,
1451 | 'dessen' => 1,
1452 | 'dich' => 1,
1453 | 'die' => 1,
1454 | 'dies' => 1,
1455 | 'diese' => 1,
1456 | 'dieselbe' => 1,
1457 | 'dieselben' => 1,
1458 | 'diesem' => 1,
1459 | 'diesen' => 1,
1460 | 'dieser' => 1,
1461 | 'dieses' => 1,
1462 | 'dort' => 1,
1463 | 'du' => 1,
1464 | 'durch' => 1,
1465 | 'eine' => 1,
1466 | 'einem' => 1,
1467 | 'einen' => 1,
1468 | 'einer' => 1,
1469 | 'einige' => 1,
1470 | 'einigem' => 1,
1471 | 'einigen' => 1,
1472 | 'einiger' => 1,
1473 | 'einiges' => 1,
1474 | 'einmal' => 1,
1475 | 'es' => 1,
1476 | 'etwas' => 1,
1477 | 'euch' => 1,
1478 | 'euer' => 1,
1479 | 'eure' => 1,
1480 | 'eurem' => 1,
1481 | 'euren' => 1,
1482 | 'eures' => 1,
1483 | 'ganz' => 1,
1484 | 'ganze' => 1,
1485 | 'ganzen' => 1,
1486 | 'ganzer' => 1,
1487 | 'ganzes' => 1,
1488 | 'gegen' => 1,
1489 | 'gemacht' => 1,
1490 | 'gesagt' => 1,
1491 | 'gesehen' => 1,
1492 | 'gewesen' => 1,
1493 | 'gewollt' => 1,
1494 | 'hab' => 1,
1495 | 'habe' => 1,
1496 | 'hatten' => 1,
1497 | 'hin' => 1,
1498 | 'hinter' => 1,
1499 | 'ihm' => 1,
1500 | 'ihn' => 1,
1501 | 'ihr' => 1,
1502 | 'ihrem' => 1,
1503 | 'ihren' => 1,
1504 | 'ihrer' => 1,
1505 | 'ihres' => 1,
1506 | 'im' => 1,
1507 | 'in' => 1,
1508 | 'indem' => 1,
1509 | 'ist' => 1,
1510 | 'jede' => 1,
1511 | 'jedem' => 1,
1512 | 'jeden' => 1,
1513 | 'jeder' => 1,
1514 | 'jedes' => 1,
1515 | 'jene' => 1,
1516 | 'jenem' => 1,
1517 | 'jener' => 1,
1518 | 'jenes' => 1,
1519 | 'jetzt' => 1,
1520 | 'kein' => 1,
1521 | 'keine' => 1,
1522 | 'keinem' => 1,
1523 | 'keiner' => 1,
1524 | 'keines' => 1,
1525 | 'konnte' => 1,
1526 | 'können' => 1,
1527 | 'könnte' => 1,
1528 | 'mache' => 1,
1529 | 'machst' => 1,
1530 | 'macht' => 1,
1531 | 'machte' => 1,
1532 | 'machten' => 1,
1533 | 'man' => 1,
1534 | 'manchen' => 1,
1535 | 'mancher' => 1,
1536 | 'manches' => 1,
1537 | 'mein' => 1,
1538 | 'meine' => 1,
1539 | 'meinem' => 1,
1540 | 'meiner' => 1,
1541 | 'meines' => 1,
1542 | 'mich' => 1,
1543 | 'mir' => 1,
1544 | 'mit' => 1,
1545 | 'muss' => 1,
1546 | 'musste' => 1,
1547 | 'müßt' => 1,
1548 | 'nicht' => 1,
1549 | 'noch' => 1,
1550 | 'nun' => 1,
1551 | 'nur' => 1,
1552 | 'ob' => 1,
1553 | 'ohne' => 1,
1554 | 'sage' => 1,
1555 | 'sagen' => 1,
1556 | 'sagt' => 1,
1557 | 'sagte' => 1,
1558 | 'sagten' => 1,
1559 | 'sagtest' => 1,
1560 | 'sehe' => 1,
1561 | 'sehen' => 1,
1562 | 'sehr' => 1,
1563 | 'seht' => 1,
1564 | 'sein' => 1,
1565 | 'seinem' => 1,
1566 | 'seinen' => 1,
1567 | 'seiner' => 1,
1568 | 'seines' => 1,
1569 | 'selbst' => 1,
1570 | 'sich' => 1,
1571 | 'sicher' => 1,
1572 | 'sie' => 1,
1573 | 'sind' => 1,
1574 | 'so' => 1,
1575 | 'solche' => 1,
1576 | 'solchem' => 1,
1577 | 'solchen' => 1,
1578 | 'solcher' => 1,
1579 | 'sollte' => 1,
1580 | 'sondern' => 1,
1581 | 'um' => 1,
1582 | 'uns' => 1,
1583 | 'unse' => 1,
1584 | 'unsen' => 1,
1585 | 'unser' => 1,
1586 | 'unses' => 1,
1587 | 'unter' => 1,
1588 | 'viel' => 1,
1589 | 'von' => 1,
1590 | 'vor' => 1,
1591 | 'war' => 1,
1592 | 'waren' => 1,
1593 | 'warst' => 1,
1594 | 'was' => 1,
1595 | 'weg' => 1,
1596 | 'weil' => 1,
1597 | 'weiter' => 1,
1598 | 'welchem' => 1,
1599 | 'welchen' => 1,
1600 | 'welcher' => 1,
1601 | 'welches' => 1,
1602 | 'werde' => 1,
1603 | 'wieder' => 1,
1604 | 'will' => 1,
1605 | 'wir' => 1,
1606 | 'wird' => 1,
1607 | 'wirst' => 1,
1608 | 'wo' => 1,
1609 | 'wolle' => 1,
1610 | 'wollen' => 1,
1611 | 'wollt' => 1,
1612 | 'wollten' => 1,
1613 | 'wolltest' => 1,
1614 | 'wolltet' => 1,
1615 | 'würde' => 1,
1616 | 'würden' => 1,
1617 | 'z.B.' => 1,
1618 | 'zum' => 1,
1619 | 'zur' => 1,
1620 | 'zwar' => 1,
1621 | 'zwischen' => 1,
1622 | 'über' => 1,
1623 | 'aber' => 1,
1624 | 'abgerufen' => 1,
1625 | 'abgerufene' => 1,
1626 | 'abgerufener' => 1,
1627 | 'abgerufenes' => 1,
1628 | 'acht' => 1,
1629 | 'allein' => 1,
1630 | 'allerdings' => 1,
1631 | 'allerlei' => 1,
1632 | 'allgemein' => 1,
1633 | 'allmählich' => 1,
1634 | 'allzu' => 1,
1635 | 'alsbald' => 1,
1636 | 'andererseits' => 1,
1637 | 'andernfalls' => 1,
1638 | 'anerkannt' => 1,
1639 | 'anerkannte' => 1,
1640 | 'anerkannter' => 1,
1641 | 'anerkanntes' => 1,
1642 | 'anfangen' => 1,
1643 | 'anfing' => 1,
1644 | 'angefangen' => 1,
1645 | 'angesetze' => 1,
1646 | 'angesetzt' => 1,
1647 | 'angesetzten' => 1,
1648 | 'angesetzter' => 1,
1649 | 'ansetzen' => 1,
1650 | 'anstatt' => 1,
1651 | 'arbeiten' => 1,
1652 | 'aufgehört' => 1,
1653 | 'aufgrund' => 1,
1654 | 'aufhören' => 1,
1655 | 'aufhörte' => 1,
1656 | 'aufzusuchen' => 1,
1657 | 'ausdrücken' => 1,
1658 | 'ausdrückt' => 1,
1659 | 'ausdrückte' => 1,
1660 | 'ausgenommen' => 1,
1661 | 'ausser' => 1,
1662 | 'ausserdem' => 1,
1663 | 'author' => 1,
1664 | 'autor' => 1,
1665 | 'außen' => 1,
1666 | 'außer' => 1,
1667 | 'außerdem' => 1,
1668 | 'außerhalb' => 1,
1669 | 'bald' => 1,
1670 | 'bearbeite' => 1,
1671 | 'bearbeiten' => 1,
1672 | 'bearbeitete' => 1,
1673 | 'bearbeiteten' => 1,
1674 | 'bedarf' => 1,
1675 | 'bedurfte' => 1,
1676 | 'bedürfen' => 1,
1677 | 'befragen' => 1,
1678 | 'befragte' => 1,
1679 | 'befragten' => 1,
1680 | 'befragter' => 1,
1681 | 'begann' => 1,
1682 | 'beginnen' => 1,
1683 | 'begonnen' => 1,
1684 | 'behalten' => 1,
1685 | 'behielt' => 1,
1686 | 'beide' => 1,
1687 | 'beiden' => 1,
1688 | 'beiderlei' => 1,
1689 | 'beides' => 1,
1690 | 'beim' => 1,
1691 | 'beinahe' => 1,
1692 | 'beitragen' => 1,
1693 | 'beitrugen' => 1,
1694 | 'bekannt' => 1,
1695 | 'bekannte' => 1,
1696 | 'bekannter' => 1,
1697 | 'bekennen' => 1,
1698 | 'benutzt' => 1,
1699 | 'bereits' => 1,
1700 | 'berichten' => 1,
1701 | 'berichtet' => 1,
1702 | 'berichtete' => 1,
1703 | 'berichteten' => 1,
1704 | 'besonders' => 1,
1705 | 'besser' => 1,
1706 | 'bestehen' => 1,
1707 | 'besteht' => 1,
1708 | 'beträchtlich' => 1,
1709 | 'bevor' => 1,
1710 | 'bezüglich' => 1,
1711 | 'bietet' => 1,
1712 | 'bisher' => 1,
1713 | 'bislang' => 1,
1714 | 'bleiben' => 1,
1715 | 'blieb' => 1,
1716 | 'bloss' => 1,
1717 | 'bloß' => 1,
1718 | 'brachte' => 1,
1719 | 'brachten' => 1,
1720 | 'brauchen' => 1,
1721 | 'braucht' => 1,
1722 | 'bringen' => 1,
1723 | 'bräuchte' => 1,
1724 | 'bzw' => 1,
1725 | 'böden' => 1,
1726 | 'ca.' => 1,
1727 | 'dabei' => 1,
1728 | 'dadurch' => 1,
1729 | 'dafür' => 1,
1730 | 'dagegen' => 1,
1731 | 'dahin' => 1,
1732 | 'damals' => 1,
1733 | 'danach' => 1,
1734 | 'daneben' => 1,
1735 | 'dank' => 1,
1736 | 'danke' => 1,
1737 | 'danken' => 1,
1738 | 'dannen' => 1,
1739 | 'daran' => 1,
1740 | 'darauf' => 1,
1741 | 'daraus' => 1,
1742 | 'darf' => 1,
1743 | 'darfst' => 1,
1744 | 'darin' => 1,
1745 | 'darum' => 1,
1746 | 'darunter' => 1,
1747 | 'darüber' => 1,
1748 | 'darüberhinaus' => 1,
1749 | 'dass' => 1,
1750 | 'davon' => 1,
1751 | 'davor' => 1,
1752 | 'demnach' => 1,
1753 | 'denen' => 1,
1754 | 'dennoch' => 1,
1755 | 'derart' => 1,
1756 | 'derartig' => 1,
1757 | 'derem' => 1,
1758 | 'deren' => 1,
1759 | 'derjenige' => 1,
1760 | 'derjenigen' => 1,
1761 | 'derzeit' => 1,
1762 | 'desto' => 1,
1763 | 'deswegen' => 1,
1764 | 'diejenige' => 1,
1765 | 'diesseits' => 1,
1766 | 'dinge' => 1,
1767 | 'direkt' => 1,
1768 | 'direkte' => 1,
1769 | 'direkten' => 1,
1770 | 'direkter' => 1,
1771 | 'doppelt' => 1,
1772 | 'dorther' => 1,
1773 | 'dorthin' => 1,
1774 | 'drauf' => 1,
1775 | 'drei' => 1,
1776 | 'dreißig' => 1,
1777 | 'drin' => 1,
1778 | 'dritte' => 1,
1779 | 'drunter' => 1,
1780 | 'drüber' => 1,
1781 | 'dunklen' => 1,
1782 | 'durchaus' => 1,
1783 | 'durfte' => 1,
1784 | 'durften' => 1,
1785 | 'dürfen' => 1,
1786 | 'dürfte' => 1,
1787 | 'eben' => 1,
1788 | 'ebenfalls' => 1,
1789 | 'ebenso' => 1,
1790 | 'ehe' => 1,
1791 | 'eher' => 1,
1792 | 'eigenen' => 1,
1793 | 'eigenes' => 1,
1794 | 'eigentlich' => 1,
1795 | 'einbaün' => 1,
1796 | 'einerseits' => 1,
1797 | 'einfach' => 1,
1798 | 'einführen' => 1,
1799 | 'einführte' => 1,
1800 | 'einführten' => 1,
1801 | 'eingesetzt' => 1,
1802 | 'einigermaßen' => 1,
1803 | 'eins' => 1,
1804 | 'einseitig' => 1,
1805 | 'einseitige' => 1,
1806 | 'einseitigen' => 1,
1807 | 'einseitiger' => 1,
1808 | 'einst' => 1,
1809 | 'einstmals' => 1,
1810 | 'einzig' => 1,
1811 | 'ende' => 1,
1812 | 'entsprechend' => 1,
1813 | 'entweder' => 1,
1814 | 'ergänze' => 1,
1815 | 'ergänzen' => 1,
1816 | 'ergänzte' => 1,
1817 | 'ergänzten' => 1,
1818 | 'erhalten' => 1,
1819 | 'erhielt' => 1,
1820 | 'erhielten' => 1,
1821 | 'erhält' => 1,
1822 | 'erneut' => 1,
1823 | 'erst' => 1,
1824 | 'erste' => 1,
1825 | 'ersten' => 1,
1826 | 'erster' => 1,
1827 | 'eröffne' => 1,
1828 | 'eröffnen' => 1,
1829 | 'eröffnet' => 1,
1830 | 'eröffnete' => 1,
1831 | 'eröffnetes' => 1,
1832 | 'etc' => 1,
1833 | 'etliche' => 1,
1834 | 'etwa' => 1,
1835 | 'fall' => 1,
1836 | 'falls' => 1,
1837 | 'fand' => 1,
1838 | 'fast' => 1,
1839 | 'ferner' => 1,
1840 | 'finden' => 1,
1841 | 'findest' => 1,
1842 | 'findet' => 1,
1843 | 'folgende' => 1,
1844 | 'folgenden' => 1,
1845 | 'folgender' => 1,
1846 | 'folgendes' => 1,
1847 | 'folglich' => 1,
1848 | 'fordern' => 1,
1849 | 'fordert' => 1,
1850 | 'forderte' => 1,
1851 | 'forderten' => 1,
1852 | 'fortsetzen' => 1,
1853 | 'fortsetzt' => 1,
1854 | 'fortsetzte' => 1,
1855 | 'fortsetzten' => 1,
1856 | 'fragte' => 1,
1857 | 'frau' => 1,
1858 | 'frei' => 1,
1859 | 'freie' => 1,
1860 | 'freier' => 1,
1861 | 'freies' => 1,
1862 | 'fuer' => 1,
1863 | 'fünf' => 1,
1864 | 'gab' => 1,
1865 | 'ganzem' => 1,
1866 | 'gar' => 1,
1867 | 'gbr' => 1,
1868 | 'geb' => 1,
1869 | 'geben' => 1,
1870 | 'geblieben' => 1,
1871 | 'gebracht' => 1,
1872 | 'gedurft' => 1,
1873 | 'geehrt' => 1,
1874 | 'geehrte' => 1,
1875 | 'geehrten' => 1,
1876 | 'geehrter' => 1,
1877 | 'gefallen' => 1,
1878 | 'gefiel' => 1,
1879 | 'gefälligst' => 1,
1880 | 'gefällt' => 1,
1881 | 'gegeben' => 1,
1882 | 'gehabt' => 1,
1883 | 'gehen' => 1,
1884 | 'geht' => 1,
1885 | 'gekommen' => 1,
1886 | 'gekonnt' => 1,
1887 | 'gemocht' => 1,
1888 | 'gemäss' => 1,
1889 | 'genommen' => 1,
1890 | 'genug' => 1,
1891 | 'gern' => 1,
1892 | 'gestern' => 1,
1893 | 'gestrige' => 1,
1894 | 'getan' => 1,
1895 | 'geteilt' => 1,
1896 | 'geteilte' => 1,
1897 | 'getragen' => 1,
1898 | 'gewissermaßen' => 1,
1899 | 'geworden' => 1,
1900 | 'ggf' => 1,
1901 | 'gib' => 1,
1902 | 'gibt' => 1,
1903 | 'gleich' => 1,
1904 | 'gleichwohl' => 1,
1905 | 'gleichzeitig' => 1,
1906 | 'glücklicherweise' => 1,
1907 | 'gmbh' => 1,
1908 | 'gratulieren' => 1,
1909 | 'gratuliert' => 1,
1910 | 'gratulierte' => 1,
1911 | 'gute' => 1,
1912 | 'guten' => 1,
1913 | 'gängig' => 1,
1914 | 'gängige' => 1,
1915 | 'gängigen' => 1,
1916 | 'gängiger' => 1,
1917 | 'gängiges' => 1,
1918 | 'gänzlich' => 1,
1919 | 'haette' => 1,
1920 | 'halb' => 1,
1921 | 'hallo' => 1,
1922 | 'hast' => 1,
1923 | 'hattest' => 1,
1924 | 'hattet' => 1,
1925 | 'heraus' => 1,
1926 | 'herein' => 1,
1927 | 'heute' => 1,
1928 | 'heutige' => 1,
1929 | 'hiermit' => 1,
1930 | 'hiesige' => 1,
1931 | 'hinein' => 1,
1932 | 'hinten' => 1,
1933 | 'hinterher' => 1,
1934 | 'hoch' => 1,
1935 | 'hundert' => 1,
1936 | 'hätt' => 1,
1937 | 'hätte' => 1,
1938 | 'hätten' => 1,
1939 | 'höchstens' => 1,
1940 | 'igitt' => 1,
1941 | 'immer' => 1,
1942 | 'immerhin' => 1,
1943 | 'important' => 1,
1944 | 'indessen' => 1,
1945 | 'info' => 1,
1946 | 'infolge' => 1,
1947 | 'innen' => 1,
1948 | 'innerhalb' => 1,
1949 | 'insofern' => 1,
1950 | 'inzwischen' => 1,
1951 | 'irgend' => 1,
1952 | 'irgendeine' => 1,
1953 | 'irgendwas' => 1,
1954 | 'irgendwen' => 1,
1955 | 'irgendwer' => 1,
1956 | 'irgendwie' => 1,
1957 | 'irgendwo' => 1,
1958 | 'je' => 1,
1959 | 'jedenfalls' => 1,
1960 | 'jederlei' => 1,
1961 | 'jedoch' => 1,
1962 | 'jemand' => 1,
1963 | 'jenseits' => 1,
1964 | 'jährig' => 1,
1965 | 'jährige' => 1,
1966 | 'jährigen' => 1,
1967 | 'jähriges' => 1,
1968 | 'kam' => 1,
1969 | 'kannst' => 1,
1970 | 'kaum' => 1,
1971 | 'keinerlei' => 1,
1972 | 'keineswegs' => 1,
1973 | 'klar' => 1,
1974 | 'klare' => 1,
1975 | 'klaren' => 1,
1976 | 'klares' => 1,
1977 | 'klein' => 1,
1978 | 'kleinen' => 1,
1979 | 'kleiner' => 1,
1980 | 'kleines' => 1,
1981 | 'koennen' => 1,
1982 | 'koennt' => 1,
1983 | 'koennte' => 1,
1984 | 'koennten' => 1,
1985 | 'komme' => 1,
1986 | 'kommen' => 1,
1987 | 'kommt' => 1,
1988 | 'konkret' => 1,
1989 | 'konkrete' => 1,
1990 | 'konkreten' => 1,
1991 | 'konkreter' => 1,
1992 | 'konkretes' => 1,
1993 | 'konnten' => 1,
1994 | 'könn' => 1,
1995 | 'könnt' => 1,
1996 | 'könnten' => 1,
1997 | 'künftig' => 1,
1998 | 'lag' => 1,
1999 | 'lagen' => 1,
2000 | 'langsam' => 1,
2001 | 'lassen' => 1,
2002 | 'laut' => 1,
2003 | 'lediglich' => 1,
2004 | 'leer' => 1,
2005 | 'legen' => 1,
2006 | 'legte' => 1,
2007 | 'legten' => 1,
2008 | 'leicht' => 1,
2009 | 'leider' => 1,
2010 | 'lesen' => 1,
2011 | 'letze' => 1,
2012 | 'letzten' => 1,
2013 | 'letztendlich' => 1,
2014 | 'letztens' => 1,
2015 | 'letztes' => 1,
2016 | 'letztlich' => 1,
2017 | 'lichten' => 1,
2018 | 'liegt' => 1,
2019 | 'liest' => 1,
2020 | 'links' => 1,
2021 | 'längst' => 1,
2022 | 'längstens' => 1,
2023 | 'mag' => 1,
2024 | 'magst' => 1,
2025 | 'mal' => 1,
2026 | 'mancherorts' => 1,
2027 | 'manchmal' => 1,
2028 | 'mann' => 1,
2029 | 'margin' => 1,
2030 | 'mehr' => 1,
2031 | 'mehrere' => 1,
2032 | 'meist' => 1,
2033 | 'meiste' => 1,
2034 | 'meisten' => 1,
2035 | 'meta' => 1,
2036 | 'mindestens' => 1,
2037 | 'mithin' => 1,
2038 | 'mochte' => 1,
2039 | 'morgen' => 1,
2040 | 'morgige' => 1,
2041 | 'muessen' => 1,
2042 | 'muesst' => 1,
2043 | 'musst' => 1,
2044 | 'mussten' => 1,
2045 | 'muß' => 1,
2046 | 'mußt' => 1,
2047 | 'möchte' => 1,
2048 | 'möchten' => 1,
2049 | 'möchtest' => 1,
2050 | 'mögen' => 1,
2051 | 'möglich' => 1,
2052 | 'mögliche' => 1,
2053 | 'möglichen' => 1,
2054 | 'möglicher' => 1,
2055 | 'möglicherweise' => 1,
2056 | 'müssen' => 1,
2057 | 'müsste' => 1,
2058 | 'müssten' => 1,
2059 | 'müßte' => 1,
2060 | 'nachdem' => 1,
2061 | 'nacher' => 1,
2062 | 'nachhinein' => 1,
2063 | 'nahm' => 1,
2064 | 'natürlich' => 1,
2065 | 'nacht' => 1,
2066 | 'neben' => 1,
2067 | 'nebenan' => 1,
2068 | 'nehmen' => 1,
2069 | 'nein' => 1,
2070 | 'neu' => 1,
2071 | 'neue' => 1,
2072 | 'neuem' => 1,
2073 | 'neuen' => 1,
2074 | 'neuer' => 1,
2075 | 'neues' => 1,
2076 | 'neun' => 1,
2077 | 'nie' => 1,
2078 | 'niemals' => 1,
2079 | 'niemand' => 1,
2080 | 'nimm' => 1,
2081 | 'nimmer' => 1,
2082 | 'nimmt' => 1,
2083 | 'nirgends' => 1,
2084 | 'nirgendwo' => 1,
2085 | 'nutzen' => 1,
2086 | 'nutzt' => 1,
2087 | 'nutzung' => 1,
2088 | 'nächste' => 1,
2089 | 'nämlich' => 1,
2090 | 'nötigenfalls' => 1,
2091 | 'nützt' => 1,
2092 | 'oben' => 1,
2093 | 'oberhalb' => 1,
2094 | 'obgleich' => 1,
2095 | 'obschon' => 1,
2096 | 'obwohl' => 1,
2097 | 'oft' => 1,
2098 | 'paar' => 1,
2099 | 'per' => 1,
2100 | 'pfui' => 1,
2101 | 'plötzlich' => 1,
2102 | 'pro' => 1,
2103 | 'reagiere' => 1,
2104 | 'reagieren' => 1,
2105 | 'reagiert' => 1,
2106 | 'reagierte' => 1,
2107 | 'rechts' => 1,
2108 | 'regelmäßig' => 1,
2109 | 'rief' => 1,
2110 | 'rund' => 1,
2111 | 'sang' => 1,
2112 | 'sangen' => 1,
2113 | 'schlechter' => 1,
2114 | 'schließlich' => 1,
2115 | 'schnell' => 1,
2116 | 'schon' => 1,
2117 | 'schreibe' => 1,
2118 | 'schreiben' => 1,
2119 | 'schreibens' => 1,
2120 | 'schreiber' => 1,
2121 | 'schwierig' => 1,
2122 | 'schätzen' => 1,
2123 | 'schätzt' => 1,
2124 | 'schätzte' => 1,
2125 | 'schätzten' => 1,
2126 | 'sechs' => 1,
2127 | 'sect' => 1,
2128 | 'sehrwohl' => 1,
2129 | 'sei' => 1,
2130 | 'seit' => 1,
2131 | 'seitdem' => 1,
2132 | 'seite' => 1,
2133 | 'seiten' => 1,
2134 | 'seither' => 1,
2135 | 'selber' => 1,
2136 | 'senke' => 1,
2137 | 'senken' => 1,
2138 | 'senkt' => 1,
2139 | 'senkte' => 1,
2140 | 'senkten' => 1,
2141 | 'setzen' => 1,
2142 | 'setzt' => 1,
2143 | 'setzte' => 1,
2144 | 'setzten' => 1,
2145 | 'sicherlich' => 1,
2146 | 'sieben' => 1,
2147 | 'siebte' => 1,
2148 | 'siehe' => 1,
2149 | 'sieht' => 1,
2150 | 'singen' => 1,
2151 | 'singt' => 1,
2152 | 'sobald' => 1,
2153 | 'sodaß' => 1,
2154 | 'soeben' => 1,
2155 | 'sofern' => 1,
2156 | 'sofort' => 1,
2157 | 'sog' => 1,
2158 | 'sogar' => 1,
2159 | 'solange' => 1,
2160 | 'solchen' => 1,
2161 | 'solch' => 1,
2162 | 'sollen' => 1,
2163 | 'sollst' => 1,
2164 | 'sollt' => 1,
2165 | 'sollten' => 1,
2166 | 'solltest' => 1,
2167 | 'somit' => 1,
2168 | 'sonstwo' => 1,
2169 | 'sooft' => 1,
2170 | 'soviel' => 1,
2171 | 'soweit' => 1,
2172 | 'sowie' => 1,
2173 | 'sowohl' => 1,
2174 | 'spielen' => 1,
2175 | 'später' => 1,
2176 | 'startet' => 1,
2177 | 'startete' => 1,
2178 | 'starteten' => 1,
2179 | 'statt' => 1,
2180 | 'stattdessen' => 1,
2181 | 'steht' => 1,
2182 | 'steige' => 1,
2183 | 'steigen' => 1,
2184 | 'steigt' => 1,
2185 | 'stets' => 1,
2186 | 'stieg' => 1,
2187 | 'stiegen' => 1,
2188 | 'such' => 1,
2189 | 'suchen' => 1,
2190 | 'sämtliche' => 1,
2191 | 'tages' => 1,
2192 | 'tat' => 1,
2193 | 'tatsächlich' => 1,
2194 | 'tatsächlichen' => 1,
2195 | 'tatsächlicher' => 1,
2196 | 'tatsächliches' => 1,
2197 | 'tausend' => 1,
2198 | 'teile' => 1,
2199 | 'teilen' => 1,
2200 | 'teilte' => 1,
2201 | 'teilten' => 1,
2202 | 'titel' => 1,
2203 | 'total' => 1,
2204 | 'trage' => 1,
2205 | 'tragen' => 1,
2206 | 'trotzdem' => 1,
2207 | 'trug' => 1,
2208 | 'trägt' => 1,
2209 | 'tun' => 1,
2210 | 'tust' => 1,
2211 | 'tut' => 1,
2212 | 'txt' => 1,
2213 | 'tät' => 1,
2214 | 'ueber' => 1,
2215 | 'umso' => 1,
2216 | 'unbedingt' => 1,
2217 | 'ungefähr' => 1,
2218 | 'unmöglich' => 1,
2219 | 'unmögliche' => 1,
2220 | 'unmöglichen' => 1,
2221 | 'unmöglicher' => 1,
2222 | 'unnötig' => 1,
2223 | 'unsem' => 1,
2224 | 'unsere' => 1,
2225 | 'unserem' => 1,
2226 | 'unseren' => 1,
2227 | 'unserer' => 1,
2228 | 'unseres' => 1,
2229 | 'unten' => 1,
2230 | 'unterbrach' => 1,
2231 | 'unterbrechen' => 1,
2232 | 'unterhalb' => 1,
2233 | 'unwichtig' => 1,
2234 | 'usw' => 1,
2235 | 'vergangen' => 1,
2236 | 'vergangene' => 1,
2237 | 'vergangener' => 1,
2238 | 'vergangenes' => 1,
2239 | 'vermag' => 1,
2240 | 'vermutlich' => 1,
2241 | 'vermögen' => 1,
2242 | 'verrate' => 1,
2243 | 'verraten' => 1,
2244 | 'verriet' => 1,
2245 | 'verrieten' => 1,
2246 | 'version' => 1,
2247 | 'versorge' => 1,
2248 | 'versorgen' => 1,
2249 | 'versorgt' => 1,
2250 | 'versorgte' => 1,
2251 | 'versorgten' => 1,
2252 | 'versorgtes' => 1,
2253 | 'veröffentlichen' => 1,
2254 | 'veröffentlicher' => 1,
2255 | 'veröffentlicht' => 1,
2256 | 'veröffentlichte' => 1,
2257 | 'veröffentlichten' => 1,
2258 | 'veröffentlichtes' => 1,
2259 | 'viele' => 1,
2260 | 'vielen' => 1,
2261 | 'vieler' => 1,
2262 | 'vieles' => 1,
2263 | 'vielleicht' => 1,
2264 | 'vielmals' => 1,
2265 | 'vier' => 1,
2266 | 'vollständig' => 1,
2267 | 'voran' => 1,
2268 | 'vorbei' => 1,
2269 | 'vorgestern' => 1,
2270 | 'vorher' => 1,
2271 | 'vorne' => 1,
2272 | 'vorüber' => 1,
2273 | 'völlig' => 1,
2274 | 'wachen' => 1,
2275 | 'waere' => 1,
2276 | 'warum' => 1,
2277 | 'weder' => 1,
2278 | 'wegen' => 1,
2279 | 'weitere' => 1,
2280 | 'weiterem' => 1,
2281 | 'weiteren' => 1,
2282 | 'weiterer' => 1,
2283 | 'weiteres' => 1,
2284 | 'weiterhin' => 1,
2285 | 'weiß' => 1,
2286 | 'wem' => 1,
2287 | 'wen' => 1,
2288 | 'wenig' => 1,
2289 | 'wenige' => 1,
2290 | 'weniger' => 1,
2291 | 'wenigstens' => 1,
2292 | 'wenngleich' => 1,
2293 | 'wer' => 1,
2294 | 'werdet' => 1,
2295 | 'weshalb' => 1,
2296 | 'wessen' => 1,
2297 | 'wichtig' => 1,
2298 | 'wieso' => 1,
2299 | 'wieviel' => 1,
2300 | 'wiewohl' => 1,
2301 | 'willst' => 1,
2302 | 'wirklich' => 1,
2303 | 'wodurch' => 1,
2304 | 'wogegen' => 1,
2305 | 'woher' => 1,
2306 | 'wohin' => 1,
2307 | 'wohingegen' => 1,
2308 | 'wohl' => 1,
2309 | 'wohlweislich' => 1,
2310 | 'womit' => 1,
2311 | 'woraufhin' => 1,
2312 | 'woraus' => 1,
2313 | 'worin' => 1,
2314 | 'wurde' => 1,
2315 | 'wurden' => 1,
2316 | 'währenddessen' => 1,
2317 | 'wär' => 1,
2318 | 'wäre' => 1,
2319 | 'wären' => 1,
2320 | 'zahlreich' => 1,
2321 | 'zehn' => 1,
2322 | 'zeitweise' => 1,
2323 | 'ziehen' => 1,
2324 | 'zieht' => 1,
2325 | 'zog' => 1,
2326 | 'zogen' => 1,
2327 | 'zudem' => 1,
2328 | 'zuerst' => 1,
2329 | 'zufolge' => 1,
2330 | 'zugleich' => 1,
2331 | 'zuletzt' => 1,
2332 | 'zumal' => 1,
2333 | 'zurück' => 1,
2334 | 'zusammen' => 1,
2335 | 'zuviel' => 1,
2336 | 'zwanzig' => 1,
2337 | 'zwei' => 1,
2338 | 'zwölf' => 1,
2339 | 'ähnlich' => 1,
2340 | 'übel' => 1,
2341 | 'überall' => 1,
2342 | 'überallhin' => 1,
2343 | 'überdies' => 1,
2344 | 'übermorgen' => 1,
2345 | 'übrig' => 1,
2346 | 'übrigens' => 1,
2347 | ),
2348 | 'hungarian' =>
2349 | array (
2350 | 'a' => 1,
2351 | 'az' => 1,
2352 | 'egy' => 1,
2353 | 'be' => 1,
2354 | 'ki' => 1,
2355 | 'le' => 1,
2356 | 'fel' => 1,
2357 | 'meg' => 1,
2358 | 'el' => 1,
2359 | 'át' => 1,
2360 | 'rá' => 1,
2361 | 'ide oda' => 1,
2362 | 'szét' => 1,
2363 | 'össze' => 1,
2364 | 'vissza' => 1,
2365 | 'de' => 1,
2366 | 'hát' => 1,
2367 | 'és' => 1,
2368 | 'vagy' => 1,
2369 | 'hogy' => 1,
2370 | 'van' => 1,
2371 | 'lesz' => 1,
2372 | 'volt csak' => 1,
2373 | 'nem' => 1,
2374 | 'igen' => 1,
2375 | 'mint' => 1,
2376 | 'én' => 1,
2377 | 'te' => 1,
2378 | 'õ' => 1,
2379 | 'mi' => 1,
2380 | 'ti' => 1,
2381 | 'õk' => 1,
2382 | 'ön' => 1,
2383 | ),
2384 | 'italian' =>
2385 | array (
2386 | 'a' => 1,
2387 | 'adesso' => 1,
2388 | 'ai' => 1,
2389 | 'al' => 1,
2390 | 'alla' => 1,
2391 | 'allo' => 1,
2392 | 'allora' => 1,
2393 | 'altre' => 1,
2394 | 'altri' => 1,
2395 | 'altro' => 1,
2396 | 'anche' => 1,
2397 | 'ancora' => 1,
2398 | 'avere' => 1,
2399 | 'aveva' => 1,
2400 | 'avevano' => 1,
2401 | 'ben' => 1,
2402 | 'buono' => 1,
2403 | 'che' => 1,
2404 | 'chi' => 1,
2405 | 'cinque' => 1,
2406 | 'comprare' => 1,
2407 | 'con' => 1,
2408 | 'consecutivi' => 1,
2409 | 'consecutivo' => 1,
2410 | 'cosa' => 1,
2411 | 'cui' => 1,
2412 | 'da' => 1,
2413 | 'del' => 1,
2414 | 'della' => 1,
2415 | 'delle' => 1,
2416 | 'dentro' => 1,
2417 | 'deve' => 1,
2418 | 'devo' => 1,
2419 | 'di' => 1,
2420 | 'doppio' => 1,
2421 | 'due' => 1,
2422 | 'e' => 1,
2423 | 'ecco' => 1,
2424 | 'fare' => 1,
2425 | 'fine' => 1,
2426 | 'fino' => 1,
2427 | 'fra' => 1,
2428 | 'gente' => 1,
2429 | 'giu' => 1,
2430 | 'ha' => 1,
2431 | 'hai' => 1,
2432 | 'hanno' => 1,
2433 | 'ho' => 1,
2434 | 'il' => 1,
2435 | 'indietro invece' => 1,
2436 | 'io' => 1,
2437 | 'la' => 1,
2438 | 'lavoro' => 1,
2439 | 'le' => 1,
2440 | 'lei' => 1,
2441 | 'lo' => 1,
2442 | 'loro' => 1,
2443 | 'lui' => 1,
2444 | 'lungo' => 1,
2445 | 'ma' => 1,
2446 | 'me' => 1,
2447 | 'meglio' => 1,
2448 | 'molta' => 1,
2449 | 'molti' => 1,
2450 | 'molto' => 1,
2451 | 'nei' => 1,
2452 | 'nel' => 1,
2453 | 'nella' => 1,
2454 | 'nelle' => 1,
2455 | 'no' => 1,
2456 | 'noi' => 1,
2457 | 'nome' => 1,
2458 | 'nostro' => 1,
2459 | 'nove' => 1,
2460 | 'nuovi' => 1,
2461 | 'nuovo' => 1,
2462 | 'o' => 1,
2463 | 'oltre' => 1,
2464 | 'ora' => 1,
2465 | 'otto' => 1,
2466 | 'peggio' => 1,
2467 | 'pero' => 1,
2468 | 'persone' => 1,
2469 | 'piu' => 1,
2470 | 'poco' => 1,
2471 | 'primo' => 1,
2472 | 'promesso' => 1,
2473 | 'qua' => 1,
2474 | 'quarto' => 1,
2475 | 'quasi' => 1,
2476 | 'quattro' => 1,
2477 | 'quello' => 1,
2478 | 'questo' => 1,
2479 | 'qui' => 1,
2480 | 'quindi' => 1,
2481 | 'quinto' => 1,
2482 | 'rispetto' => 1,
2483 | 'sara' => 1,
2484 | 'secondo' => 1,
2485 | 'sei' => 1,
2486 | 'sembra sembrava' => 1,
2487 | 'senza' => 1,
2488 | 'sette' => 1,
2489 | 'sia' => 1,
2490 | 'siamo' => 1,
2491 | 'siete' => 1,
2492 | 'solo' => 1,
2493 | 'sono' => 1,
2494 | 'sopra' => 1,
2495 | 'soprattutto' => 1,
2496 | 'tutte' => 1,
2497 | 'tutto' => 1,
2498 | 'sotto' => 1,
2499 | 'stati' => 1,
2500 | 'stato' => 1,
2501 | 'stesso' => 1,
2502 | 'su' => 1,
2503 | 'subito' => 1,
2504 | 'sul' => 1,
2505 | 'sulla' => 1,
2506 | 'tanto' => 1,
2507 | 'te' => 1,
2508 | 'tempo' => 1,
2509 | 'terzo' => 1,
2510 | 'tra' => 1,
2511 | 'tre' => 1,
2512 | 'triplo' => 1,
2513 | 'ultimo' => 1,
2514 | 'un' => 1,
2515 | 'una' => 1,
2516 | 'uno' => 1,
2517 | 'va' => 1,
2518 | 'vai' => 1,
2519 | 'voi' => 1,
2520 | 'volte' => 1,
2521 | 'vostro' => 1,
2522 | ),
2523 | 'norwegian' =>
2524 | array (
2525 | 'alle' => 1,
2526 | 'andre' => 1,
2527 | 'arbeid' => 1,
2528 | 'av' => 1,
2529 | 'begge' => 1,
2530 | 'bort' => 1,
2531 | 'bra' => 1,
2532 | 'bruke' => 1,
2533 | 'da' => 1,
2534 | 'denne' => 1,
2535 | 'der' => 1,
2536 | 'deres' => 1,
2537 | 'det' => 1,
2538 | 'din' => 1,
2539 | 'disse' => 1,
2540 | 'du' => 1,
2541 | 'eller' => 1,
2542 | 'en' => 1,
2543 | 'ene' => 1,
2544 | 'eneste' => 1,
2545 | 'enhver' => 1,
2546 | 'enn' => 1,
2547 | 'er' => 1,
2548 | 'et' => 1,
2549 | 'folk' => 1,
2550 | 'for' => 1,
2551 | 'fordi' => 1,
2552 | 'forsÛke' => 1,
2553 | 'fra' => 1,
2554 | 'fÅ' => 1,
2555 | 'fÛr' => 1,
2556 | 'fÛrst' => 1,
2557 | 'gjorde' => 1,
2558 | 'gjÛre' => 1,
2559 | 'god' => 1,
2560 | 'gÅ' => 1,
2561 | 'ha' => 1,
2562 | 'hadde' => 1,
2563 | 'han' => 1,
2564 | 'hans' => 1,
2565 | 'hennes' => 1,
2566 | 'her' => 1,
2567 | 'hva' => 1,
2568 | 'hvem' => 1,
2569 | 'hver' => 1,
2570 | 'hvilken' => 1,
2571 | 'hvis' => 1,
2572 | 'hvor' => 1,
2573 | 'hvordan' => 1,
2574 | 'hvorfor' => 1,
2575 | 'i' => 1,
2576 | 'ikke' => 1,
2577 | 'inn' => 1,
2578 | 'innen' => 1,
2579 | 'kan' => 1,
2580 | 'kunne' => 1,
2581 | 'lage' => 1,
2582 | 'lang' => 1,
2583 | 'lik' => 1,
2584 | 'like' => 1,
2585 | 'makt' => 1,
2586 | 'mange' => 1,
2587 | 'med' => 1,
2588 | 'meg' => 1,
2589 | 'meget' => 1,
2590 | 'men' => 1,
2591 | 'mens' => 1,
2592 | 'mer' => 1,
2593 | 'mest' => 1,
2594 | 'min' => 1,
2595 | 'mye' => 1,
2596 | 'mÅ' => 1,
2597 | 'mÅte' => 1,
2598 | 'navn' => 1,
2599 | 'nei' => 1,
2600 | 'ny' => 1,
2601 | 'nÅ' => 1,
2602 | 'nÅr' => 1,
2603 | 'og' => 1,
2604 | 'ogsÅ' => 1,
2605 | 'om' => 1,
2606 | 'opp' => 1,
2607 | 'oss' => 1,
2608 | 'over' => 1,
2609 | 'part' => 1,
2610 | 'punkt' => 1,
2611 | 'pÅ' => 1,
2612 | 'rett' => 1,
2613 | 'riktig' => 1,
2614 | 'samme' => 1,
2615 | 'sant' => 1,
2616 | 'si' => 1,
2617 | 'siden' => 1,
2618 | 'sist' => 1,
2619 | 'skulle' => 1,
2620 | 'slik' => 1,
2621 | 'slutt' => 1,
2622 | 'som' => 1,
2623 | 'start' => 1,
2624 | 'stille' => 1,
2625 | 'sÅ' => 1,
2626 | 'tid' => 1,
2627 | 'til' => 1,
2628 | 'tilbake' => 1,
2629 | 'tilstand' => 1,
2630 | 'under' => 1,
2631 | 'ut' => 1,
2632 | 'uten' => 1,
2633 | 'var' => 1,
2634 | 'ved' => 1,
2635 | 'verdi' => 1,
2636 | 'vi' => 1,
2637 | 'vil' => 1,
2638 | 'ville' => 1,
2639 | 'vite' => 1,
2640 | 'vÅr' => 1,
2641 | 'vÖre' => 1,
2642 | 'vÖrt' => 1,
2643 | 'Å' => 1,
2644 | ),
2645 | 'polish' =>
2646 | array (
2647 | 'a' => 1,
2648 | 'aby' => 1,
2649 | 'ach' => 1,
2650 | 'acz' => 1,
2651 | 'aczkolwiek' => 1,
2652 | 'aj' => 1,
2653 | 'albo' => 1,
2654 | 'ale' => 1,
2655 | 'ależ' => 1,
2656 | 'aż' => 1,
2657 | 'bardziej' => 1,
2658 | 'bardzo' => 1,
2659 | 'bez' => 1,
2660 | 'bo' => 1,
2661 | 'bowiem' => 1,
2662 | 'by' => 1,
2663 | 'byli' => 1,
2664 | 'bynajmniej' => 1,
2665 | 'być' => 1,
2666 | 'był' => 1,
2667 | 'była' => 1,
2668 | 'było' => 1,
2669 | 'były' => 1,
2670 | 'będzie' => 1,
2671 | 'będą' => 1,
2672 | 'cali' => 1,
2673 | 'cała' => 1,
2674 | 'cały' => 1,
2675 | 'ci' => 1,
2676 | 'cię' => 1,
2677 | 'ciebie' => 1,
2678 | 'co' => 1,
2679 | 'cokolwiek' => 1,
2680 | 'coś' => 1,
2681 | 'czasami' => 1,
2682 | 'czasem' => 1,
2683 | 'czemu' => 1,
2684 | 'czy' => 1,
2685 | 'czyli' => 1,
2686 | 'daleko' => 1,
2687 | 'dla' => 1,
2688 | 'dlaczego' => 1,
2689 | 'dlatego' => 1,
2690 | 'do' => 1,
2691 | 'dobrze' => 1,
2692 | 'dokąd' => 1,
2693 | 'dość' => 1,
2694 | 'dużo' => 1,
2695 | 'dwa' => 1,
2696 | 'dwaj' => 1,
2697 | 'dwie' => 1,
2698 | 'dwoje' => 1,
2699 | 'dziś' => 1,
2700 | 'dzisiaj' => 1,
2701 | 'gdy' => 1,
2702 | 'gdyby' => 1,
2703 | 'gdyż' => 1,
2704 | 'gdzie' => 1,
2705 | 'gdziekolwiek' => 1,
2706 | 'gdzieś' => 1,
2707 | 'go' => 1,
2708 | 'i' => 1,
2709 | 'ich' => 1,
2710 | 'ile' => 1,
2711 | 'im' => 1,
2712 | 'inna' => 1,
2713 | 'inne' => 1,
2714 | 'inny' => 1,
2715 | 'innych' => 1,
2716 | 'iż' => 1,
2717 | 'ja' => 1,
2718 | 'ją' => 1,
2719 | 'jak' => 1,
2720 | 'jakaś' => 1,
2721 | 'jakby' => 1,
2722 | 'jaki' => 1,
2723 | 'jakichś' => 1,
2724 | 'jakie' => 1,
2725 | 'jakiś' => 1,
2726 | 'jakiż' => 1,
2727 | 'jakkolwiek' => 1,
2728 | 'jako' => 1,
2729 | 'jakoś' => 1,
2730 | 'je' => 1,
2731 | 'jeden' => 1,
2732 | 'jedna' => 1,
2733 | 'jedno' => 1,
2734 | 'jednak' => 1,
2735 | 'jednakże' => 1,
2736 | 'jego' => 1,
2737 | 'jej' => 1,
2738 | 'jemu' => 1,
2739 | 'jest' => 1,
2740 | 'jestem' => 1,
2741 | 'jeszcze' => 1,
2742 | 'jeśli' => 1,
2743 | 'jeżeli' => 1,
2744 | 'już' => 1,
2745 | 'każdy kiedy' => 1,
2746 | 'kilka' => 1,
2747 | 'kimś' => 1,
2748 | 'kto' => 1,
2749 | 'ktokolwiek' => 1,
2750 | 'ktoś' => 1,
2751 | 'która' => 1,
2752 | 'które' => 1,
2753 | 'którego' => 1,
2754 | 'której' => 1,
2755 | 'który' => 1,
2756 | 'których' => 1,
2757 | 'którym' => 1,
2758 | 'którzy' => 1,
2759 | 'ku' => 1,
2760 | 'lat' => 1,
2761 | 'lecz' => 1,
2762 | 'lub' => 1,
2763 | 'ma' => 1,
2764 | 'mają' => 1,
2765 | 'mam' => 1,
2766 | 'mi' => 1,
2767 | 'mimo' => 1,
2768 | 'między' => 1,
2769 | 'mną' => 1,
2770 | 'mnie' => 1,
2771 | 'mogą' => 1,
2772 | 'moi' => 1,
2773 | 'moim' => 1,
2774 | 'moja' => 1,
2775 | 'moje' => 1,
2776 | 'może' => 1,
2777 | 'możliwe' => 1,
2778 | 'można' => 1,
2779 | 'mój' => 1,
2780 | 'mu' => 1,
2781 | 'musi' => 1,
2782 | 'my' => 1,
2783 | 'na' => 1,
2784 | 'nad' => 1,
2785 | 'nam' => 1,
2786 | 'nami' => 1,
2787 | 'nas' => 1,
2788 | 'nasi' => 1,
2789 | 'nasz' => 1,
2790 | 'nasza' => 1,
2791 | 'nasze' => 1,
2792 | 'naszego' => 1,
2793 | 'naszych' => 1,
2794 | 'natomiast' => 1,
2795 | 'natychmiast' => 1,
2796 | 'nawet' => 1,
2797 | 'nią' => 1,
2798 | 'nic' => 1,
2799 | 'nich' => 1,
2800 | 'nie' => 1,
2801 | 'niego' => 1,
2802 | 'niej' => 1,
2803 | 'niemu' => 1,
2804 | 'nigdy' => 1,
2805 | 'nim' => 1,
2806 | 'nimi' => 1,
2807 | 'niż' => 1,
2808 | 'no' => 1,
2809 | 'o' => 1,
2810 | 'obok' => 1,
2811 | 'od' => 1,
2812 | 'około' => 1,
2813 | 'on' => 1,
2814 | 'ona' => 1,
2815 | 'one' => 1,
2816 | 'oni' => 1,
2817 | 'ono' => 1,
2818 | 'oraz' => 1,
2819 | 'owszem' => 1,
2820 | 'pan' => 1,
2821 | 'pana' => 1,
2822 | 'pani' => 1,
2823 | 'po' => 1,
2824 | 'pod' => 1,
2825 | 'podczas' => 1,
2826 | 'pomimo' => 1,
2827 | 'ponad' => 1,
2828 | 'ponieważ' => 1,
2829 | 'powinien' => 1,
2830 | 'powinna' => 1,
2831 | 'powinni' => 1,
2832 | 'powinno' => 1,
2833 | 'poza' => 1,
2834 | 'prawie' => 1,
2835 | 'przecież' => 1,
2836 | 'przed' => 1,
2837 | 'przede' => 1,
2838 | 'przedtem' => 1,
2839 | 'przez' => 1,
2840 | 'przy' => 1,
2841 | 'roku' => 1,
2842 | 'również' => 1,
2843 | 'sam' => 1,
2844 | 'sama są' => 1,
2845 | 'się' => 1,
2846 | 'skąd' => 1,
2847 | 'sobie' => 1,
2848 | 'sobą' => 1,
2849 | 'sposób' => 1,
2850 | 'swoje' => 1,
2851 | 'są' => 1,
2852 | 'ta' => 1,
2853 | 'tak' => 1,
2854 | 'taka' => 1,
2855 | 'taki' => 1,
2856 | 'takie' => 1,
2857 | 'także' => 1,
2858 | 'tam' => 1,
2859 | 'te' => 1,
2860 | 'tego' => 1,
2861 | 'tej' => 1,
2862 | 'ten' => 1,
2863 | 'teraz' => 1,
2864 | 'też' => 1,
2865 | 'totobą' => 1,
2866 | 'tobie' => 1,
2867 | 'toteż' => 1,
2868 | 'trzeba' => 1,
2869 | 'tu' => 1,
2870 | 'tutaj' => 1,
2871 | 'twoi' => 1,
2872 | 'twoim' => 1,
2873 | 'twoja' => 1,
2874 | 'twoje' => 1,
2875 | 'twym' => 1,
2876 | 'twój' => 1,
2877 | 'ty' => 1,
2878 | 'tych' => 1,
2879 | 'tylko' => 1,
2880 | 'tym' => 1,
2881 | 'u' => 1,
2882 | 'w' => 1,
2883 | 'wam' => 1,
2884 | 'wami' => 1,
2885 | 'was' => 1,
2886 | 'wasz' => 1,
2887 | 'wasza' => 1,
2888 | 'wasze' => 1,
2889 | 'we' => 1,
2890 | 'według' => 1,
2891 | 'wiele' => 1,
2892 | 'wielu' => 1,
2893 | 'więc' => 1,
2894 | 'więcej' => 1,
2895 | 'wszyscy' => 1,
2896 | 'wszystkich' => 1,
2897 | 'wszystkie' => 1,
2898 | 'wszystkim' => 1,
2899 | 'wszystko' => 1,
2900 | 'wtedy' => 1,
2901 | 'wy' => 1,
2902 | 'właśnie' => 1,
2903 | 'z' => 1,
2904 | 'za' => 1,
2905 | 'zapewne' => 1,
2906 | 'zawsze' => 1,
2907 | 'zeznowu' => 1,
2908 | 'znów' => 1,
2909 | 'został' => 1,
2910 | 'żaden' => 1,
2911 | 'żadna' => 1,
2912 | 'żadne' => 1,
2913 | 'żadnych' => 1,
2914 | 'że' => 1,
2915 | 'żeby' => 1,
2916 | ),
2917 | 'portuguese' =>
2918 | array (
2919 | 'último' => 1,
2920 | 'é' => 1,
2921 | 'acerca' => 1,
2922 | 'agora' => 1,
2923 | 'algmas' => 1,
2924 | 'alguns' => 1,
2925 | 'ali' => 1,
2926 | 'ambos' => 1,
2927 | 'antes' => 1,
2928 | 'apontar' => 1,
2929 | 'aquela' => 1,
2930 | 'aquelas' => 1,
2931 | 'aquele' => 1,
2932 | 'aqueles' => 1,
2933 | 'aqui' => 1,
2934 | 'atrás' => 1,
2935 | 'bem' => 1,
2936 | 'bom' => 1,
2937 | 'cada' => 1,
2938 | 'caminho' => 1,
2939 | 'cima' => 1,
2940 | 'com' => 1,
2941 | 'como' => 1,
2942 | 'comprido' => 1,
2943 | 'conhecido' => 1,
2944 | 'corrente' => 1,
2945 | 'das' => 1,
2946 | 'debaixo' => 1,
2947 | 'dentro' => 1,
2948 | 'desde' => 1,
2949 | 'desligado' => 1,
2950 | 'deve' => 1,
2951 | 'devem' => 1,
2952 | 'deverá' => 1,
2953 | 'direita' => 1,
2954 | 'diz' => 1,
2955 | 'dizer' => 1,
2956 | 'dois' => 1,
2957 | 'dos' => 1,
2958 | 'e' => 1,
2959 | 'ela' => 1,
2960 | 'ele' => 1,
2961 | 'eles' => 1,
2962 | 'em' => 1,
2963 | 'enquanto' => 1,
2964 | 'então' => 1,
2965 | 'está' => 1,
2966 | 'estão' => 1,
2967 | 'estado' => 1,
2968 | 'estar estará' => 1,
2969 | 'este' => 1,
2970 | 'estes' => 1,
2971 | 'esteve' => 1,
2972 | 'estive' => 1,
2973 | 'estivemos' => 1,
2974 | 'estiveram' => 1,
2975 | 'eu' => 1,
2976 | 'fará' => 1,
2977 | 'faz' => 1,
2978 | 'fazer' => 1,
2979 | 'fazia' => 1,
2980 | 'fez' => 1,
2981 | 'fim' => 1,
2982 | 'foi' => 1,
2983 | 'fora' => 1,
2984 | 'horas' => 1,
2985 | 'iniciar' => 1,
2986 | 'inicio' => 1,
2987 | 'ir' => 1,
2988 | 'irá' => 1,
2989 | 'ista' => 1,
2990 | 'iste' => 1,
2991 | 'isto' => 1,
2992 | 'ligado' => 1,
2993 | 'maioria' => 1,
2994 | 'maiorias' => 1,
2995 | 'mais' => 1,
2996 | 'mas' => 1,
2997 | 'mesmo' => 1,
2998 | 'meu' => 1,
2999 | 'muito' => 1,
3000 | 'muitos' => 1,
3001 | 'nós' => 1,
3002 | 'não' => 1,
3003 | 'nome' => 1,
3004 | 'nosso' => 1,
3005 | 'novo' => 1,
3006 | 'o' => 1,
3007 | 'onde' => 1,
3008 | 'os' => 1,
3009 | 'ou' => 1,
3010 | 'outro' => 1,
3011 | 'para' => 1,
3012 | 'parte' => 1,
3013 | 'pegar' => 1,
3014 | 'pelo' => 1,
3015 | 'pessoas' => 1,
3016 | 'pode' => 1,
3017 | 'poderá podia' => 1,
3018 | 'por' => 1,
3019 | 'porque' => 1,
3020 | 'povo' => 1,
3021 | 'promeiro' => 1,
3022 | 'quê' => 1,
3023 | 'qual' => 1,
3024 | 'qualquer' => 1,
3025 | 'quando' => 1,
3026 | 'quem' => 1,
3027 | 'quieto' => 1,
3028 | 'são' => 1,
3029 | 'saber' => 1,
3030 | 'sem' => 1,
3031 | 'ser' => 1,
3032 | 'seu' => 1,
3033 | 'somente' => 1,
3034 | 'têm' => 1,
3035 | 'tal' => 1,
3036 | 'também' => 1,
3037 | 'tem' => 1,
3038 | 'tempo' => 1,
3039 | 'tenho' => 1,
3040 | 'tentar' => 1,
3041 | 'tentaram' => 1,
3042 | 'tente' => 1,
3043 | 'tentei' => 1,
3044 | 'teu' => 1,
3045 | 'teve' => 1,
3046 | 'tipo' => 1,
3047 | 'tive' => 1,
3048 | 'todos' => 1,
3049 | 'trabalhar' => 1,
3050 | 'trabalho' => 1,
3051 | 'tu' => 1,
3052 | 'um' => 1,
3053 | 'uma' => 1,
3054 | 'umas' => 1,
3055 | 'uns' => 1,
3056 | 'usa' => 1,
3057 | 'usar' => 1,
3058 | 'valor' => 1,
3059 | 'veja' => 1,
3060 | 'ver' => 1,
3061 | 'verdade' => 1,
3062 | 'verdadeiro' => 1,
3063 | 'você' => 1,
3064 | ),
3065 | 'russian' =>
3066 | array (
3067 | 'а' => 1,
3068 | 'е' => 1,
3069 | 'и' => 1,
3070 | 'ж' => 1,
3071 | 'м' => 1,
3072 | 'о' => 1,
3073 | 'на' => 1,
3074 | 'не' => 1,
3075 | 'ни' => 1,
3076 | 'об' => 1,
3077 | 'но' => 1,
3078 | 'он' => 1,
3079 | 'мне' => 1,
3080 | 'мои' => 1,
3081 | 'мож' => 1,
3082 | 'она' => 1,
3083 | 'они' => 1,
3084 | 'оно' => 1,
3085 | 'мной' => 1,
3086 | 'много' => 1,
3087 | 'многочисленное' => 1,
3088 | 'многочисленная' => 1,
3089 | 'многочисленные' => 1,
3090 | 'многочисленный' => 1,
3091 | 'мною' => 1,
3092 | 'мой' => 1,
3093 | 'мог' => 1,
3094 | 'могут' => 1,
3095 | 'можно' => 1,
3096 | 'может' => 1,
3097 | 'можхо' => 1,
3098 | 'мор' => 1,
3099 | 'моя' => 1,
3100 | 'моё' => 1,
3101 | 'мочь' => 1,
3102 | 'над' => 1,
3103 | 'нее' => 1,
3104 | 'оба' => 1,
3105 | 'нам' => 1,
3106 | 'нем' => 1,
3107 | 'нами' => 1,
3108 | 'ними' => 1,
3109 | 'мимо' => 1,
3110 | 'немного' => 1,
3111 | 'одной' => 1,
3112 | 'одного' => 1,
3113 | 'менее' => 1,
3114 | 'однажды' => 1,
3115 | 'однако' => 1,
3116 | 'меня' => 1,
3117 | 'нему' => 1,
3118 | 'меньше' => 1,
3119 | 'ней' => 1,
3120 | 'наверху' => 1,
3121 | 'него' => 1,
3122 | 'ниже' => 1,
3123 | 'мало' => 1,
3124 | 'надо' => 1,
3125 | 'один' => 1,
3126 | 'одиннадцать' => 1,
3127 | 'одиннадцатый' => 1,
3128 | 'назад' => 1,
3129 | 'наиболее' => 1,
3130 | 'недавно' => 1,
3131 | 'миллионов' => 1,
3132 | 'недалеко' => 1,
3133 | 'между' => 1,
3134 | 'низко' => 1,
3135 | 'меля' => 1,
3136 | 'нельзя' => 1,
3137 | 'нибудь' => 1,
3138 | 'непрерывно' => 1,
3139 | 'наконец' => 1,
3140 | 'никогда' => 1,
3141 | 'никуда' => 1,
3142 | 'нас' => 1,
3143 | 'наш' => 1,
3144 | 'нет' => 1,
3145 | 'нею' => 1,
3146 | 'неё' => 1,
3147 | 'них' => 1,
3148 | 'мира' => 1,
3149 | 'наша' => 1,
3150 | 'наше' => 1,
3151 | 'наши' => 1,
3152 | 'ничего' => 1,
3153 | 'начала' => 1,
3154 | 'нередко' => 1,
3155 | 'несколько' => 1,
3156 | 'обычно' => 1,
3157 | 'опять' => 1,
3158 | 'около' => 1,
3159 | 'мы' => 1,
3160 | 'ну' => 1,
3161 | 'нх' => 1,
3162 | 'от' => 1,
3163 | 'отовсюду' => 1,
3164 | 'особенно' => 1,
3165 | 'нужно' => 1,
3166 | 'очень' => 1,
3167 | 'отсюда' => 1,
3168 | 'в' => 1,
3169 | 'во' => 1,
3170 | 'вон' => 1,
3171 | 'вниз' => 1,
3172 | 'внизу' => 1,
3173 | 'вокруг' => 1,
3174 | 'вот' => 1,
3175 | 'восемнадцать' => 1,
3176 | 'восемнадцатый' => 1,
3177 | 'восемь' => 1,
3178 | 'восьмой' => 1,
3179 | 'вверх' => 1,
3180 | 'вам' => 1,
3181 | 'вами' => 1,
3182 | 'важное' => 1,
3183 | 'важная' => 1,
3184 | 'важные' => 1,
3185 | 'важный' => 1,
3186 | 'вдали' => 1,
3187 | 'везде' => 1,
3188 | 'ведь' => 1,
3189 | 'вас' => 1,
3190 | 'ваш' => 1,
3191 | 'ваша' => 1,
3192 | 'ваше' => 1,
3193 | 'ваши' => 1,
3194 | 'впрочем' => 1,
3195 | 'весь' => 1,
3196 | 'вдруг' => 1,
3197 | 'вы' => 1,
3198 | 'все' => 1,
3199 | 'второй' => 1,
3200 | 'всем' => 1,
3201 | 'всеми' => 1,
3202 | 'времени' => 1,
3203 | 'время' => 1,
3204 | 'всему' => 1,
3205 | 'всего' => 1,
3206 | 'всегда' => 1,
3207 | 'всех' => 1,
3208 | 'всею' => 1,
3209 | 'всю' => 1,
3210 | 'вся' => 1,
3211 | 'всё' => 1,
3212 | 'всюду' => 1,
3213 | 'г' => 1,
3214 | ' год' => 1,
3215 | 'говорил' => 1,
3216 | 'говорит' => 1,
3217 | 'года' => 1,
3218 | 'году' => 1,
3219 | 'где' => 1,
3220 | 'да' => 1,
3221 | 'ее' => 1,
3222 | 'за' => 1,
3223 | 'из' => 1,
3224 | 'ли' => 1,
3225 | 'же' => 1,
3226 | 'им' => 1,
3227 | 'до' => 1,
3228 | 'по' => 1,
3229 | 'ими' => 1,
3230 | 'под' => 1,
3231 | 'иногда' => 1,
3232 | 'довольно' => 1,
3233 | 'именно' => 1,
3234 | 'долго' => 1,
3235 | 'позже' => 1,
3236 | 'более' => 1,
3237 | 'должно' => 1,
3238 | 'пожалуйста' => 1,
3239 | 'значит' => 1,
3240 | 'иметь' => 1,
3241 | 'больше' => 1,
3242 | 'пока' => 1,
3243 | 'ему' => 1,
3244 | 'имя' => 1,
3245 | 'пор' => 1,
3246 | 'пора' => 1,
3247 | 'потом' => 1,
3248 | 'потому' => 1,
3249 | 'после' => 1,
3250 | 'почему' => 1,
3251 | 'почти' => 1,
3252 | 'посреди' => 1,
3253 | 'ей' => 1,
3254 | 'два' => 1,
3255 | 'две' => 1,
3256 | 'двенадцать' => 1,
3257 | 'двенадцатый' => 1,
3258 | 'двадцать' => 1,
3259 | 'двадцатый' => 1,
3260 | 'двух' => 1,
3261 | 'его' => 1,
3262 | 'дел' => 1,
3263 | 'или' => 1,
3264 | 'без' => 1,
3265 | 'день' => 1,
3266 | 'занят' => 1,
3267 | 'занята' => 1,
3268 | 'занято' => 1,
3269 | 'заняты' => 1,
3270 | 'действительно' => 1,
3271 | 'давно' => 1,
3272 | 'девятнадцать' => 1,
3273 | 'девятнадцатый' => 1,
3274 | 'девять' => 1,
3275 | 'девятый' => 1,
3276 | 'даже' => 1,
3277 | 'алло' => 1,
3278 | 'жизнь' => 1,
3279 | 'далеко' => 1,
3280 | 'близко' => 1,
3281 | 'здесь' => 1,
3282 | 'дальше' => 1,
3283 | 'для' => 1,
3284 | 'лет' => 1,
3285 | 'зато' => 1,
3286 | 'даром' => 1,
3287 | 'первый' => 1,
3288 | 'перед' => 1,
3289 | 'затем' => 1,
3290 | 'зачем' => 1,
3291 | 'лишь' => 1,
3292 | 'десять' => 1,
3293 | 'десятый' => 1,
3294 | 'ею' => 1,
3295 | 'её' => 1,
3296 | 'их' => 1,
3297 | 'бы' => 1,
3298 | 'еще' => 1,
3299 | 'при' => 1,
3300 | 'был' => 1,
3301 | 'про' => 1,
3302 | 'процентов' => 1,
3303 | 'против' => 1,
3304 | 'просто' => 1,
3305 | 'бывает' => 1,
3306 | 'бывь' => 1,
3307 | 'если' => 1,
3308 | 'люди' => 1,
3309 | 'была' => 1,
3310 | 'были' => 1,
3311 | 'было' => 1,
3312 | 'будем' => 1,
3313 | 'будет' => 1,
3314 | 'будете' => 1,
3315 | 'будешь' => 1,
3316 | 'прекрасно' => 1,
3317 | 'буду' => 1,
3318 | 'будь' => 1,
3319 | 'будто' => 1,
3320 | 'будут' => 1,
3321 | 'ещё' => 1,
3322 | 'пятнадцать' => 1,
3323 | 'пятнадцатый' => 1,
3324 | 'друго' => 1,
3325 | 'другое' => 1,
3326 | 'другой' => 1,
3327 | 'другие' => 1,
3328 | 'другая' => 1,
3329 | 'других' => 1,
3330 | 'есть' => 1,
3331 | 'пять' => 1,
3332 | 'быть' => 1,
3333 | 'лучше' => 1,
3334 | 'пятый' => 1,
3335 | 'к' => 1,
3336 | 'ком' => 1,
3337 | 'конечно' => 1,
3338 | 'кому' => 1,
3339 | 'кого' => 1,
3340 | 'когда' => 1,
3341 | 'которой' => 1,
3342 | 'которого' => 1,
3343 | 'которая' => 1,
3344 | 'которые' => 1,
3345 | 'который' => 1,
3346 | 'которых' => 1,
3347 | 'кем' => 1,
3348 | 'каждое' => 1,
3349 | 'каждая' => 1,
3350 | 'каждые' => 1,
3351 | 'каждый' => 1,
3352 | 'кажется' => 1,
3353 | 'как' => 1,
3354 | 'какой' => 1,
3355 | 'какая' => 1,
3356 | 'кто' => 1,
3357 | 'кроме' => 1,
3358 | 'куда' => 1,
3359 | 'кругом' => 1,
3360 | 'с' => 1,
3361 | ' т' => 1,
3362 | 'у' => 1,
3363 | 'я' => 1,
3364 | 'та' => 1,
3365 | 'те' => 1,
3366 | 'уж' => 1,
3367 | 'со' => 1,
3368 | 'то' => 1,
3369 | 'том' => 1,
3370 | 'снова' => 1,
3371 | 'тому' => 1,
3372 | 'совсем' => 1,
3373 | 'того' => 1,
3374 | 'тогда' => 1,
3375 | 'тоже' => 1,
3376 | 'собой' => 1,
3377 | 'тобой' => 1,
3378 | 'собою' => 1,
3379 | 'тобою' => 1,
3380 | 'сначала' => 1,
3381 | 'только' => 1,
3382 | 'уметь' => 1,
3383 | 'тот' => 1,
3384 | 'тою' => 1,
3385 | 'хорошо' => 1,
3386 | 'хотеть' => 1,
3387 | 'хочешь' => 1,
3388 | 'хоть' => 1,
3389 | 'хотя' => 1,
3390 | 'свое' => 1,
3391 | 'свои' => 1,
3392 | 'твой' => 1,
3393 | 'своей' => 1,
3394 | 'своего' => 1,
3395 | 'своих' => 1,
3396 | 'свою' => 1,
3397 | 'твоя' => 1,
3398 | 'твоё' => 1,
3399 | 'раз' => 1,
3400 | 'уже' => 1,
3401 | 'сам' => 1,
3402 | 'там' => 1,
3403 | 'тем' => 1,
3404 | 'чем' => 1,
3405 | 'сама' => 1,
3406 | 'сами' => 1,
3407 | 'теми' => 1,
3408 | 'само' => 1,
3409 | 'рано' => 1,
3410 | 'самом' => 1,
3411 | 'самому' => 1,
3412 | 'самой' => 1,
3413 | 'самого' => 1,
3414 | 'семнадцать' => 1,
3415 | 'семнадцатый' => 1,
3416 | 'самим' => 1,
3417 | 'самими' => 1,
3418 | 'самих' => 1,
3419 | 'саму' => 1,
3420 | 'семь' => 1,
3421 | 'чему' => 1,
3422 | 'раньше' => 1,
3423 | 'сейчас' => 1,
3424 | 'чего' => 1,
3425 | 'сегодня' => 1,
3426 | 'себе' => 1,
3427 | 'тебе' => 1,
3428 | 'сеаой' => 1,
3429 | 'человек' => 1,
3430 | 'разве' => 1,
3431 | 'теперь' => 1,
3432 | 'себя' => 1,
3433 | 'тебя' => 1,
3434 | 'седьмой' => 1,
3435 | 'спасибо' => 1,
3436 | 'слишком' => 1,
3437 | 'так' => 1,
3438 | 'такое' => 1,
3439 | 'такой' => 1,
3440 | 'такие' => 1,
3441 | 'также' => 1,
3442 | 'такая' => 1,
3443 | 'сих' => 1,
3444 | 'тех' => 1,
3445 | 'чаще' => 1,
3446 | 'четвертый' => 1,
3447 | 'через' => 1,
3448 | 'часто' => 1,
3449 | 'шестой' => 1,
3450 | 'шестнадцать' => 1,
3451 | 'шестнадцатый' => 1,
3452 | 'шесть' => 1,
3453 | 'четыре' => 1,
3454 | 'четырнадцать' => 1,
3455 | 'четырнадцатый' => 1,
3456 | 'сколько' => 1,
3457 | 'сказал' => 1,
3458 | 'сказала' => 1,
3459 | 'сказать' => 1,
3460 | 'ту' => 1,
3461 | 'ты' => 1,
3462 | 'три' => 1,
3463 | 'эта' => 1,
3464 | 'эти' => 1,
3465 | 'что' => 1,
3466 | 'это' => 1,
3467 | 'чтоб' => 1,
3468 | 'этом' => 1,
3469 | 'этому' => 1,
3470 | 'этой' => 1,
3471 | 'этого' => 1,
3472 | 'чтобы' => 1,
3473 | 'этот' => 1,
3474 | 'стал' => 1,
3475 | 'туда' => 1,
3476 | 'этим' => 1,
3477 | 'этими' => 1,
3478 | 'рядом' => 1,
3479 | 'тринадцать' => 1,
3480 | 'тринадцатый' => 1,
3481 | 'этих' => 1,
3482 | 'третий' => 1,
3483 | 'тут' => 1,
3484 | 'эту' => 1,
3485 | 'суть' => 1,
3486 | 'чуть' => 1,
3487 | 'тысяч' => 1,
3488 | ),
3489 | 'spanish' =>
3490 | array (
3491 | 'un' => 1,
3492 | 'una' => 1,
3493 | 'unas' => 1,
3494 | 'unos' => 1,
3495 | 'uno' => 1,
3496 | 'sobre' => 1,
3497 | 'todo' => 1,
3498 | 'también' => 1,
3499 | 'tras' => 1,
3500 | 'otro' => 1,
3501 | 'algún' => 1,
3502 | 'alguno' => 1,
3503 | 'alguna' => 1,
3504 | 'algunos' => 1,
3505 | 'algunas' => 1,
3506 | 'ser' => 1,
3507 | 'es' => 1,
3508 | 'soy' => 1,
3509 | 'eres' => 1,
3510 | 'somos' => 1,
3511 | 'sois' => 1,
3512 | 'estoy' => 1,
3513 | 'esta' => 1,
3514 | 'estamos' => 1,
3515 | 'estais' => 1,
3516 | 'estan' => 1,
3517 | 'como' => 1,
3518 | 'en' => 1,
3519 | 'para' => 1,
3520 | 'atras' => 1,
3521 | 'porque' => 1,
3522 | 'por qué' => 1,
3523 | 'estado' => 1,
3524 | 'estaba' => 1,
3525 | 'ante' => 1,
3526 | 'antes' => 1,
3527 | 'siendo' => 1,
3528 | 'ambos' => 1,
3529 | 'pero' => 1,
3530 | 'por' => 1,
3531 | 'poder' => 1,
3532 | 'puede' => 1,
3533 | 'puedo' => 1,
3534 | 'podemos' => 1,
3535 | 'podeis' => 1,
3536 | 'pueden' => 1,
3537 | 'fui' => 1,
3538 | 'fue' => 1,
3539 | 'fuimos' => 1,
3540 | 'fueron' => 1,
3541 | 'hacer' => 1,
3542 | 'hago' => 1,
3543 | 'hace' => 1,
3544 | 'hacemos' => 1,
3545 | 'haceis' => 1,
3546 | 'hacen' => 1,
3547 | 'cada' => 1,
3548 | 'fin' => 1,
3549 | 'incluso' => 1,
3550 | 'primero desde' => 1,
3551 | 'conseguir' => 1,
3552 | 'consigo' => 1,
3553 | 'consigue' => 1,
3554 | 'consigues' => 1,
3555 | 'conseguimos' => 1,
3556 | 'consiguen' => 1,
3557 | 'ir' => 1,
3558 | 'voy' => 1,
3559 | 'va' => 1,
3560 | 'vamos' => 1,
3561 | 'vais' => 1,
3562 | 'van' => 1,
3563 | 'vaya' => 1,
3564 | 'gueno' => 1,
3565 | 'ha' => 1,
3566 | 'tener' => 1,
3567 | 'tengo' => 1,
3568 | 'tiene' => 1,
3569 | 'tenemos' => 1,
3570 | 'teneis' => 1,
3571 | 'tienen' => 1,
3572 | 'el' => 1,
3573 | 'la' => 1,
3574 | 'lo' => 1,
3575 | 'las' => 1,
3576 | 'los' => 1,
3577 | 'su' => 1,
3578 | 'aqui' => 1,
3579 | 'mio' => 1,
3580 | 'tuyo' => 1,
3581 | 'ellos' => 1,
3582 | 'ellas' => 1,
3583 | 'nos' => 1,
3584 | 'nosotros' => 1,
3585 | 'vosotros' => 1,
3586 | 'vosotras' => 1,
3587 | 'si' => 1,
3588 | 'dentro' => 1,
3589 | 'solo' => 1,
3590 | 'solamente' => 1,
3591 | 'saber' => 1,
3592 | 'sabes' => 1,
3593 | 'sabe' => 1,
3594 | 'sabemos' => 1,
3595 | 'sabeis' => 1,
3596 | 'saben' => 1,
3597 | 'ultimo' => 1,
3598 | 'largo' => 1,
3599 | 'bastante' => 1,
3600 | 'haces' => 1,
3601 | 'muchos' => 1,
3602 | 'aquellos' => 1,
3603 | 'aquellas' => 1,
3604 | 'sus' => 1,
3605 | 'entonces' => 1,
3606 | 'tiempo' => 1,
3607 | 'verdad' => 1,
3608 | 'verdadero' => 1,
3609 | 'verdadera cierto' => 1,
3610 | 'ciertos' => 1,
3611 | 'cierta' => 1,
3612 | 'ciertas' => 1,
3613 | 'intentar' => 1,
3614 | 'intento' => 1,
3615 | 'intenta' => 1,
3616 | 'intentas' => 1,
3617 | 'intentamos' => 1,
3618 | 'intentais' => 1,
3619 | 'intentan' => 1,
3620 | 'dos' => 1,
3621 | 'bajo' => 1,
3622 | 'arriba' => 1,
3623 | 'encima' => 1,
3624 | 'usar' => 1,
3625 | 'uso' => 1,
3626 | 'usas' => 1,
3627 | 'usa' => 1,
3628 | 'usamos' => 1,
3629 | 'usais' => 1,
3630 | 'usan' => 1,
3631 | 'emplear' => 1,
3632 | 'empleo' => 1,
3633 | 'empleas' => 1,
3634 | 'emplean' => 1,
3635 | 'ampleamos' => 1,
3636 | 'empleais' => 1,
3637 | 'valor' => 1,
3638 | 'muy' => 1,
3639 | 'era' => 1,
3640 | 'eras' => 1,
3641 | 'eramos' => 1,
3642 | 'eran' => 1,
3643 | 'modo' => 1,
3644 | 'bien' => 1,
3645 | 'cual' => 1,
3646 | 'cuando' => 1,
3647 | 'donde' => 1,
3648 | 'mientras' => 1,
3649 | 'quien' => 1,
3650 | 'con' => 1,
3651 | 'entre' => 1,
3652 | 'sin' => 1,
3653 | 'trabajo' => 1,
3654 | 'trabajar' => 1,
3655 | 'trabajas' => 1,
3656 | 'trabaja' => 1,
3657 | 'trabajamos' => 1,
3658 | 'trabajais' => 1,
3659 | 'trabajan' => 1,
3660 | 'podria' => 1,
3661 | 'podrias' => 1,
3662 | 'podriamos' => 1,
3663 | 'podrian' => 1,
3664 | 'podriais' => 1,
3665 | 'yo' => 1,
3666 | 'aquel' => 1,
3667 | ),
3668 | 'swedish' =>
3669 | array (
3670 | 'aderton' => 1,
3671 | 'adertonde' => 1,
3672 | 'adjö' => 1,
3673 | 'aldrig' => 1,
3674 | 'alla' => 1,
3675 | 'allas' => 1,
3676 | 'allt' => 1,
3677 | 'alltid' => 1,
3678 | 'alltså' => 1,
3679 | 'än' => 1,
3680 | 'andra' => 1,
3681 | 'andras' => 1,
3682 | 'annan' => 1,
3683 | 'annat' => 1,
3684 | 'ännu' => 1,
3685 | 'artonde' => 1,
3686 | 'artonn' => 1,
3687 | 'åtminstone' => 1,
3688 | 'att' => 1,
3689 | 'åtta' => 1,
3690 | 'åttio' => 1,
3691 | 'åttionde' => 1,
3692 | 'åttonde' => 1,
3693 | 'av' => 1,
3694 | 'även' => 1,
3695 | 'båda' => 1,
3696 | 'bådas' => 1,
3697 | 'bakom' => 1,
3698 | 'bara' => 1,
3699 | 'bäst' => 1,
3700 | 'bättre' => 1,
3701 | 'behöva' => 1,
3702 | 'behövas' => 1,
3703 | 'behövde' => 1,
3704 | 'behövt' => 1,
3705 | 'beslut' => 1,
3706 | 'beslutat' => 1,
3707 | 'beslutit' => 1,
3708 | 'bland' => 1,
3709 | 'blev' => 1,
3710 | 'bli' => 1,
3711 | 'blir' => 1,
3712 | 'blivit' => 1,
3713 | 'bort' => 1,
3714 | 'borta' => 1,
3715 | 'bra' => 1,
3716 | 'då' => 1,
3717 | 'dag' => 1,
3718 | 'dagar' => 1,
3719 | 'dagarna' => 1,
3720 | 'dagen' => 1,
3721 | 'där' => 1,
3722 | 'därför' => 1,
3723 | 'de' => 1,
3724 | 'del' => 1,
3725 | 'delen' => 1,
3726 | 'dem' => 1,
3727 | 'den' => 1,
3728 | 'deras' => 1,
3729 | 'dess' => 1,
3730 | 'det' => 1,
3731 | 'detta' => 1,
3732 | 'dig' => 1,
3733 | 'din' => 1,
3734 | 'dina' => 1,
3735 | 'dit' => 1,
3736 | 'ditt' => 1,
3737 | 'dock' => 1,
3738 | 'du' => 1,
3739 | 'efter' => 1,
3740 | 'eftersom' => 1,
3741 | 'elfte' => 1,
3742 | 'eller' => 1,
3743 | 'elva' => 1,
3744 | 'en' => 1,
3745 | 'enkel' => 1,
3746 | 'enkelt' => 1,
3747 | 'enkla' => 1,
3748 | 'enligt' => 1,
3749 | 'er' => 1,
3750 | 'era' => 1,
3751 | 'ert' => 1,
3752 | 'ett' => 1,
3753 | 'ettusen' => 1,
3754 | 'få' => 1,
3755 | 'fanns' => 1,
3756 | 'får' => 1,
3757 | 'fått' => 1,
3758 | 'fem' => 1,
3759 | 'femte' => 1,
3760 | 'femtio' => 1,
3761 | 'femtionde' => 1,
3762 | 'femton' => 1,
3763 | 'femtonde' => 1,
3764 | 'fick' => 1,
3765 | 'fin' => 1,
3766 | 'finnas' => 1,
3767 | 'finns' => 1,
3768 | 'fjärde' => 1,
3769 | 'fjorton' => 1,
3770 | 'fjortonde' => 1,
3771 | 'fler' => 1,
3772 | 'flera' => 1,
3773 | 'flesta' => 1,
3774 | 'följande' => 1,
3775 | 'för' => 1,
3776 | 'före' => 1,
3777 | 'förlåt' => 1,
3778 | 'förra' => 1,
3779 | 'första' => 1,
3780 | 'fram' => 1,
3781 | 'framför' => 1,
3782 | 'från' => 1,
3783 | 'fyra' => 1,
3784 | 'fyrtio' => 1,
3785 | 'fyrtionde' => 1,
3786 | 'gå' => 1,
3787 | 'gälla' => 1,
3788 | 'gäller' => 1,
3789 | 'gällt' => 1,
3790 | 'går' => 1,
3791 | 'gärna' => 1,
3792 | 'gått' => 1,
3793 | 'genast' => 1,
3794 | 'genom' => 1,
3795 | 'gick' => 1,
3796 | 'gjorde' => 1,
3797 | 'gjort' => 1,
3798 | 'god' => 1,
3799 | 'goda' => 1,
3800 | 'godare' => 1,
3801 | 'godast' => 1,
3802 | 'gör' => 1,
3803 | 'göra' => 1,
3804 | 'gott' => 1,
3805 | 'ha' => 1,
3806 | 'hade' => 1,
3807 | 'haft' => 1,
3808 | 'han' => 1,
3809 | 'hans' => 1,
3810 | 'har' => 1,
3811 | 'här' => 1,
3812 | 'heller' => 1,
3813 | 'hellre' => 1,
3814 | 'helst' => 1,
3815 | 'helt' => 1,
3816 | 'henne' => 1,
3817 | 'hennes' => 1,
3818 | 'hit' => 1,
3819 | 'hög' => 1,
3820 | 'höger' => 1,
3821 | 'högre' => 1,
3822 | 'högst' => 1,
3823 | 'hon' => 1,
3824 | 'honom' => 1,
3825 | 'hundra' => 1,
3826 | 'hundraen' => 1,
3827 | 'hundraett' => 1,
3828 | 'hur' => 1,
3829 | 'i' => 1,
3830 | 'ibland' => 1,
3831 | 'idag' => 1,
3832 | 'igår' => 1,
3833 | 'igen' => 1,
3834 | 'imorgon' => 1,
3835 | 'in' => 1,
3836 | 'inför' => 1,
3837 | 'inga' => 1,
3838 | 'ingen' => 1,
3839 | 'ingenting' => 1,
3840 | 'inget' => 1,
3841 | 'innan' => 1,
3842 | 'inne' => 1,
3843 | 'inom' => 1,
3844 | 'inte' => 1,
3845 | 'inuti' => 1,
3846 | 'ja' => 1,
3847 | 'jag' => 1,
3848 | 'jämfört' => 1,
3849 | 'kan' => 1,
3850 | ' kanske' => 1,
3851 | 'knappast' => 1,
3852 | 'kom' => 1,
3853 | 'komma' => 1,
3854 | 'kommer' => 1,
3855 | 'kommit' => 1,
3856 | 'kr' => 1,
3857 | 'kunde' => 1,
3858 | 'kunna' => 1,
3859 | 'kunnat' => 1,
3860 | 'kvar' => 1,
3861 | 'länge' => 1,
3862 | 'längre' => 1,
3863 | 'långsam' => 1,
3864 | 'långsammare' => 1,
3865 | 'långsammast' => 1,
3866 | 'långsamt' => 1,
3867 | 'längst' => 1,
3868 | 'långt' => 1,
3869 | 'lätt' => 1,
3870 | 'lättare' => 1,
3871 | 'lättast' => 1,
3872 | 'legat' => 1,
3873 | 'ligga' => 1,
3874 | 'ligger' => 1,
3875 | 'lika' => 1,
3876 | 'likställd' => 1,
3877 | 'likställda' => 1,
3878 | 'lilla' => 1,
3879 | 'lite' => 1,
3880 | 'liten' => 1,
3881 | 'litet' => 1,
3882 | 'man' => 1,
3883 | 'många' => 1,
3884 | 'måste' => 1,
3885 | 'med' => 1,
3886 | 'mellan' => 1,
3887 | 'men' => 1,
3888 | 'mer' => 1,
3889 | 'mera' => 1,
3890 | 'mest' => 1,
3891 | 'mig' => 1,
3892 | 'min' => 1,
3893 | 'mina' => 1,
3894 | 'mindre' => 1,
3895 | 'minst' => 1,
3896 | 'mitt' => 1,
3897 | 'mittemot' => 1,
3898 | 'möjlig' => 1,
3899 | 'möjligen' => 1,
3900 | 'möjligt' => 1,
3901 | 'möjligtvis' => 1,
3902 | 'mot' => 1,
3903 | 'mycket' => 1,
3904 | 'någon' => 1,
3905 | 'någonting' => 1,
3906 | 'något' => 1,
3907 | 'några' => 1,
3908 | 'när' => 1,
3909 | 'nästa' => 1,
3910 | 'ned' => 1,
3911 | 'nederst' => 1,
3912 | 'nedersta' => 1,
3913 | 'nedre' => 1,
3914 | 'nej' => 1,
3915 | 'ner' => 1,
3916 | 'ni' => 1,
3917 | 'nio' => 1,
3918 | 'nionde' => 1,
3919 | 'nittio' => 1,
3920 | 'nittionde' => 1,
3921 | 'nitton' => 1,
3922 | 'nittonde' => 1,
3923 | 'nödvändig' => 1,
3924 | 'nödvändiga' => 1,
3925 | 'nödvändigt' => 1,
3926 | 'nödvändigtvis' => 1,
3927 | 'nog' => 1,
3928 | 'noll' => 1,
3929 | 'nr' => 1,
3930 | 'nu' => 1,
3931 | 'nummer' => 1,
3932 | 'och' => 1,
3933 | 'också' => 1,
3934 | 'ofta' => 1,
3935 | 'oftast' => 1,
3936 | 'olika' => 1,
3937 | 'olikt' => 1,
3938 | 'om' => 1,
3939 | 'oss' => 1,
3940 | 'över' => 1,
3941 | 'övermorgon' => 1,
3942 | 'överst' => 1,
3943 | 'övre' => 1,
3944 | 'på' => 1,
3945 | 'rakt' => 1,
3946 | 'rätt' => 1,
3947 | 'redan' => 1,
3948 | 'så' => 1,
3949 | 'sade' => 1,
3950 | 'säga' => 1,
3951 | 'säger' => 1,
3952 | 'sagt' => 1,
3953 | 'samma' => 1,
3954 | 'sämre' => 1,
3955 | 'sämst' => 1,
3956 | 'sedan' => 1,
3957 | 'senare' => 1,
3958 | 'senast' => 1,
3959 | 'sent' => 1,
3960 | 'sex' => 1,
3961 | 'sextio' => 1,
3962 | 'sextionde' => 1,
3963 | 'sexton' => 1,
3964 | 'sextonde' => 1,
3965 | 'sig' => 1,
3966 | 'sin' => 1,
3967 | 'sina' => 1,
3968 | 'sist' => 1,
3969 | 'sista' => 1,
3970 | 'siste' => 1,
3971 | 'sitt' => 1,
3972 | 'sjätte' => 1,
3973 | 'sju' => 1,
3974 | 'sjunde' => 1,
3975 | 'sjuttio' => 1,
3976 | 'sjuttionde' => 1,
3977 | 'sjutton' => 1,
3978 | 'sjuttonde' => 1,
3979 | 'ska' => 1,
3980 | 'skall' => 1,
3981 | 'skulle' => 1,
3982 | 'slutligen' => 1,
3983 | 'små' => 1,
3984 | 'smått' => 1,
3985 | 'snart' => 1,
3986 | 'som' => 1,
3987 | 'stor' => 1,
3988 | 'stora' => 1,
3989 | 'större' => 1,
3990 | 'störst' => 1,
3991 | 'stort' => 1,
3992 | 'tack' => 1,
3993 | 'tidig' => 1,
3994 | 'tidigare' => 1,
3995 | 'tidigast' => 1,
3996 | 'tidigt' => 1,
3997 | 'till' => 1,
3998 | 'tills' => 1,
3999 | 'tillsammans' => 1,
4000 | 'tio' => 1,
4001 | 'tionde' => 1,
4002 | 'tjugo' => 1,
4003 | 'tjugoen' => 1,
4004 | 'tjugoett' => 1,
4005 | 'tjugonde' => 1,
4006 | 'tjugotre' => 1,
4007 | 'tjugotvå' => 1,
4008 | 'tjungo' => 1,
4009 | 'tolfte' => 1,
4010 | 'tolv' => 1,
4011 | 'tre' => 1,
4012 | 'tredje' => 1,
4013 | 'trettio' => 1,
4014 | 'trettionde' => 1,
4015 | 'tretton' => 1,
4016 | 'trettonde' => 1,
4017 | 'två' => 1,
4018 | 'tvåhundra' => 1,
4019 | 'under' => 1,
4020 | 'upp' => 1,
4021 | 'ur' => 1,
4022 | 'ursäkt' => 1,
4023 | 'ut' => 1,
4024 | 'utan' => 1,
4025 | 'utanför' => 1,
4026 | 'ute' => 1,
4027 | 'vad' => 1,
4028 | 'vänster' => 1,
4029 | 'vänstra' => 1,
4030 | ' var' => 1,
4031 | 'vår' => 1,
4032 | 'vara' => 1,
4033 | 'våra' => 1,
4034 | 'varför' => 1,
4035 | 'varifrån' => 1,
4036 | 'varit' => 1,
4037 | 'varken' => 1,
4038 | 'värre' => 1,
4039 | 'varsågod' => 1,
4040 | 'vart' => 1,
4041 | 'vårt' => 1,
4042 | 'vem' => 1,
4043 | 'vems' => 1,
4044 | 'verkligen' => 1,
4045 | 'vi' => 1,
4046 | 'vid' => 1,
4047 | 'vidare' => 1,
4048 | 'viktig' => 1,
4049 | 'viktigare' => 1,
4050 | 'viktigast' => 1,
4051 | 'viktigt' => 1,
4052 | 'vilka' => 1,
4053 | 'vilken' => 1,
4054 | 'vilket' => 1,
4055 | 'vill' => 1,
4056 | ),
4057 | 'turkish' =>
4058 | array (
4059 | 'acaba' => 1,
4060 | 'altmýþ' => 1,
4061 | 'altý' => 1,
4062 | 'ama' => 1,
4063 | 'bana' => 1,
4064 | 'bazý' => 1,
4065 | 'belki' => 1,
4066 | 'ben' => 1,
4067 | 'benden' => 1,
4068 | 'beni' => 1,
4069 | 'benim' => 1,
4070 | 'beþ' => 1,
4071 | 'bin' => 1,
4072 | 'bir' => 1,
4073 | 'biri' => 1,
4074 | 'birkaç' => 1,
4075 | 'birkez' => 1,
4076 | 'birþey' => 1,
4077 | 'birþeyi' => 1,
4078 | 'biz' => 1,
4079 | 'bizden' => 1,
4080 | 'bizi' => 1,
4081 | 'bizim' => 1,
4082 | 'bu' => 1,
4083 | 'buna' => 1,
4084 | 'bunda' => 1,
4085 | 'bundan' => 1,
4086 | 'bunu' => 1,
4087 | 'bunun' => 1,
4088 | 'da' => 1,
4089 | 'daha' => 1,
4090 | 'dahi' => 1,
4091 | 'de' => 1,
4092 | 'defa' => 1,
4093 | 'diye' => 1,
4094 | 'doksan' => 1,
4095 | 'dokuz' => 1,
4096 | 'dört' => 1,
4097 | 'elli' => 1,
4098 | 'en gibi' => 1,
4099 | 'hem' => 1,
4100 | 'hep' => 1,
4101 | 'hepsi' => 1,
4102 | 'her' => 1,
4103 | 'hiç' => 1,
4104 | 'iki' => 1,
4105 | 'ile' => 1,
4106 | 'INSERmi' => 1,
4107 | 'ise' => 1,
4108 | 'için' => 1,
4109 | 'katrilyon' => 1,
4110 | 'kez' => 1,
4111 | 'ki' => 1,
4112 | 'kim' => 1,
4113 | 'kimden' => 1,
4114 | 'kime' => 1,
4115 | 'kimi' => 1,
4116 | 'kýrk' => 1,
4117 | 'milyar' => 1,
4118 | 'milyon' => 1,
4119 | 'mu' => 1,
4120 | 'mü' => 1,
4121 | 'mý' => 1,
4122 | 'nasýl' => 1,
4123 | 'ne' => 1,
4124 | 'neden' => 1,
4125 | 'nerde' => 1,
4126 | 'nerede' => 1,
4127 | 'nereye' => 1,
4128 | 'niye' => 1,
4129 | 'niçin' => 1,
4130 | 'on' => 1,
4131 | 'ona' => 1,
4132 | 'ondan' => 1,
4133 | 'onlar' => 1,
4134 | 'onlardan' => 1,
4135 | 'onlari' => 1,
4136 | 'onlarýn' => 1,
4137 | 'onu otuz' => 1,
4138 | 'sanki' => 1,
4139 | 'sekiz' => 1,
4140 | 'seksen' => 1,
4141 | 'sen' => 1,
4142 | 'senden' => 1,
4143 | 'seni' => 1,
4144 | 'senin' => 1,
4145 | 'siz' => 1,
4146 | 'sizden' => 1,
4147 | 'sizi' => 1,
4148 | 'sizin' => 1,
4149 | 'trilyon' => 1,
4150 | 'tüm' => 1,
4151 | 've' => 1,
4152 | 'veya' => 1,
4153 | 'ya' => 1,
4154 | 'yani' => 1,
4155 | 'yedi' => 1,
4156 | 'yetmiþ' => 1,
4157 | 'yirmi' => 1,
4158 | 'yüz' => 1,
4159 | 'çok' => 1,
4160 | 'çünkü' => 1,
4161 | 'üç' => 1,
4162 | 'þey' => 1,
4163 | 'þeyden' => 1,
4164 | 'þeyi' => 1,
4165 | 'þeyler' => 1,
4166 | 'þu' => 1,
4167 | 'þuna' => 1,
4168 | 'þunda' => 1,
4169 | 'þundan' => 1,
4170 | 'þunu' => 1,
4171 | ),
4172 | );
--------------------------------------------------------------------------------
/lib/TextRank/Stopword/czech-stopwords.txt:
--------------------------------------------------------------------------------
1 | dnes
2 | cz
3 | timto
4 | budes
5 | budem
6 | byli
7 | jses
8 | muj
9 | svym
10 | ta
11 | tomto
12 | tohle
13 | tuto
14 | tyto
15 | jej
16 | zda
17 | proc
18 | mate
19 | tato
20 | kam
21 | tohoto
22 | kdo
23 | kteri
24 | mi
25 | nam
26 | tom
27 | tomuto
28 | mit
29 | nic
30 | proto
31 | kterou
32 | byla
33 | toho
34 | protoze
35 | asi
36 | ho
37 | nasi
38 | napiste
39 | re
40 | coz
41 | tim
42 | takze
43 | svych
44 | jeji
45 | svymi
46 | jste
47 | aj
48 | tu
49 | tedy
50 | teto bylo
51 | kde
52 | ke
53 | prave
54 | ji
55 | nad
56 | nejsou
57 | ci
58 | pod
59 | tema
60 | mezi
61 | pres
62 | ty
63 | pak
64 | vam
65 | ani
66 | kdyz
67 | vsak
68 | ne
69 | jsem
70 | tento
71 | clanku
72 | clanky
73 | aby
74 | jsme
75 | pred
76 | pta
77 | jejich
78 | byl
79 | jeste
80 | az
81 | bez
82 | take
83 | pouze
84 | prvni
85 | vase
86 | ktera
87 | nas
88 | novy
89 | tipy
90 | pokud
91 | muze
92 | design
93 | strana
94 | jeho
95 | sve
96 | jine
97 | zpravy
98 | nove
99 | neni vas
100 | jen
101 | podle
102 | zde
103 | clanek
104 | uz
105 | email
106 | byt
107 | vice
108 | bude
109 | jiz
110 | nez
111 | ktery
112 | by
113 | ktere
114 | co
115 | nebo
116 | ten
117 | tak
118 | ma
119 | pri
120 | od
121 | po
122 | jsou
123 | jak
124 | dalsi
125 | ale
126 | si
127 | ve
128 | to
129 | jako
130 | za
131 | zpet
132 | ze
133 | do
134 | pro
135 | je
136 | na
137 |
--------------------------------------------------------------------------------
/lib/TextRank/Stopword/danish-stopwords.txt:
--------------------------------------------------------------------------------
1 | af
2 | alle
3 | andet
4 | andre
5 | at
6 | begge
7 | da
8 | de
9 | den
10 | denne
11 | der
12 | deres
13 | det
14 | dette
15 | dig
16 | din
17 | dog
18 | du
19 | ej
20 | eller
21 | en
22 | end
23 | ene
24 | eneste
25 | enhver
26 | et
27 | fem
28 | fire
29 | flere
30 | fleste
31 | for
32 | fordi
33 | forrige
34 | fra
35 | få
36 | før
37 | god
38 | han
39 | hans
40 | har
41 | hendes
42 | her
43 | hun
44 | hvad
45 | hvem
46 | hver
47 | hvilken
48 | hvis
49 | hvor
50 | hvordan
51 | hvorfor
52 | hvornår
53 | i
54 | ikke
55 | ind
56 | ingen
57 | intet
58 | jeg
59 | jeres
60 | kan
61 | kom
62 | kommer
63 | lav
64 | lidt
65 | lille
66 | man
67 | mand
68 | mange
69 | med
70 | meget
71 | men
72 | mens
73 | mere
74 | mig
75 | ned
76 | ni
77 | nogen
78 | noget
79 | ny
80 | nyt
81 | nær
82 | næste
83 | næsten
84 | og
85 | op
86 | otte
87 | over
88 | på
89 | se
90 | seks
91 | ses
92 | som
93 | stor
94 | store
95 | syv
96 | ti
97 | til
98 | to
99 | tre
100 | ud
101 | var
102 |
--------------------------------------------------------------------------------
/lib/TextRank/Stopword/dutch-stopwords.txt:
--------------------------------------------------------------------------------
1 | aan
2 | af
3 | al
4 | als
5 | bij
6 | dan
7 | dat
8 | die
9 | dit
10 | een
11 | en
12 | er
13 | had
14 | heb
15 | hem
16 | het
17 | hij
18 | hoe
19 | hun
20 | ik
21 | in
22 | is
23 | je
24 | kan
25 | me
26 | men
27 | met
28 | mij
29 | nog
30 | nu
31 | of
32 | ons
33 | ook
34 | te
35 | tot
36 | uit
37 | van
38 | was
39 | wat
40 | we
41 | wel
42 | wij
43 | zal
44 | ze
45 | zei
46 | zij
47 | zo
48 | zou
49 |
--------------------------------------------------------------------------------
/lib/TextRank/Stopword/english-stopwords.txt:
--------------------------------------------------------------------------------
1 | a
2 | about
3 | above
4 | after
5 | again
6 | against
7 | all
8 | am
9 | an
10 | and
11 | any
12 | are
13 | aren't
14 | as
15 | at
16 | be
17 | because
18 | been
19 | before
20 | being
21 | below
22 | between
23 | both
24 | but
25 | by
26 | can't
27 | cannot
28 | could
29 | couldn't
30 | did
31 | didn't
32 | do
33 | does
34 | doesn't
35 | doing
36 | don't
37 | down
38 | during
39 | each
40 | e.g.
41 | few
42 | for
43 | from
44 | further
45 | had
46 | hadn't
47 | has
48 | hasn't
49 | have
50 | haven't
51 | having
52 | he
53 | he'd
54 | he'll
55 | he's
56 | her
57 | here
58 | here's
59 | hers
60 | herself
61 | him
62 | himself
63 | his
64 | how
65 | how's
66 | i
67 | i'd
68 | i'll
69 | i'm
70 | i've
71 | if
72 | in
73 | into
74 | is
75 | isn't
76 | it
77 | it's
78 | its
79 | itself
80 | let's
81 | me
82 | more
83 | most
84 | mustn't
85 | my
86 | myself
87 | no
88 | nor
89 | not
90 | of
91 | off
92 | on
93 | once
94 | only
95 | or
96 | other
97 | ought
98 | our
99 | ours
100 | ourselves
101 | out
102 | over
103 | own
104 | same
105 | shan't
106 | she
107 | she'd
108 | she'll
109 | she's
110 | should
111 | shouldn't
112 | so
113 | some
114 | such
115 | than
116 | that
117 | that's
118 | the
119 | their
120 | theirs
121 | them
122 | themselves
123 | then
124 | there
125 | there's
126 | these
127 | they
128 | they'd
129 | they'll
130 | they're
131 | they've
132 | this
133 | those
134 | through
135 | to
136 | too
137 | under
138 | until
139 | up
140 | very
141 | was
142 | wasn't
143 | we
144 | we'd
145 | we'll
146 | we're
147 | we've
148 | were
149 | weren't
150 | what
151 | what's
152 | when
153 | when's
154 | where
155 | where's
156 | which
157 | while
158 | who
159 | who's
160 | whom
161 | why
162 | why's
163 | with
164 | won't
165 | would
166 | wouldn't
167 | you
168 | you'd
169 | you'll
170 | you're
171 | you've
172 | your
173 | yours
174 | yourself
175 | yourselves
176 |
--------------------------------------------------------------------------------
/lib/TextRank/Stopword/finnish-stopwords.txt:
--------------------------------------------------------------------------------
1 | aiemmin
2 | aika
3 | aikaa
4 | aikaan
5 | aikaisemmin
6 | aikaisin
7 | aikajen
8 | aikana
9 | aikoina
10 | aikoo
11 | aikovat
12 | aina
13 | ainakaan
14 | ainakin
15 | ainoa
16 | ainoat
17 | aiomme
18 | aion
19 | aiotte
20 | aist
21 | aivan
22 | ajan
23 | älä
24 | alas
25 | alemmas
26 | älköön
27 | alkuisin
28 | alkuun
29 | alla
30 | alle
31 | aloitamme
32 | aloitan
33 | aloitat
34 | aloitatte
35 | aloitattivat
36 | aloitettava
37 | aloitettevaksi
38 | aloitettu
39 | aloitimme
40 | aloitin
41 | aloitit
42 | aloititte
43 | aloittaa
44 | aloittamatta
45 | aloitti
46 | aloittivat
47 | alta
48 | aluksi
49 | alussa
50 | alusta
51 | annettavaksi
52 | annetteva
53 | annettu
54 | antaa
55 | antamatta
56 | antoi
57 | aoua
58 | apu
59 | asia
60 | asiaa
61 | asian
62 | asiasta
63 | asiat
64 | asioiden
65 | asioihin
66 | asioita
67 | asti
68 | avuksi
69 | avulla
70 | avun
71 | avutta
72 | edellä
73 | edelle
74 | edelleen
75 | edeltä
76 | edemmäs
77 | edes
78 | edessä
79 | edestä
80 | ehkä
81 | ei
82 | eikä
83 | eilen
84 | eivät
85 | eli
86 | ellei
87 | elleivät
88 | ellemme
89 | ellen
90 | ellet
91 | ellette
92 | emme
93 | en
94 | enää
95 | enemmän
96 | eniten
97 | ennen
98 | ensi
99 | ensimmäinen
100 | ensimmäiseksi
101 | ensimmäisen
102 | ensimmäisenä
103 | ensimmäiset
104 | ensimmäisiä
105 | ensimmäisiksi
106 | ensimmäisinä
107 | ensimmäistä
108 | ensin
109 | entinen
110 | entisen
111 | entisiä
112 | entistä
113 | entisten
114 | eräät
115 | eräiden
116 | eräs
117 | eri
118 | erittäin
119 | erityisesti
120 | esi
121 | esiin
122 | esillä
123 | esimerkiksi
124 | et
125 | eteen
126 | etenkin
127 | että
128 | ette
129 | ettei
130 | halua
131 | haluaa
132 | haluamatta
133 | haluamme
134 | haluan
135 | haluat
136 | haluatte
137 | haluavat
138 | halunnut
139 | halusi
140 | halusimme
141 | halusin
142 | halusit
143 | halusitte
144 | halusivat
145 | halutessa
146 | haluton
147 | hän
148 | häneen
149 | hänellä
150 | hänelle
151 | häneltä
152 | hänen
153 | hänessä
154 | hänestä
155 | hänet
156 | he
157 | hei
158 | heidän
159 | heihin
160 | heille
161 | heiltä
162 | heissä
163 | heistä
164 | heitä
165 | helposti
166 | heti
167 | hetkellä
168 | hieman
169 | huolimatta
170 | huomenna
171 | hyvä
172 | hyvää
173 | hyvät
174 | hyviä
175 | hyvien
176 | hyviin
177 | hyviksi
178 | hyville
179 | hyviltä
180 | hyvin
181 | hyvinä
182 | hyvissä
183 | hyvistä
184 | ihan
185 | ilman
186 | ilmeisesti
187 | itse
188 | itseään
189 | itsensä
190 | ja
191 | jää
192 | jälkeen
193 | jälleen
194 | jo
195 | johon
196 | joiden
197 | joihin
198 | joiksi
199 | joilla
200 | joille
201 | joilta
202 | joissa
203 | joista
204 | joita
205 | joka
206 | jokainen
207 | jokin
208 | joko
209 | joku
210 | jolla
211 | jolle
212 | jolloin
213 | jolta
214 | jompikumpi
215 | jonka
216 | jonkin
217 | jonne
218 | joo
219 | jopa
220 | jos
221 | joskus
222 | jossa
223 | josta
224 | jota
225 | jotain
226 | joten
227 | jotenkin
228 | jotenkuten
229 | jotka
230 | jotta
231 | jouduimme
232 | jouduin
233 | jouduit
234 | jouduitte
235 | joudumme
236 | joudun
237 | joudutte
238 | joukkoon
239 | joukossa
240 | joukosta
241 | joutua
242 | joutui
243 | joutuivat
244 | joutumaan
245 | joutuu
246 | joutuvat
247 | juuri
248 | kahdeksan
249 | kahdeksannen
250 | kahdella
251 | kahdelle
252 | kahdelta
253 | kahden
254 | kahdessa
255 | kahdesta
256 | kahta
257 | kahteen
258 | kai
259 | kaiken
260 | kaikille
261 | kaikilta
262 | kaikkea
263 | kaikki
264 | kaikkia
265 | kaikkiaan
266 | kaikkialla
267 | kaikkialle
268 | kaikkialta
269 | kaikkien
270 | kaikkin
271 | kaksi
272 | kannalta
273 | kannattaa
274 | kanssa
275 | kanssaan
276 | kanssamme
277 | kanssani
278 | kanssanne
279 | kanssasi
280 | kauan
281 | kauemmas
282 | kautta
283 | kehen
284 | keiden
285 | keihin
286 | keiksi
287 | keillä
288 | keille
289 | keiltä
290 | keinä
291 | keissä
292 | keistä
293 | keitä
294 | keittä
295 | keitten
296 | keneen
297 | keneksi
298 | kenellä
299 | kenelle
300 | keneltä
301 | kenen
302 | kenenä
303 | kenessä
304 | kenestä
305 | kenet
306 | kenettä
307 | kennessästä
308 | kerran
309 | kerta
310 | kertaa
311 | kesken
312 | keskimäärin
313 | ketä
314 | ketkä
315 | kiitos
316 | kohti
317 | koko
318 | kokonaan
319 | kolmas
320 | kolme
321 | kolmen
322 | kolmesti
323 | koska
324 | koskaan
325 | kovin
326 | kuin
327 | kuinka
328 | kuitenkaan
329 | kuitenkin
330 | kuka
331 | kukaan
332 | kukin
333 | kumpainen
334 | kumpainenkaan
335 | kumpi
336 | kumpikaan
337 | kumpikin
338 | kun
339 | kuten
340 | kuuden
341 | kuusi
342 | kuutta
343 | kyllä
344 | kymmenen
345 | kyse
346 | lähekkäin
347 | lähellä
348 | lähelle
349 | läheltä
350 | lähemmäs
351 | lähes
352 | lähinnä
353 | lähtien
354 | läpi
355 | liian
356 | liki
357 | lisää
358 | lisäksi
359 | luo
360 | mahdollisimman
361 | mahdollista
362 | me
363 | meidän
364 | meillä
365 | meille
366 | melkein
367 | melko
368 | menee
369 | meneet
370 | menemme
371 | menen
372 | menet
373 | menette
374 | menevät
375 | meni
376 | menimme
377 | menin
378 | menit
379 | menivät
380 | mennessä
381 | mennyt
382 | menossa
383 | mihin
384 | mikä
385 | mikään
386 | mikäli
387 | mikin
388 | miksi
389 | milloin
390 | minä
391 | minne
392 | minun
393 | minut
394 | missä
395 | mistä
396 | mitä
397 | mitään
398 | miten
399 | moi
400 | molemmat
401 | mones
402 | monesti
403 | monet
404 | moni
405 | moniaalla
406 | moniaalle
407 | moniaalta
408 | monta
409 | muassa
410 | muiden
411 | muita
412 | muka
413 | mukaan
414 | mukaansa
415 | mukana
416 | mutta
417 | muu
418 | muualla
419 | muualle
420 | muualta
421 | muuanne
422 | muulloin
423 | muun
424 | muut
425 | muuta
426 | muutama
427 | muutaman
428 | muuten
429 | myöhemmin
430 | myös
431 | myöskään
432 | myöskin
433 | myötä
434 | näiden
435 | näin
436 | näissä
437 | näissähin
438 | näissälle
439 | näissältä
440 | näissästä
441 | näitä
442 | nämä
443 | ne
444 | neljä
445 | neljää
446 | neljän
447 | niiden
448 | niin
449 | niistä
450 | niitä
451 | noin
452 | nopeammin
453 | nopeasti
454 | nopeiten
455 | nro
456 | nuo
457 | nyt
458 | ohi
459 | oikein
460 | ole
461 | olemme
462 | olen
463 | olet
464 | olette
465 | oleva
466 | olevan
467 | olevat
468 | oli
469 | olimme
470 | olin
471 | olisi
472 | olisimme
473 | olisin
474 | olisit
475 | olisitte
476 | olisivat
477 | olit
478 | olitte
479 | olivat
480 | olla
481 | olleet
482 | olli
483 | ollut
484 | oma
485 | omaa
486 | omaan
487 | omaksi
488 | omalle
489 | omalta
490 | oman
491 | omassa
492 | omat
493 | omia
494 | omien
495 | omiin
496 | omiksi
497 | omille
498 | omilta
499 | omissa
500 | omista
501 | on
502 | onkin
503 | onko
504 | ovat
505 | päälle
506 | paikoittain
507 | paitsi
508 | pakosti
509 | paljon
510 | paremmin
511 | parempi
512 | parhaillaan
513 | parhaiten
514 | peräti
515 | perusteella
516 | pian
517 | pieneen
518 | pieneksi
519 | pienellä
520 | pienelle
521 | pieneltä
522 | pienempi
523 | pienestä
524 | pieni
525 | pienin
526 | puolesta
527 | puolestaan
528 | runsaasti
529 | saakka
530 | sadam
531 | sama
532 | samaa
533 | samaan
534 | samalla
535 | samallalta
536 | samallassa
537 | samallasta
538 | saman
539 | samat
540 | samoin
541 | sata
542 | sataa
543 | satojen
544 | se
545 | seitsemän
546 | sekä
547 | sen
548 | seuraavat
549 | siellä
550 | sieltä
551 | siihen
552 | siinä
553 | siis
554 | siitä
555 | sijaan
556 | siksi
557 | sillä
558 | silloin
559 | silti
560 | sinä
561 | sinne
562 | sinua
563 | sinulle
564 | sinulta
565 | sinun
566 | sinussa
567 | sinusta
568 | sinut
569 | sisäkkäin
570 | sisällä
571 | sitä
572 | siten
573 | sitten
574 | suoraan
575 | suuntaan
576 | suuren
577 | suuret
578 | suuri
579 | suuria
580 | suurin
581 | suurten
582 | taa
583 | täällä
584 | täältä
585 | taas
586 | taemmas
587 | tähän
588 | tahansa
589 | tai
590 | takaa
591 | takaisin
592 | takana
593 | takia
594 | tällä
595 | tällöin
596 | tämä
597 | tämän
598 | tänä
599 | tänään
600 | tänne
601 | tapauksessa
602 | tässä
603 | tästä
604 | tätä
605 | täten
606 | tavalla
607 | tavoitteena
608 | täysin
609 | täytyvät
610 | täytyy
611 | te
612 | tietysti
613 | todella
614 | toinen
615 | toisaalla
616 | toisaalle
617 | toisaalta
618 | toiseen
619 | toiseksi
620 | toisella
621 | toiselle
622 | toiselta
623 | toisemme
624 | toisen
625 | toisensa
626 | toisessa
627 | toisesta
628 | toista
629 | toistaiseksi
630 | toki
631 | tosin
632 | tuhannen
633 | tuhat
634 | tule
635 | tulee
636 | tulemme
637 | tulen
638 | tulet
639 | tulette
640 | tulevat
641 | tulimme
642 | tulin
643 | tulisi
644 | tulisimme
645 | tulisin
646 | tulisit
647 | tulisitte
648 | tulisivat
649 | tulit
650 | tulitte
651 | tulivat
652 | tulla
653 | tulleet
654 | tullut
655 | tuntuu
656 | tuo
657 | tuolla
658 | tuolloin
659 | tuolta
660 | tuonne
661 | tuskin
662 | tykö
663 | usea
664 | useasti
665 | useimmiten
666 | usein
667 | useita
668 | uudeksi
669 | uudelleen
670 | uuden
671 | uudet
672 | uusi
673 | uusia
674 | uusien
675 | uusinta
676 | uuteen
677 | uutta
678 | vaan
679 | vähän
680 | vähemmän
681 | vähintään
682 | vähiten
683 | vai
684 | vaiheessa
685 | vaikea
686 | vaikean
687 | vaikeat
688 | vaikeilla
689 | vaikeille
690 | vaikeilta
691 | vaikeissa
692 | vaikeista
693 | vaikka
694 | vain
695 | välillä
696 | varmasti
697 | varsin
698 | varsinkin
699 | varten
700 | vasta
701 | vastaan
702 | vastakkain
703 | verran
704 | vielä
705 | vierekkäin
706 | vieri
707 | viiden
708 | viime
709 | viimeinen
710 | viimeisen
711 | viimeksi
712 | viisi
713 | voi
714 | voidaan
715 | voimme
716 | voin
717 | voisi
718 | voit
719 | voitte
720 | voivat
721 | vuoden
722 | vuoksi
723 | vuosi
724 | vuosien
725 | vuosina
726 | vuotta
727 | yhä
728 | yhdeksän
729 | yhden
730 | yhdessä
731 | yhtä
732 | yhtäällä
733 | yhtäälle
734 | yhtäältä
735 | yhtään
736 | yhteen
737 | yhteensä
738 | yhteydessä
739 | yhteyteen
740 | yksi
741 | yksin
742 | yksittäin
743 | yleensä
744 | ylemmäs
745 | yli
746 | ylös
747 | ympäri
748 |
--------------------------------------------------------------------------------
/lib/TextRank/Stopword/french-stopwords.txt:
--------------------------------------------------------------------------------
1 | alors
2 | au
3 | aucuns
4 | aussi
5 | autre
6 | avant
7 | avec
8 | avoir
9 | bon
10 | car
11 | ce
12 | cela
13 | ces
14 | ceux
15 | chaque
16 | ci
17 | comme
18 | comment
19 | dans
20 | des
21 | du
22 | dedans
23 | dehors
24 | depuis
25 | deux
26 | devrait
27 | doit
28 | donc
29 | dos
30 | droite
31 | début
32 | elle
33 | elles
34 | en
35 | encore
36 | essai
37 | est
38 | et
39 | eu
40 | fait
41 | faites
42 | fois
43 | font
44 | force
45 | haut
46 | hors
47 | ici
48 | il
49 | ils
50 | je juste
51 | la
52 | le
53 | les
54 | leur
55 | là
56 | ma
57 | maintenant
58 | mais
59 | mes
60 | mine
61 | moins
62 | mon
63 | mot
64 | même
65 | ni
66 | nommés
67 | notre
68 | nous
69 | nouveaux
70 | ou
71 | où
72 | par
73 | parce
74 | parole
75 | pas
76 | personnes
77 | peut
78 | peu
79 | pièce
80 | plupart
81 | pour
82 | pourquoi
83 | quand
84 | que
85 | quel
86 | quelle
87 | quelles
88 | quels
89 | qui
90 | sa
91 | sans
92 | ses
93 | seulement
94 | si
95 | sien
96 | son
97 | sont
98 | sous
99 | soyez
100 | sujet
101 | sur
102 | ta
103 | tandis
104 | tellement
105 | tels
106 | tes
107 | ton
108 | tous
109 | tout
110 | trop
111 | très
112 | tu
113 | valeur
114 | voie
115 | voient
116 | vont
117 | votre
118 | vous
119 | vu
120 | ça
121 | étaient
122 | état
123 | étions
124 | été
125 | être
126 |
--------------------------------------------------------------------------------
/lib/TextRank/Stopword/generate.php:
--------------------------------------------------------------------------------
1 | |
35 | +---------------------------------------------------------------------------------+
36 | */
37 | namespace crodas\TextRank;
38 |
/**
 * Extractive summarizer: ranks the sentences of a text with
 * SummaryPageRank and returns the best ranked ones.
 */
class Summary extends TextRank
{
    /**
     * Build a summary out of the top ranked sentences of $text.
     *
     * Sentences and their words are obtained through the configured
     * listeners ('get_sentences', 'get_words', 'filter_keywords' and
     * 'normalize_keywords' events). Tokens made only of punctuation are
     * dropped before ranking.
     *
     * @param string $text Text to summarize (presumably a plain string;
     *                     it is handed untouched to the 'get_sentences' event).
     *
     * @return string The selected sentences, each one followed by "\n", in
     *                the order returned by SummaryPageRank::sort(). Empty
     *                string when nothing could be ranked.
     */
    public function getSummary($text)
    {
        $sentences  = $this->config->trigger('get_sentences', $text);
        $candidates = [];

        foreach ($sentences as $id => $sentence) {
            try {
                $words = $this->config->trigger('get_words', $sentence);
                $words = $this->config->trigger('filter_keywords', $words);
                $words = $this->config->trigger('normalize_keywords', $words);

                $candidates[$id] = array_filter($words, function ($word) {
                    return !ctype_punct($word);
                });
            } catch (\Exception $e) {
                // Deliberate best effort: a sentence whose words cannot be
                // extracted is left out of the ranking instead of aborting
                // the whole summary.
                continue;
            }
        }

        $ranker = new SummaryPageRank;
        $sorted = $ranker->sort($candidates);

        // Keep the top 5% of the ranked sentences (at least one when any
        // sentence was ranked). ceil() returns a float while array_slice()
        // expects an integer length, hence the explicit cast.
        $limit    = (int) ceil(count($sorted) * .05);
        $selected = array_slice($sorted, 0, $limit, true);

        $txt = "";
        foreach (array_keys($selected) as $key) {
            $txt .= $sentences[$key] . "\n";
        }

        return $txt;
    }
}
68 |
--------------------------------------------------------------------------------
/lib/TextRank/SummaryPageRank.php:
--------------------------------------------------------------------------------
1 | |
35 | +---------------------------------------------------------------------------------+
36 | */
37 | namespace crodas\TextRank;
38 |
39 | use LanguageDetector\Sort\PageRank;
40 |
/**
 * PageRank specialization whose graph connects sentences that share words.
 */
class SummaryPageRank extends PageRank
{
    /**
     * Build the sentence graph consumed by the parent implementation.
     *
     * Two sentences are linked (in both directions) once for every word
     * they have in common. Words that appear in a single sentence create
     * no links.
     *
     * @param array $sentences Map of sentence id => list of words.
     *
     * @return array Array with three keys:
     *               - 'graph':    target id => list of source ids linking to it
     *               - 'values':   id => 0.15 seed value (presumably the initial
     *                             score expected by the parent class; confirm there)
     *               - 'outlinks': source id => number of outgoing links
     */
    protected function getGraph(array $sentences)
    {
        $outlinks = array();
        $graph    = array();
        $values   = array();

        // Inverted index: word => ids of the sentences containing it.
        $index = [];
        foreach ($sentences as $id => $words) {
            foreach ($words as $word) {
                $index[$word][] = $id;
            }
        }

        foreach ($index as $ids) {
            // A word repeated inside one sentence must count only once.
            $ids = array_unique($ids);
            if (count($ids) == 1) {
                continue;
            }

            foreach ($ids as $source) {
                foreach ($ids as $target) {
                    // Strict comparison: ids are array keys (ints or
                    // non-numeric strings) and a loose comparison could
                    // treat distinct ids such as 0 and "abc" as equal.
                    if ($source === $target) {
                        continue;
                    }

                    $outlinks[$source] = isset($outlinks[$source])
                        ? $outlinks[$source] + 1
                        : 1;
                    $graph[$target][] = $source;
                    $values[$target]  = 0.15;
                }
            }
        }

        return compact('graph', 'values', 'outlinks');
    }
}
82 |
--------------------------------------------------------------------------------
/lib/TextRank/TextRank.php:
--------------------------------------------------------------------------------
1 | |
35 | +---------------------------------------------------------------------------------+
36 | */
37 | namespace crodas\TextRank;
38 |
39 | use LanguageDetector\Sort\PageRank;
40 |
/**
 * Keyword extractor: ranks the words of a text with PageRank and merges
 * adjacent top ranked words into compound keywords.
 */
class TextRank
{
    /**
     * Configuration object used to dispatch the text processing events.
     *
     * @var Config
     */
    protected $config;

    /**
     * @param Config $config Configuration whose listeners provide the
     *                       'get_words', 'filter_keywords' and
     *                       'normalize_keywords' events.
     */
    public function __construct(Config $config)
    {
        $this->config = $config;
    }

    /**
     * Rank every keyword candidate found in $text.
     *
     * @param string $text Text to analyze (handed untouched to the
     *                     'get_words' event).
     *
     * @return array Map of keyword (or compound keyword) => score, sorted by
     *               descending score. Empty array when the ranking returned
     *               its input unchanged.
     *
     * @throws \RuntimeException When 'normalize_keywords' does not return
     *                           one entry per filtered keyword.
     */
    public function getAllKeywordsSorted($text)
    {
        // split the text into words
        $words = $this->config->trigger('get_words', $text);

        // get the candidates
        $keywords = $this->config->trigger('filter_keywords', $words);

        // normalize each candidate
        $normalized = $this->config->trigger('normalize_keywords', $keywords);

        if (count($keywords) != count($normalized)) {
            throw new \RuntimeException("{normalize_keywords} event returned invalid data");
        }

        $graph  = new PageRank;
        $sorted = $graph->sort(array_values($normalized), true);

        if ($sorted == $normalized) {
            // PageRank failed, probably because the input was invalid
            return [];
        }

        // preserve_keys is required: a numeric keyword (e.g. "2013") is
        // stored as an integer key and array_slice() would renumber it.
        $top = array_slice($sorted, 0, 10, true);

        // search for compound keywords: runs of 2 or 3 consecutive
        // candidates that all belong to the top ranked words
        $phrases = [];
        $run     = [];
        foreach ($normalized as $pos => $word) {
            if (!empty($top[$word])) {
                $run[] = [$pos, $word];
                continue;
            }
            if (count($run) > 1 && count($run) < 4) {
                $phrases[] = $run;
            }
            $run = [];
        }

        if (count($run) > 1 && count($run) < 4) {
            $phrases[] = $run;
        }

        foreach ($phrases as $phrase) {
            // reset()/end() do not depend on where the internal array
            // pointer happens to be
            $first = reset($phrase);
            $last  = end($phrase);
            $start = $first[0];
            $end   = $last[0];

            // original (non normalized) words covered by the phrase
            $zwords = array_slice($words, $start, $end - $start + 1, true);
            if (count(array_filter($zwords, 'ctype_punct')) > 0) {
                // words separated by punctuation are not a compound keyword
                continue;
            }

            $score = 0;
            foreach ($phrase as $entry) {
                $score += $top[$entry[1]];
            }

            // $end > $start always holds here because a phrase has at
            // least two entries
            $sorted[trim(implode(' ', $zwords))] = $score / ($end - $start);
        }

        // denormalize each single word: report the word as it was written
        // in the text instead of its normalized form
        foreach ($normalized as $pos => $word) {
            if (!empty($sorted[$word]) && $word != $words[$pos]) {
                $sorted[$words[$pos]] = $sorted[$word];
                unset($sorted[$word]);
            }
        }

        arsort($sorted);

        return $sorted;
    }

    /**
     * Return the best ranked keywords of $text.
     *
     * @param string $text  Text to analyze.
     * @param int    $limit Maximum number of keywords to return.
     *
     * @return array Map of keyword => score with at most $limit entries.
     */
    public function getKeywords($text, $limit = 20)
    {
        // preserve_keys keeps numeric keywords from being renumbered
        return array_slice($this->getAllKeywordsSorted($text), 0, $limit, true);
    }
}
130 |
131 |
--------------------------------------------------------------------------------
/phpunit.xml:
--------------------------------------------------------------------------------
1 |
2 |
3 |
4 |
21 |
22 |
23 |
24 | tests/
25 |
26 |
27 |
28 |
29 |
30 | lib/
31 | tests/tmp/
32 |
33 | lib/Dispatcher/Template
34 |
35 |
36 |
37 |
38 |
39 |
--------------------------------------------------------------------------------
/tests/QuickTest.php:
--------------------------------------------------------------------------------
1 | getKeywords($text);
23 | $i = 0;
24 | foreach ($expected as $word) {
25 | if ($word[0] == '*') {
26 | $word = substr($word, 1);
27 | }
28 | if (!empty($keywords[$word])) {
29 | $i++;
30 | }
31 | }
32 | $this->AssertTrue($i > 0);
33 | }
34 |
/**
 * The generated summary must contain the expected summary fragment.
 *
 * $expected (the keyword list) is supplied by the shared data provider
 * and is not used by this test.
 *
 * @dataProvider provider
 */
public function testSentences($text, $expected, $esummary)
{
    $config = new \crodas\TextRank\Config;
    $config->addListener(new \crodas\TextRank\Stopword);

    $analizer = new \crodas\TextRank\Summary($config);
    $summary  = $analizer->getSummary($text);

    // Report both sides on failure: the fragment that was expected and
    // the summary that was actually produced.
    $this->assertTrue(
        strpos($summary, $esummary) !== false,
        "Expected the summary to contain \"$esummary\", got: $summary"
    );
}
45 |
/**
 * Every expected keyword must be present in the extracted keywords.
 *
 * Expected words prefixed with "*" are optional: their absence does not
 * fail the test.
 *
 * @dataProvider provider
 */
public function testGetkeywords($text, $expected)
{
    $config = new \crodas\TextRank\Config;
    $config->addListener(new \crodas\TextRank\Stopword);

    $ranker   = new \crodas\TextRank\TextRank($config);
    $keywords = $ranker->getKeywords($text);

    foreach ($expected as $word) {
        $optional = ($word[0] == '*');
        $needle   = $optional ? substr($word, 1) : $word;

        try {
            $this->assertTrue(!empty($keywords[$needle]), "cannot find \"$needle\"");
        } catch (\Exception $failure) {
            // a missing optional keyword is tolerated
            if ($optional) {
                continue;
            }
            throw $failure;
        }
    }
}
69 |
70 | }
71 |
--------------------------------------------------------------------------------
/tests/bootstrap.php:
--------------------------------------------------------------------------------
1 |