├── .gitignore ├── .vscode └── settings.json ├── data ├── dusty.txt ├── numbers.txt ├── thoughtco.txt ├── ku.txt ├── teachingtreasures.txt ├── singularis.txt └── parsers.ipynb ├── setup.py ├── README.md ├── LICENSE.txt └── similar_sounding_words.py /.gitignore: -------------------------------------------------------------------------------- 1 | parsers-checkpoint.ipynb 2 | **/__pycache__/* 3 | dist 4 | build 5 | *.egg-info -------------------------------------------------------------------------------- /.vscode/settings.json: -------------------------------------------------------------------------------- 1 | { 2 | "python.dataScience.maxOutputSize": 100, 3 | "python.dataScience.textOutputLimit": 200, 4 | "python.formatting.provider": "black" 5 | } -------------------------------------------------------------------------------- /data/dusty.txt: -------------------------------------------------------------------------------- 1 | accepting,excepting 2 | an,and,end 3 | are,r 4 | at,add,ad 5 | create,crate 6 | drying,trying 7 | fat,vat 8 | fail,feel 9 | grade,grate,great,grid 10 | peer,pier,pure,appear 11 | peers,piers 12 | poll,paul,pull,pole 13 | rap,wrap 14 | rapper,wrapper 15 | rust,rest 16 | right,rate 17 | sink,sync 18 | well,we'll,wheel,while,will -------------------------------------------------------------------------------- /setup.py: -------------------------------------------------------------------------------- 1 | import setuptools 2 | 3 | with open("README.md", "r") as fh: 4 | long_description = fh.read() 5 | 6 | 7 | setuptools.setup( 8 | name="similar-sounding-words", 9 | version="0.1.1", 10 | description="A list of similar sounding words to help disambiguate voice coding", 11 | long_description=long_description, 12 | long_description_content_type="text/markdown", 13 | url="https://github.com/dusty-phillips/similar-sounding-words", 14 | py_modules=["similar_sounding_words"], 15 | classifiers=[ 16 | "Programming Language :: Python :: 3", 17 | "License :: 
OSI Approved :: MIT License", 18 | "Operating System :: OS Independent", 19 | "Intended Audience :: Developers", 20 | ], 21 | python_requires=">=3.8", 22 | ) 23 | -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- 1 | # Similar sounding words 2 | 3 | This is a list of similar sounding words that I have collected from various sources on the web 4 | and added to as I find new pairs. 5 | 6 | Unlike most homophone, homograph, and homonym resources this list is not targeting 7 | ESL or educational use. Instead it is designed for finding common errors in speech recognition texts. 8 | Specifically I use it with [Caster](https://caster.readthedocs.io/en/latest/) for voice programming. 9 | 10 | In addition to my custom file I currently have five different sources: 11 | * https://7esl.com/homophones/ 12 | * https://web.ku.edu/~edit/wordsall.html 13 | * http://www.singularis.ltd.uk/bifroest/misc/homophones-list.html 14 | * https://www.teachingtreasures.com.au/teaching-tools/Basic-worksheets/worksheets-english/upper/homophones-list.htm 15 | * https://www.thoughtco.com/homonyms-homophones-and-homographs-a-b-1692660 16 | 17 | I preprocessed some of these files in a text editor and 18 | ran them through a Jupyter notebook available in the GitHub repository 19 | to generate the index. 20 | 21 | All source files are copyright their respective authors. 
22 | 23 | ## TODO 24 | * add mapping of words to numbers -------------------------------------------------------------------------------- /LICENSE.txt: -------------------------------------------------------------------------------- 1 | Copyright (c) 2020 Dusty Phillips 2 | 3 | Permission is hereby granted, free of charge, to any person obtaining a copy 4 | of this software and associated documentation files (the "Software"), to deal 5 | in the Software without restriction, including without limitation the rights 6 | to use, copy, modify, merge, publish, distribute, sublicense, and/or sell 7 | copies of the Software, and to permit persons to whom the Software is 8 | furnished to do so, subject to the following conditions: 9 | 10 | The above copyright notice and this permission notice shall be included in all 11 | copies or substantial portions of the Software. 12 | 13 | THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR 14 | IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, 15 | FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE 16 | AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER 17 | LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, 18 | OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE 19 | SOFTWARE. 20 | 21 | The source data files are copyright their respective authors. 
-------------------------------------------------------------------------------- /data/numbers.txt: -------------------------------------------------------------------------------- 1 | 0,zero 2 | 1,one 3 | 2,two 4 | 3,three 5 | 4,four 6 | 5,five 7 | 6,six 8 | 7,seven 9 | 8,eight 10 | 9,nine 11 | 10,ten 12 | 11,eleven 13 | 12,twelve 14 | 13,thirteen 15 | 14,fourteen 16 | 15,fifteen 17 | 16,sixteen 18 | 17,seventeen 19 | 18,eighteen 20 | 19,nineteen 21 | 20,twenty 22 | 21,twenty-one 23 | 22,twenty-two 24 | 23,twenty-three 25 | 24,twenty-four 26 | 25,twenty-five 27 | 26,twenty-six 28 | 27,twenty-seven 29 | 28,twenty-eight 30 | 29,twenty-nine 31 | 30,thirty 32 | 31,thirty-one 33 | 32,thirty-two 34 | 33,thirty-three 35 | 34,thirty-four 36 | 35,thirty-five 37 | 36,thirty-six 38 | 37,thirty-seven 39 | 38,thirty-eight 40 | 39,thirty-nine 41 | 40,forty 42 | 41,forty-one 43 | 42,forty-two 44 | 43,forty-three 45 | 44,forty-four 46 | 45,forty-five 47 | 46,forty-six 48 | 47,forty-seven 49 | 48,forty-eight 50 | 49,forty-nine 51 | 50,fifty 52 | 51,fifty-one 53 | 52,fifty-two 54 | 53,fifty-three 55 | 54,fifty-four 56 | 55,fifty-five 57 | 56,fifty-six 58 | 57,fifty-seven 59 | 58,fifty-eight 60 | 59,fifty-nine 61 | 60,sixty 62 | 61,sixty-one 63 | 62,sixty-two 64 | 63,sixty-three 65 | 64,sixty-four 66 | 65,sixty-five 67 | 66,sixty-six 68 | 67,sixty-seven 69 | 68,sixty-eight 70 | 69,sixty-nine 71 | 70,seventy 72 | 71,seventy-one 73 | 72,seventy-two 74 | 73,seventy-three 75 | 74,seventy-four 76 | 75,seventy-five 77 | 76,seventy-six 78 | 77,seventy-seven 79 | 78,seventy-eight 80 | 79,seventy-nine 81 | 80,eighty 82 | 81,eighty-one 83 | 82,eighty-two 84 | 83,eighty-three 85 | 84,eighty-four 86 | 85,eighty-five 87 | 86,eighty-six 88 | 87,eighty-seven 89 | 88,eighty-eight 90 | 89,eighty-nine 91 | 90,ninety 92 | 91,ninety-one 93 | 92,ninety-two 94 | 93,ninety-three 95 | 94,ninety-four 96 | 95,ninety-five 97 | 96,ninety-six 98 | 97,ninety-seven 99 | 98,ninety-eight 100 | 99,ninety-nine 101 | 
100,one hundred -------------------------------------------------------------------------------- /data/thoughtco.txt: -------------------------------------------------------------------------------- 1 | # https://www.thoughtco.com/homonyms-homophones-and-homographs-a-b-1692660 2 | accept except 3 | ad add 4 | advice advise 5 | aid aide 6 | ail ale 7 | air ere heir 8 | aisle I'll isle 9 | allusion illusion 10 | altar alter 11 | ate eight 12 | bail bail bale 13 | band band banned 14 | bare bear bear 15 | bases bases basis 16 | beat beat beet 17 | blew blue 18 | bread bred 19 | buy by bye 20 | capital capital capitol 21 | ceiling sealing 22 | cell sell 23 | cent scent sent 24 | cereal serial 25 | chews choose 26 | Chile chili chilly 27 | chord cord 28 | cite site sight 29 | close clothes 30 | coarse course 31 | complement compliment 32 | council counsel 33 | creak creek 34 | crews cruise 35 | days daze 36 | dear deer 37 | desert desert dessert 38 | dew do due 39 | die dye 40 | discreet discrete 41 | doe dough 42 | dual duel 43 | elicit illicit 44 | eminent imminent 45 | ewe you 46 | eye I 47 | facts fax 48 | fair fare 49 | fairy ferry 50 | faze phase 51 | feat feet 52 | find fined 53 | fir fur 54 | flea flee 55 | flew flu 56 | flour flower 57 | for fore four forth fourth 58 | foreword forward 59 | gene jean 60 | gorilla guerrilla 61 | grease Greece 62 | groan grown 63 | hair hare 64 | hall haul 65 | halve have 66 | hay hey 67 | heal heel 68 | hear here 69 | hi high 70 | hoarse horse 71 | hole whole 72 | holey holy wholly 73 | hoarse horse 74 | hour our 75 | knead need 76 | knew new 77 | knight night 78 | knot not 79 | know no 80 | lead led 81 | leased least 82 | lessen lesson 83 | loan lone 84 | made maid 85 | mail male 86 | marry material merry materiel 87 | meat meet 88 | mince mints 89 | morning mourning 90 | none nun 91 | oar or ore oh owe 92 | one won 93 | overdo overdue 94 | pail pale 95 | pain pane 96 | peace piece 97 | peak peek 98 | patience patients 99 | 
pear pair 100 | plain plane 101 | pole poll 102 | poor pour 103 | pray prey 104 | principal principle 105 | rain rein 106 | rap wrap 107 | read red 108 | real reel 109 | right write 110 | ring wring 111 | road rode 112 | role roll 113 | rose rows 114 | sail sale 115 | scene seen 116 | sea see 117 | seam seem 118 | sew so sow soar sore 119 | sole soul 120 | son sun 121 | some sum 122 | stair stare 123 | steal steel 124 | suite sweet 125 | tail tale 126 | their there they're 127 | threw through 128 | to too two toe tow 129 | vary very 130 | wail whale 131 | waist waste 132 | wait weight 133 | war wore 134 | warn worn 135 | way weigh 136 | we wee 137 | weak week 138 | wear where 139 | weather whether 140 | which witch 141 | wood would 142 | your you're 143 | -------------------------------------------------------------------------------- /data/ku.txt: -------------------------------------------------------------------------------- 1 | #https://web.ku.edu/~edit/wordsall.html 2 | adapt;adept;adopt 3 | advice;advise 4 | aerie;airy;eerie 5 | aid;aide 6 | aisle;isle;I'll 7 | alley;ally 8 | allready;already 9 | allusion;illusion 10 | appraise;apprise 11 | arc;ark 12 | ascent;assent 13 | assay;essay 14 | bring;take 15 | auger;augur 16 | bail;bale 17 | breach;breech 18 | bazaar;bizarre 19 | bloc;block 20 | born;borne 21 | borough;burro;burrow 22 | bouillon;bullion 23 | braise;braze 24 | broach;brooch 25 | cannon;canon 26 | caster;castor 27 | censor;censer;censure 28 | chaste;chased 29 | chic;sheik 30 | cite;site;sight 31 | confident;confidant 32 | deprivation;depravation 33 | desperate;disparate 34 | disperse;disburse 35 | dual;duel 36 | ecology;environment 37 | either;each 38 | elicit;illicit 39 | elude;allude 40 | epic;epoch 41 | exceed;accede 42 | excess;access 43 | extant;extent 44 | faint;feint 45 | fair;fare 46 | faze;phase 47 | feign;fain 48 | fete;feat 49 | fir;fur 50 | flair;flare 51 | flea;flee 52 | floe;flow 53 | flu;flue;flew 54 | forbear;forebear 55 | 
formally;formerly 56 | forth;fourth 57 | forward;foreword 58 | foul;fowl 59 | frank;franc 60 | freeze;frieze 61 | friar;fryer 62 | gaff;gaffe 63 | gait;gate 64 | gauge;gage 65 | gel;jell 66 | genius;genus 67 | gild;guild 68 | gilt;guilt 69 | gist;jest 70 | glacier;glazier 71 | gnaw;naw 72 | gorilla;guerrilla 73 | groan;grown 74 | guarantee;guaranty 75 | hair;hare 76 | handsome;hansom 77 | hanger;hangar 78 | harrier;hairier 79 | hart;heart 80 | hay;hey 81 | hew;hue 82 | hoard;horde 83 | holy;wholly;holey 84 | hoop;whoop 85 | hostile;hostel 86 | humorous;humerus 87 | hurdle;hurtle 88 | hypocritical;hypercritical 89 | idle;idol;idyll 90 | incite;insight 91 | incredible;incredulous 92 | inequity;iniquity 93 | ingenious;ingenuous 94 | interstate;intrastate 95 | jam;jamb 96 | jealousy;jalousie 97 | judicial;judicious 98 | kill;kiln 99 | knave;nave 100 | knead;need;kneed 101 | knit;nit 102 | lamb;lam 103 | lay;lei 104 | lea;lee 105 | lead;led 106 | leak;leek 107 | lean;lien 108 | leech;leach 109 | lesser;lessor 110 | levy;levee 111 | liable;libel 112 | liken;lichen 113 | links;lynx 114 | literal;littoral 115 | llama;lama 116 | load;lode 117 | loan;lone 118 | loop;loupe 119 | lute;loot 120 | mackintosh;McIntosh;Macintosh 121 | magnet;magnate 122 | magnificent;munificent 123 | mall;maul 124 | mannequin;manikin 125 | manner;manor 126 | mantel;mantle 127 | marshal;martial;Marshall;marital 128 | martin;marten;Martian 129 | mask;masque 130 | material;materiel 131 | maze;maize 132 | mean;mien 133 | meat;meet;mete 134 | medal;meddle 135 | median;average;normal 136 | metal;mettle;meddle 137 | mews;muse 138 | might;mite 139 | mill;mil 140 | millinery;millinary 141 | miner;minor 142 | moan;mown 143 | moat;mote 144 | moose;mousse 145 | morn;mourn 146 | mule;mewl 147 | mutton;mouton 148 | muscle;mussel;muzzle 149 | nay;neigh 150 | official;officious 151 | oracle;auricle 152 | oscillate;osculate 153 | ought;aught 154 | overdo;overdue 155 | overseas;oversees 156 | pail;pale 157 | 
pain;pane 158 | pair;pear;pare 159 | palate;palette;pallet 160 | pall;pawl 161 | parameter;perimeter 162 | parish;perish 163 | peak;peek;pique 164 | peal;peel 165 | pearl;purl 166 | pedal;peddle 167 | peer;pier 168 | peon;paean 169 | peremptory;pre-emptory 170 | perquisite;prerequisite 171 | persecute;prosecute 172 | personal;personnel 173 | perspective;prospective 174 | petty;petit;petite 175 | physic;physique;psychic 176 | pica;pika 177 | place;plaice 178 | plate;plait 179 | plum;plumb 180 | pole;poll 181 | policy;polity 182 | populace;populous 183 | popular;poplar 184 | poultry;paltry 185 | pour;pore 186 | pray;prey 187 | precede;proceed 188 | prescribe;proscribe 189 | presentment;presentiment 190 | profit;prophet 191 | prophecy;prophesy 192 | propose;purpose 193 | prone;supine 194 | prostrate;prostate 195 | put;putt 196 | queue;cue 197 | quire;choir 198 | rack;wrack 199 | rain;reign;rein 200 | raise;raze 201 | rap;wrap;rapt 202 | read;reed 203 | real;reel 204 | reality;realty 205 | reek;wreak 206 | register;registrar 207 | reluctant;reticent 208 | rest;wrest 209 | retch;wretch 210 | review;revue 211 | riffle;rifle 212 | rigor;rigger 213 | ring;wring 214 | rite;right;write 215 | road;rode;rowed 216 | roe;rho;row 217 | room;rheum 218 | root;route 219 | rote;wrote 220 | rough;ruff 221 | royal;roil 222 | rude;rood;rued 223 | ruin;rune 224 | rung;wrung 225 | rye;wry 226 | sachet;sashay 227 | sail;sale 228 | sanitorium;sanitarium 229 | scene;seen 230 | scull;skull 231 | seam;seem 232 | seaman;semen 233 | sear;seer;sere 234 | seed;cede 235 | seine;sane 236 | seller;cellar 237 | serf;surf 238 | serge;surge 239 | session;cession 240 | shanty;chantey 241 | shear;sheer 242 | shoe;shoo 243 | sick;sic 244 | sign;sine 245 | signet;cygnet 246 | slay;sleigh 247 | slight;sleight 248 | slow;sloe 249 | soar;sore 250 | sole;soul;sol 251 | some;sum 252 | spore;spoor 253 | step;steppe 254 | straight;strait 255 | style;stile;sty 256 | suit;suite 257 | summary;summery 258 | 
sword;sward;soared 259 | symbol;cymbal 260 | tacit;tacet 261 | tail;tale 262 | talisman;talesman 263 | taper;tapir 264 | tasty;tasteful 265 | taught;taut 266 | taupe;tope 267 | tea;tee 268 | team;teem 269 | tear;tare;tier 270 | threw;through 271 | throw;throe 272 | thrown;throne 273 | time;thyme 274 | ton;tun 275 | tool;tulle 276 | tortuous;torturous 277 | tough;tuff 278 | toxin;tocsin 279 | track;tract 280 | tray;trey 281 | troop;troupe 282 | trustee;trusty 283 | turban;turbine 284 | turn;tern 285 | undo;undue 286 | up;upped 287 | urn;earn 288 | vain;vane;vein 289 | valance;valence 290 | vale;veil 291 | veracious;voracious 292 | waive;wave 293 | wet;whet 294 | vial;vile;viol 295 | vice;vise 296 | vicious;viscous;viscus 297 | villain;villein 298 | virtue;virtu 299 | wail;wale 300 | wane;wain 301 | want;wont 302 | wean;ween 303 | wear;ware 304 | weather;wether;whether 305 | whither;wither 306 | worst;wurst 307 | yew;ewe;you 308 | yoke;yolk -------------------------------------------------------------------------------- /data/teachingtreasures.txt: -------------------------------------------------------------------------------- 1 | # https://www.teachingtreasures.com.au/teaching-tools/Basic-worksheets/worksheets-english/upper/homophones-list.htm 2 | Ad Add 3 | Aerie Airy 4 | Ail Ale 5 | Air Heir 6 | Aisle Isle 7 | All Awl 8 | Allowed Aloud 9 | Altar Alter 10 | Arc Ark 11 | Ascent Assent 12 | Ate Eight 13 | Attendance Attendants 14 | Aural Oral 15 | Axes Axis 16 | Aye Eye 17 | Bail Bale 18 | Baited Bated 19 | Bald Bawled 20 | Ball Bawl 21 | Band Banned 22 | Bard Barred 23 | Bare Bear 24 | Baron Barren 25 | Base Bass 26 | Based Baste 27 | Be Bee 28 | Beach Beech 29 | Beat Beet 30 | Beau Bow 31 | Beer Bier 32 | Bell Belle 33 | Berry Bury 34 | Berth Birth 35 | Billed Build 36 | Blew Blue 37 | Bloc Block 38 | Boar Bore 39 | Board Bored 40 | Boarder Border 41 | Bold Bowled 42 | Bolder Boulder 43 | Bootie Booty 44 | Born Borne 45 | Bough Bow 46 | Braid Brayed 47 | Brake 
Break 48 | Bread Bred 49 | Brewed Brood 50 | Brews Bruise 51 | Bridal Bridle 52 | Broach Brooch 53 | Brows Browse 54 | Burro Burrow 55 | But Butt 56 | Buy Bye 57 | Caddie Caddy 58 | Callous Callus 59 | Canon Cannon 60 | Canter Cantor 61 | Canvas Canvass 62 | Capital Capitol 63 | Carat Carrot 64 | Carol Carrel 65 | Cast Caste 66 | Cede Seed 67 | Ceiling Sealing 68 | Cell Sell 69 | Cellar Seller 70 | Censor Sensor 71 | Cent Scent 72 | Cereal Serial 73 | Cession Session 74 | Chance Chants 75 | Chased Chaste 76 | Cheap Cheep 77 | Chews Choose 78 | Chic Sheik 79 | Chilli Chilly 80 | Choir Quire 81 | Choral Coral 82 | Chord Cored 83 | Chute Shoot 84 | Cite Sight 85 | Clause Claws 86 | Close Clothes 87 | Coarse Course 88 | Colonel Kernel 89 | Complement Compliment 90 | Council Counsel 91 | Coward Cowered 92 | Creak Creek 93 | Crewel Cruel 94 | Crews Cruise 95 | Cue Queue 96 | Currant Current 97 | Cygnet Signet 98 | Cymbal Symbol 99 | Dam Damn 100 | Days Daze 101 | Dear Deer 102 | Dense Dents 103 | Desert Dessert 104 | Dew Due 105 | Die Dye 106 | Disburse Disperse 107 | Discreet Discrete 108 | Doe Dough 109 | Does Doze 110 | Done Dun 111 | Dual Duel 112 | Dyeing Dying 113 | Earn Urn 114 | Eave Eve 115 | Eek Eke 116 | Eight Ate 117 | Ewe You 118 | Ewes Yews 119 | Eye Aye 120 | Eyelet Islet 121 | Faint Feint 122 | Fair Fare 123 | Faun Fawn 124 | Faze Phase 125 | Feat Feet 126 | Fined Find 127 | Fir Fur 128 | Fisher Fissure 129 | Flair Flare 130 | Flea Flee 131 | Flew Flue 132 | Floe Flow 133 | Flour Flower 134 | Foaled Fold 135 | For Four 136 | Foreword Forward 137 | Forth Fourth 138 | Foul Fowl 139 | Franc Frank 140 | Frays Phrase 141 | Freeze Frieze 142 | Friar Fryer 143 | Gaff Gaffe 144 | Gait Gate 145 | Gamble Gambol 146 | Genes Jeans 147 | Gibe Jibe 148 | Gild Guild 149 | Gilt Guilt 150 | Gofer Gopher 151 | Gorilla Guerrilla 152 | Gourd Gored 153 | Grate Great 154 | Grill Grille 155 | Grisly Grizzly 156 | Groan Grown 157 | Guessed Guest 158 | Guise Guys 159 | Hail Hale 
160 | Hair Hare 161 | Hall Haul 162 | Hangar Hanger 163 | Hart Heart 164 | Hay Hey 165 | Heal Heel 166 | Hear Here 167 | Heard Herd 168 | Heir Air 169 | Heroin Heroine 170 | Hew Hue 171 | Hi High 172 | Him Hymn 173 | Ho Hoe 174 | Hoard Horde 175 | Hoarse Horse 176 | Hoes Hose 177 | Hole Whole 178 | Holy Wholly 179 | Hostel Hostile 180 | Hour Our 181 | Idle Idol 182 | In Inn 183 | Incidence Incidents 184 | Intense Intents 185 | Isle Aisle 186 | Islet Eyelet 187 | Jam Jamb 188 | Jeans Genes 189 | Jibe Gibe 190 | Kernel Colonel 191 | Knave Nave 192 | Knead Need 193 | Knew New 194 | Knew New 195 | Knight Night 196 | Knit Nit 197 | Knot Not 198 | Know No 199 | Knows Nose 200 | Lacks Lax 201 | Lain Lane 202 | Lama Llama 203 | Laps Lapse 204 | Lay Lei 205 | Leach Leech 206 | Lead Led 207 | Leak Leek 208 | Lean Lien 209 | Leased Least 210 | Lessen Lesson 211 | Levee Levy 212 | Lie Lye 213 | Links Lynx 214 | Lo Low 215 | Load Lode 216 | Loan Lone 217 | Locks Lox 218 | Loot Lute 219 | Made Maid 220 | Mail Male 221 | Main Mane 222 | Maize Maze 223 | Mall Maul 224 | Manner Manor 225 | Mantel Mantle 226 | Marshal Martial 227 | Mask Masque 228 | Massed Mast 229 | Meat Meet 230 | Medal Meddle 231 | Metal Mettle 232 | Mewl Mule 233 | Mews Muse 234 | Might Mite 235 | Mince Mints 236 | Mind Mined 237 | Miner Minor 238 | Missal Missile 239 | Missed Mist 240 | Moan Mown 241 | Moose Mousse 242 | Morning Mourning 243 | Muscle Mussel 244 | Mustard Mustered 245 | Naval Navel 246 | Nave Knave 247 | Nay Neigh 248 | Need Knead 249 | New Gnu 250 | Nicks Nix 251 | Night Knight 252 | Nit Knit 253 | No Know 254 | None Nun 255 | Nose Knows 256 | Not Knot 257 | Oar Ore 258 | Ode Owed 259 | Oh Owe 260 | One Won 261 | Oral Aural 262 | Our Hour 263 | Paced Paste 264 | Packed Pact 265 | Pail Pale 266 | Pain Pane 267 | Pair Pear 268 | Palette Pallet 269 | Passed Past 270 | Patience Patients 271 | Pause Paws 272 | Peace Piece 273 | Peak Peek 274 | Peal Peel 275 | Pearl Purl 276 | Pedal Peddle 277 | Peer 
Pier 278 | Phase Faze 279 | Phrase Frays 280 | Plain Plane 281 | Plait Plate 282 | Pleas Please 283 | Plum Plumb 284 | Pole Poll 285 | Pore Pour 286 | Praise Prays 287 | Presence Presents 288 | Pride Pried 289 | Pries Prize 290 | Primer Primmer 291 | Prince Prints 292 | Principal Principle 293 | Profit Prophet 294 | Quarts Quartz 295 | Queue Cue 296 | Quire Choir 297 | Rabbet Rabbit 298 | Rain Reign 299 | Raise Rays 300 | Rap Wrap 301 | Rapt Wrapped 302 | Read Reed 303 | Real Reel 304 | Red Read 305 | Reek Wreak 306 | Residence Residents 307 | Rest Wrest 308 | Retch Wretch 309 | Review Revue 310 | Right Write 311 | Ring Wring 312 | Road Rowed 313 | Roe Row 314 | Role Roll 315 | Roomer Rumour 316 | Root Route 317 | Rose Rows 318 | Rote Wrote 319 | Rouse Rows 320 | Rude Rued 321 | Rung Wrung 322 | Rye Wry 323 | Sac Sack 324 | Sail Sale 325 | Sane Seine 326 | Saver Savour 327 | Scene Seen 328 | Scent Sent 329 | Scull Skull 330 | Sea See 331 | Sealing Ceiling 332 | Seam Seem 333 | Seas Seize 334 | Seed Cede 335 | Sell Cell 336 | Seller Cellar 337 | Sensor Censor 338 | Serf Surf 339 | Serge Surge 340 | Serial Cereal 341 | Session Cession 342 | Sew Sow 343 | Shearn Sheer 344 | Sheik Chic 345 | Shoe Shoo 346 | Shone Shown 347 | Shoot Chute 348 | Sic Sick 349 | Side Sighed 350 | Sighs Size 351 | Sight Cite 352 | Signet Cygnet 353 | Slay Sleigh 354 | Sleight Slight 355 | Soar Sore 356 | Soared Sword 357 | Sole Soul 358 | Soled Sold 359 | Some Sum 360 | Son Sun 361 | Staid Stayed 362 | Stairs Stares 363 | Stake Steak 364 | Stationary Stationery 365 | Steal Steel 366 | Step Steppe 367 | Stile Style 368 | Straight Strait 369 | Succour Sucker 370 | Suite Sweet 371 | Symbol Cymbal 372 | Tacked Tact 373 | Tacks Tax 374 | Tail Tale 375 | Taper Tapir 376 | Taught Taut 377 | Tea Tee 378 | Team Teem 379 | Tear Tier 380 | Teas Tease 381 | Tense Tents 382 | Tern Turn 383 | Their There 384 | Threw Through 385 | Throes Throws 386 | Throne Thrown 387 | Thyme Time 388 | Tic Tick 389 | Tide 
Tied 390 | Toad Towed 391 | Toe Tow 392 | Told Tolled 393 | Too Two 394 | Tracked Tract 395 | Troop Troupe 396 | Trussed Trust 397 | Undo Undue 398 | Urn Earn 399 | Use Yews 400 | Vain Vein 401 | Vale Veil 402 | Vice Vise 403 | Wade Weighed 404 | Waist Waste 405 | Wait Weight 406 | Waive Wave 407 | Wares Wears 408 | Warn Worn 409 | Way Weigh 410 | We Wee 411 | Weak Week 412 | Whole Hole 413 | Wholly Holy 414 | Won One 415 | Wood Would 416 | Wrap Rap 417 | Wrapped Rapped 418 | Wreak Reek 419 | Wrest Rest 420 | Wretch Retch 421 | Wring Ring 422 | Write Right 423 | Wrote Rote 424 | Wrung Rung 425 | Wry Rye 426 | 427 | -------------------------------------------------------------------------------- /data/singularis.txt: -------------------------------------------------------------------------------- 1 | # http://www.singularis.ltd.uk/bifroest/misc/homophones-list.html 2 | accessary, accessory 3 | ad, add 4 | ail, ale 5 | air, heir 6 | aisle, I'll, isle 7 | all, awl 8 | allowed, aloud 9 | alms, arms 10 | altar, alter 11 | arc, ark 12 | aren't, aunt 13 | ate, eight 14 | auger, augur 15 | auk, orc 16 | aural, oral 17 | away, aweigh 18 | awe, oar, or, ore 19 | axel, axle 20 | aye, eye, I 21 | bail, bale 22 | bait, bate 23 | baize, bays 24 | bald, bawled 25 | ball, bawl 26 | band, banned 27 | bard, barred 28 | bare, bear 29 | bark, barque 30 | baron, barren 31 | base, bass 32 | bay, bey 33 | bazaar, bizarre 34 | be, bee 35 | beach, beech 36 | bean, been 37 | beat, beet 38 | beau, bow 39 | beer, bier 40 | bel, bell, belle 41 | berry, bury 42 | berth, birth 43 | bight, bite, byte 44 | billed, build 45 | bitten, bittern 46 | blew, blue 47 | bloc, block 48 | boar, bore 49 | board, bored 50 | boarder, border 51 | bold, bowled 52 | boos, booze 53 | born, borne 54 | bough, bow 55 | boy, buoy 56 | brae, bray 57 | braid, brayed 58 | braise, brays, braze 59 | brake, break 60 | bread, bred 61 | brews, bruise 62 | bridal, bridle 63 | broach, brooch 64 | bur, burr 65 | but, butt 66 | 
buy, by, bye 67 | buyer, byre 68 | calendar, calender 69 | call, caul 70 | canvas, canvass 71 | cast, caste 72 | caster, castor 73 | caught, court 74 | caw, core, corps 75 | cede, seed 76 | ceiling, sealing 77 | cell, sell 78 | censer, censor, sensor 79 | cent, scent, sent 80 | cereal, serial 81 | cheap, cheep 82 | check, cheque 83 | choir, quire 84 | chord, cord 85 | cite, sight, site 86 | clack, claque 87 | clew, clue 88 | climb, clime 89 | close, cloze 90 | coal, kohl 91 | coarse, course 92 | coign, coin 93 | colonel, kernel 94 | complacent, complaisant 95 | complement, compliment 96 | coo, coup 97 | cops, copse 98 | council, counsel 99 | cousin, cozen 100 | creak, creek 101 | crews, cruise 102 | cue, kyu, queue 103 | curb, kerb 104 | currant, current 105 | cymbol, symbol 106 | dam, damn 107 | days, daze 108 | dear, deer 109 | descent, dissent 110 | desert, dessert 111 | deviser, divisor 112 | dew, due 113 | die, dye 114 | discreet, discrete 115 | doe, doh, dough 116 | done, dun 117 | douse, dowse 118 | draft, draught 119 | dual, duel 120 | earn, urn 121 | eery, eyrie 122 | ewe, yew, you 123 | faint, feint 124 | fah, far 125 | fair, fare 126 | farther, father 127 | faun, fawn 128 | fay, fey 129 | faze, phase 130 | feat, feet 131 | ferrule, ferule 132 | few, phew 133 | fie, phi 134 | file, phial 135 | find, fined 136 | fir, fur 137 | fizz, phiz 138 | flair, flare 139 | flaw, floor 140 | flea, flee 141 | flex, flecks 142 | flew, flu, flue 143 | floe, flow 144 | flour, flower 145 | foaled, fold 146 | for, fore, four 147 | foreword, forward 148 | fort, fought 149 | forth, fourth 150 | foul, fowl 151 | franc, frank 152 | freeze, frieze 153 | friar, fryer 154 | furs, furze 155 | gait, gate 156 | galipot, gallipot 157 | gallop, galop 158 | gamble, gambol 159 | gays, gaze 160 | genes, jeans 161 | gild, guild 162 | gilt, guilt 163 | giro, gyro 164 | gnaw, nor 165 | gneiss, nice 166 | gorilla, guerilla 167 | grate, great 168 | greave, grieve 169 | greys, graze 170 | 
grisly, grizzly 171 | groan, grown 172 | guessed, guest 173 | hail, hale 174 | hair, hare 175 | hall, haul 176 | hangar, hanger 177 | hart, heart 178 | haw, hoar, whore 179 | hay, hey 180 | heal, heel, he'll 181 | hear, here 182 | heard, herd 183 | he'd, heed 184 | heroin, heroine 185 | hew, hue 186 | hi, high 187 | higher, hire 188 | him, hymn 189 | ho, hoe 190 | hoard, horde 191 | hoarse, horse 192 | holey, holy, wholly 193 | hour, our 194 | idle, idol 195 | in, inn 196 | indict, indite 197 | it's, its 198 | jewel, joule 199 | key, quay 200 | knave, nave 201 | knead, need 202 | knew, new 203 | knight, night 204 | knit, nit 205 | knob, nob 206 | knock, nock 207 | knot, not 208 | know, no 209 | knows, nose 210 | laager, lager 211 | lac, lack 212 | lade, laid 213 | lain, lane 214 | lam, lamb 215 | laps, lapse 216 | larva, lava 217 | lase, laze 218 | law, lore 219 | lay, ley 220 | lea, lee 221 | leach, leech 222 | lead, led 223 | leak, leek 224 | lean, lien 225 | lessen, lesson 226 | levee, levy 227 | liar, lyre 228 | licence, license 229 | licker, liquor 230 | lie, lye 231 | lieu, loo 232 | links, lynx 233 | lo, low 234 | load, lode 235 | loan, lone 236 | locks, lox 237 | loop, loupe 238 | loot, lute 239 | made, maid 240 | mail, male 241 | main, mane 242 | maize, maze 243 | mall, maul 244 | manna, manner 245 | mantel, mantle 246 | mare, mayor 247 | mark, marque 248 | marshal, martial 249 | marten, martin 250 | mask, masque 251 | maw, more 252 | me, mi 253 | mean, mien 254 | meat, meet, mete 255 | medal, meddle 256 | metal, mettle 257 | meter, metre 258 | might, mite 259 | miner, minor, mynah 260 | mind, mined 261 | missed, mist 262 | moat, mote 263 | mode, mowed 264 | moor, more 265 | moose, mousse 266 | morning, mourning 267 | muscle, mussel 268 | naval, navel 269 | nay, neigh 270 | nigh, nye 271 | none, nun 272 | od, odd 273 | ode, owed 274 | oh, owe 275 | one, won 276 | packed, pact 277 | packs, pax 278 | pail, pale 279 | pain, pane 280 | pair, pare, pear 281 | 
palate, palette, pallet 282 | pascal, paschal 283 | paten, patten, pattern 284 | pause, paws, pores, pours 285 | pawn, porn 286 | pea, pee 287 | peace, piece 288 | peak, peek, peke, pique 289 | peal, peel 290 | pearl, purl 291 | pedal, peddle 292 | peer, pier 293 | pi, pie 294 | pica, pika 295 | place, plaice 296 | plain, plane 297 | pleas, please 298 | plum, plumb 299 | pole, poll 300 | poof, pouffe 301 | practice, practise 302 | praise, prays, preys 303 | principal, principle 304 | profit, prophet 305 | quarts, quartz 306 | quean, queen 307 | rain, reign, rein 308 | raise, rays, raze 309 | rap, wrap 310 | raw, roar 311 | read, reed 312 | read, red 313 | real, reel 314 | reek, wreak 315 | rest, wrest 316 | retch, wretch 317 | review, revue 318 | rheum, room 319 | right, rite, wright, write 320 | ring, wring 321 | road, rode 322 | roe, row 323 | role, roll 324 | roo, roux, rue 325 | rood, rude 326 | root, route 327 | rose, rows 328 | rota, rotor 329 | rote, wrote 330 | rough, ruff 331 | rouse, rows 332 | rung, wrung 333 | rye, wry 334 | saver, savour 335 | spade, spayed 336 | sale, sail 337 | sane, seine 338 | satire, satyr 339 | sauce, source 340 | saw, soar, sore 341 | scene, seen 342 | scull, skull 343 | sea, see 344 | seam, seem 345 | sear, seer, sere 346 | seas, sees, seize 347 | sew, so, sow 348 | shake, sheikh 349 | shear, sheer 350 | shoe, shoo 351 | sic, sick 352 | side, sighed 353 | sign, sine 354 | sink, synch 355 | slay, sleigh 356 | sloe, slow 357 | sole, soul 358 | some, sum 359 | son, sun 360 | sort, sought 361 | spa, spar 362 | staid, stayed 363 | stair, stare 364 | stake, steak 365 | stalk, stork 366 | stationary, stationery 367 | steal, steel 368 | stile, style 369 | storey, story 370 | straight, strait 371 | sweet, suite 372 | swat, swot 373 | tacks, tax 374 | tale, tail 375 | talk, torque 376 | tare, tear 377 | taught, taut, tort 378 | te, tea, tee 379 | team, teem 380 | tear, tier 381 | teas, tease 382 | terce, terse 383 | tern, turn 384 | 
there, their, they're 385 | threw, through 386 | throes, throws 387 | throne, thrown 388 | thyme, time 389 | tic, tick 390 | tide, tied 391 | tire, tyre 392 | to, too, two 393 | toad, toed, towed 394 | told, tolled 395 | tole, toll 396 | ton, tun 397 | tor, tore 398 | tough, tuff 399 | troop, troupe 400 | tuba, tuber 401 | vain, vane, vein 402 | vale, veil 403 | vial, vile 404 | wail, wale, whale 405 | wain, wane 406 | waist, waste 407 | wait, weight 408 | waive, wave 409 | wall, waul 410 | war, wore 411 | ware, wear, where 412 | warn, worn 413 | wart, wort 414 | watt, what 415 | wax, whacks 416 | way, weigh, whey 417 | we, wee, whee 418 | weak, week 419 | we'd, weed 420 | weal, we'll, wheel 421 | wean, ween 422 | weather, whether 423 | weaver, weever 424 | weir, we're 425 | were, whirr 426 | wet, whet 427 | wheald, wheeled 428 | which, witch 429 | whig, wig 430 | while, wile 431 | whine, wine 432 | whirl, whorl 433 | whirled, world 434 | whit, wit 435 | white, wight 436 | who's, whose 437 | woe, whoa 438 | wood, would 439 | yaw, yore, your, you're 440 | yoke, yolk 441 | you'll, yule 442 | -------------------------------------------------------------------------------- /data/parsers.ipynb: -------------------------------------------------------------------------------- 1 | { 2 | "cells": [ 3 | { 4 | "cell_type": "markdown", 5 | "metadata": {}, 6 | "source": [ 7 | "# Similar sounding words\n", 8 | "\n", 9 | "This is a list of similar sounding words that I have collected from various sources on the web and added to as I find new pairs.\n", 10 | "\n", 11 | "Unlike most homophone, homograph, and homonym resources this list is not targeting ESL or educational use. Instead it is designed for finding common errors in speech recognition texts. Specifically I use it with [Caster](https://caster.readthedocs.io/en/latest/) for voice programming.\n", 12 | "\n", 13 | "I currently have five different sources. 
I've downloaded their contents as text files, or in one case HTML and parsed appropriately. I have also linked to the original location of these files both inside the files and in the headings between Jupyter cells below.\n", 14 | "\n", 15 | "Unfortunately I wasn't thinking about reproducibility when I started this project, so most of the text files have had a bit of light preprocessing in a text editor. Given that I don't expect these source lists to change in the future, I don't think it will be a problem." 16 | ] 17 | }, 18 | { 19 | "cell_type": "code", 20 | "execution_count": 2, 21 | "metadata": {}, 22 | "outputs": [], 23 | "source": [ 24 | "from bs4 import BeautifulSoup # pip install beautifulsoup4\n", 25 | "from disjoint_set import DisjointSet # pip install disjoint-set\n", 26 | "import re\n", 27 | "from pprint import pformat" 28 | ] 29 | }, 30 | { 31 | "cell_type": "markdown", 32 | "metadata": {}, 33 | "source": [ 34 | "# [7esl.html](https://7esl.com/homophones/)" 35 | ] 36 | }, 37 | { 38 | "cell_type": "code", 39 | "execution_count": 3, 40 | "metadata": {}, 41 | "outputs": [], 42 | "source": [ 43 | "contents = open(\"7esl.html\", encoding=\"utf8\").read()\n", 44 | "parser = BeautifulSoup(contents, 'html.parser')" 45 | ] 46 | }, 47 | { 48 | "cell_type": "code", 49 | "execution_count": 4, 50 | "metadata": {}, 51 | "outputs": [ 52 | { 53 | "output_type": "execute_result", 54 | "data": { 55 | "text/plain": "ste', 'waist'],\n ['way', 'weigh'],\n ['weak', 'week'],\n ['weather', 'whether'],\n ['where', 'wear'],\n ['which', 'witch'],\n [\"who''s\", 'whose'],\n ['won', 'one'],\n ['would', 'wood'],\n [\"you''re\", 'your']]" 56 | }, 57 | "metadata": {}, 58 | "execution_count": 4 59 | } 60 | ], 61 | "source": [ 62 | "similar_7esl = []\n", 63 | "for element in parser.find_all(\"p\"):\n", 64 | " candidate = element.find(\"strong\")\n", 65 | " if candidate:\n", 66 | " partitions = candidate.text.lower().split(\" —– \")\n", 67 | " if len(partitions) > 1:\n", 68 | " words = 
[]\n", 69 | " for p in partitions:\n", 70 | " words.extend(s.strip().replace('’', \"''\") for s in p.split(\"/\"))\n", 71 | " \n", 72 | " similar_7esl.append(words)\n", 73 | "similar_7esl" 74 | ] 75 | }, 76 | { 77 | "cell_type": "markdown", 78 | "metadata": {}, 79 | "source": [ 80 | "# [ku.txt](https://web.ku.edu/~edit/wordsall.html)" 81 | ] 82 | }, 83 | { 84 | "cell_type": "code", 85 | "execution_count": 5, 86 | "metadata": {}, 87 | "outputs": [ 88 | { 89 | "output_type": "execute_result", 90 | "data": { 91 | "text/plain": ",\n ['wane', 'wain'],\n ['want', 'wont'],\n ['wean', 'ween'],\n ['wear', 'ware'],\n ['weather', 'wether', 'whether'],\n ['whither', 'wither'],\n ['worst', 'wurst'],\n ['yew', 'ewe', 'you'],\n ['yoke', 'yolk']]" 92 | }, 93 | "metadata": {}, 94 | "execution_count": 5 95 | } 96 | ], 97 | "source": [ 98 | "contents = open(\"ku.txt\").read().lower().splitlines()[1:]\n", 99 | "similar_ku = [s.split(';') for s in contents]\n", 100 | "similar_ku" 101 | ] 102 | }, 103 | { 104 | "cell_type": "markdown", 105 | "metadata": {}, 106 | "source": [ 107 | "# [singularis.txt](http://www.singularis.ltd.uk/bifroest/misc/homophones-list.html)" 108 | ] 109 | }, 110 | { 111 | "cell_type": "code", 112 | "execution_count": 6, 113 | "metadata": {}, 114 | "outputs": [ 115 | { 116 | "output_type": "execute_result", 117 | "data": { 118 | "text/plain": "'],\n ['whirled', 'world'],\n ['whit', 'wit'],\n ['white', 'wight'],\n [\"who's\", 'whose'],\n ['woe', 'whoa'],\n ['wood', 'would'],\n ['yaw', 'yore', 'your', \"you're\"],\n ['yoke', 'yolk'],\n [\"you'll\", 'yule']]" 119 | }, 120 | "metadata": {}, 121 | "execution_count": 6 122 | } 123 | ], 124 | "source": [ 125 | "contents = open(\"singularis.txt\").read().lower().splitlines()[1:]\n", 126 | "similar_singularis = [s.split(', ') for s in contents]\n", 127 | "similar_singularis" 128 | ] 129 | }, 130 | { 131 | "cell_type": "markdown", 132 | "metadata": {}, 133 | "source": [ 134 | "# 
[teachingtreasures.txt](https://www.teachingtreasures.com.au/teaching-tools/Basic-worksheets/worksheets-english/upper/homophones-list.htm)" 135 | ] 136 | }, 137 | { 138 | "cell_type": "code", 139 | "execution_count": 7, 140 | "metadata": {}, 141 | "outputs": [ 142 | { 143 | "output_type": "execute_result", 144 | "data": { 145 | "text/plain": "['wrap', 'rap'],\n ['wrapped', 'rapped'],\n ['wreak', 'reek'],\n ['wrest', 'rest'],\n ['wretch', 'retch'],\n ['wring', 'ring'],\n ['write', 'right'],\n ['wrote', 'rote'],\n ['wrung', 'rung'],\n ['wry', 'rye']]" 146 | }, 147 | "metadata": {}, 148 | "execution_count": 7 149 | } 150 | ], 151 | "source": [ 152 | "contents = open(\"teachingtreasures.txt\").read().lower().splitlines()[1:]\n", 153 | "similar_teachingtreasures = [s.split(' ') for s in contents if s]\n", 154 | "similar_teachingtreasures" 155 | ] 156 | }, 157 | { 158 | "cell_type": "markdown", 159 | "metadata": {}, 160 | "source": [ 161 | "# [thoughtco](https://www.thoughtco.com/homonyms-homophones-and-homographs-a-b-1692660)" 162 | ] 163 | }, 164 | { 165 | "cell_type": "code", 166 | "execution_count": 8, 167 | "metadata": {}, 168 | "outputs": [ 169 | { 170 | "output_type": "execute_result", 171 | "data": { 172 | "text/plain": "],\n ['war', 'wore'],\n ['warn', 'worn'],\n ['way', 'weigh'],\n ['we', 'wee'],\n ['weak', 'week'],\n ['wear', 'where'],\n ['weather', 'whether'],\n ['which', 'witch'],\n ['wood', 'would'],\n ['your', \"you're\"]]" 173 | }, 174 | "metadata": {}, 175 | "execution_count": 8 176 | } 177 | ], 178 | "source": [ 179 | "contents = open(\"thoughtco.txt\").read().lower().splitlines()[1:]\n", 180 | "similar_thoughtco = [s.split(' ') for s in contents if s]\n", 181 | "similar_thoughtco" 182 | ] 183 | }, 184 | { 185 | "cell_type": "markdown", 186 | "metadata": {}, 187 | "source": [ 188 | "# My personal list of words not found above\n", 189 | "\n", 190 | "These were identified through trial and error (actually, just error) during dictation. 
Pull Requests welcome. These words tend to be commonly confused in Dragon, but are not generally recognized as homophones." 191 | ] 192 | }, 193 | { 194 | "cell_type": "code", 195 | "execution_count": 9, 196 | "metadata": {}, 197 | "outputs": [ 198 | { 199 | "output_type": "execute_result", 200 | "data": { 201 | "text/plain": "wo'],\n ['93', 'ninety-three'],\n ['94', 'ninety-four'],\n ['95', 'ninety-five'],\n ['96', 'ninety-six'],\n ['97', 'ninety-seven'],\n ['98', 'ninety-eight'],\n ['99', 'ninety-nine'],\n ['100', 'one hundred']]" 202 | }, 203 | "metadata": {}, 204 | "execution_count": 9 205 | } 206 | ], 207 | "source": [ 208 | "contents = open(\"numbers.txt\").read().lower().splitlines()[1:]\n", 209 | "similar_numbers = [s.lower().split(',') for s in contents if s]\n", 210 | "similar_numbers" 211 | ] 212 | }, 213 | { 214 | "cell_type": "code", 215 | "execution_count": 10, 216 | "metadata": {}, 217 | "outputs": [ 218 | { 219 | "output_type": "execute_result", 220 | "data": { 221 | "text/plain": "', 'end'],\n ['are', 'r'],\n ['at', 'add', 'ad'],\n ['create', 'crate'],\n ['grade', 'grate', 'great', 'grid'],\n ['peer', 'pure'],\n ['poll', 'paul', 'pull', 'pole'],\n ['rust', 'rest'],\n ['right', 'rate']]" 222 | }, 223 | "metadata": {}, 224 | "execution_count": 10 225 | } 226 | ], 227 | "source": [ 228 | "contents = open(\"dusty.txt\").read().lower().splitlines()[1:]\n", 229 | "similar_dusty = [s.lower().split(',') for s in contents if s]\n", 230 | "similar_dusty" 231 | ] 232 | }, 233 | { 234 | "cell_type": "markdown", 235 | "metadata": {}, 236 | "source": [ 237 | "# Join it all together\n", 238 | "We want a list of all possible sets of words. This list of lists will surely contain duplicates (in fact, mostly duplicates).\n", 239 | "\n", 240 | "I have done a visual sanity check in all the outputs above, but I'll do another below." 
241 | ] 242 | }, 243 | { 244 | "cell_type": "code", 245 | "execution_count": 11, 246 | "metadata": {}, 247 | "outputs": [], 248 | "source": [ 249 | "similar_words = []\n", 250 | "similar_words.extend(similar_7esl)\n", 251 | "similar_words.extend(similar_ku)\n", 252 | "similar_words.extend(similar_singularis)\n", 253 | "similar_words.extend(similar_teachingtreasures)\n", 254 | "similar_words.extend(similar_thoughtco)\n", 255 | "similar_words.extend(similar_numbers)\n", 256 | "similar_words.extend(similar_dusty)" 257 | ] 258 | }, 259 | { 260 | "cell_type": "code", 261 | "execution_count": 12, 262 | "metadata": { 263 | "tags": [ 264 | "outputPrepend" 265 | ] 266 | }, 267 | "outputs": [ 268 | { 269 | "output_type": "stream", 270 | "name": "stdout", 271 | "text": "\n39\n40\n41\n42\n43\n44\n45\n46\n47\n48\n49\n50\n51\n52\n53\n54\n55\n56\n57\n58\n59\n60\n61\n62\n63\n64\n65\n66\n67\n68\n69\n70\n71\n72\n73\n74\n75\n76\n77\n78\n79\n80\n81\n82\n83\n84\n85\n86\n87\n88\n89\n90\n91\n92\n93\n94\n95\n96\n97\n98\n99\n100\none hundred\n" 272 | } 273 | ], 274 | "source": [ 275 | "regex = re.compile(\"^[a-z'-]+$\")\n", 276 | "for similar in similar_words:\n", 277 | " if len(set(similar)) < 2:\n", 278 | " print(similar)\n", 279 | " for word in similar:\n", 280 | " if not regex.match(word):\n", 281 | " print(word)" 282 | ] 283 | }, 284 | { 285 | "cell_type": "markdown", 286 | "metadata": {}, 287 | "source": [ 288 | "# Dedup\n", 289 | "\n", 290 | "Removing duplicates is not trivial, since the different sets of words may include multiple variations (for example, one set has *your* and *you're* and another includes *yore*). It would be easy enough to just do a double loop, but disjoint sets are my favourite data structure, and I've never actually had an opportunity to use them in production code before. Read up on the union-find algorithm if you're unfamiliar with it; it's pretty cool." 
291 | ] 292 | }, 293 | { 294 | "cell_type": "code", 295 | "execution_count": 13, 296 | "metadata": {}, 297 | "outputs": [ 298 | { 299 | "output_type": "execute_result", 300 | "data": { 301 | "text/plain": " ['whither', 'wither'],\n [\"who''s\", \"who's\", 'whose'],\n ['whoa', 'woe'],\n ['wood', 'would'],\n ['worst', 'wurst'],\n ['yaw', 'yore', \"you''re\", \"you're\", 'your'],\n ['yoke', 'yolk'],\n [\"you'll\", 'yule']]" 302 | }, 303 | "metadata": {}, 304 | "execution_count": 13 305 | } 306 | ], 307 | "source": [ 308 | "word_set = DisjointSet()\n", 309 | "for word_list in similar_words:\n", 310 | " for word in word_list[1:]:\n", 311 | " word_set.union(word_list[0], word)\n", 312 | " \n", 313 | "wordsets = sorted(sorted(s) for s in word_set.itersets())\n", 314 | "wordsets" 315 | ] 316 | }, 317 | { 318 | "cell_type": "code", 319 | "execution_count": 14, 320 | "metadata": {}, 321 | "outputs": [ 322 | { 323 | "output_type": "execute_result", 324 | "data": { 325 | "text/plain": "761" 326 | }, 327 | "metadata": {}, 328 | "execution_count": 14 329 | } 330 | ], 331 | "source": [ 332 | "len(wordsets)" 333 | ] 334 | }, 335 | { 336 | "cell_type": "markdown", 337 | "metadata": {}, 338 | "source": [ 339 | "# Redupe\n", 340 | "\n", 341 | "The final output is a dictionary of words mapping to all the words similar to that word, not including that word." 
342 | ] 343 | }, 344 | { 345 | "cell_type": "code", 346 | "execution_count": 15, 347 | "metadata": {}, 348 | "outputs": [ 349 | { 350 | "output_type": "execute_result", 351 | "data": { 352 | "text/plain": "al', 'marshall'],\n 'mark': ['marque'],\n 'marque': ['mark'],\n 'marry': ['material', 'materiel', 'merry'],\n 'material': ['marry', 'materiel', 'merry'],\n 'materiel': ['marry', 'material', 'merry'],\n ...}" 353 | }, 354 | "metadata": {}, 355 | "execution_count": 15 356 | } 357 | ], 358 | "source": [ 359 | "index = {}\n", 360 | "for similar in wordsets:\n", 361 | " for word in similar:\n", 362 | " local = similar.copy()\n", 363 | " local.remove(word)\n", 364 | " index[word] = local\n", 365 | " \n", 366 | "index" 367 | ] 368 | }, 369 | { 370 | "cell_type": "code", 371 | "execution_count": 16, 372 | "metadata": {}, 373 | "outputs": [ 374 | { 375 | "output_type": "execute_result", 376 | "data": { 377 | "text/plain": "1651" 378 | }, 379 | "metadata": {}, 380 | "execution_count": 16 381 | } 382 | ], 383 | "source": [ 384 | "len(index)" 385 | ] 386 | }, 387 | { 388 | "cell_type": "code", 389 | "execution_count": 17, 390 | "metadata": {}, 391 | "outputs": [], 392 | "source": [ 393 | "with open(\"../similar_sounding_words.py\", \"w\") as file:\n", 394 | " file.write(\"index = \" + pformat(index))" 395 | ] 396 | } 397 | ], 398 | "metadata": { 399 | "kernelspec": { 400 | "display_name": "Python 3", 401 | "language": "python", 402 | "name": "python3" 403 | }, 404 | "language_info": { 405 | "codemirror_mode": { 406 | "name": "ipython", 407 | "version": 3 408 | }, 409 | "file_extension": ".py", 410 | "mimetype": "text/x-python", 411 | "name": "python", 412 | "nbconvert_exporter": "python", 413 | "pygments_lexer": "ipython3", 414 | "version": "3.8.3-candidate" 415 | } 416 | }, 417 | "nbformat": 4, 418 | "nbformat_minor": 4 419 | } -------------------------------------------------------------------------------- /similar_sounding_words.py: 
-------------------------------------------------------------------------------- 1 | index = {'1': ['one', 'won'], 2 | '10': ['ten'], 3 | '100': ['one hundred'], 4 | '11': ['eleven'], 5 | '12': ['twelve'], 6 | '13': ['thirteen'], 7 | '14': ['fourteen'], 8 | '15': ['fifteen'], 9 | '16': ['sixteen'], 10 | '17': ['seventeen'], 11 | '18': ['eighteen'], 12 | '19': ['nineteen'], 13 | '2': ['to', 'toe', 'too', 'tow', 'two'], 14 | '20': ['twenty'], 15 | '21': ['twenty-one'], 16 | '22': ['twenty-two'], 17 | '23': ['twenty-three'], 18 | '24': ['twenty-four'], 19 | '25': ['twenty-five'], 20 | '26': ['twenty-six'], 21 | '27': ['twenty-seven'], 22 | '28': ['twenty-eight'], 23 | '29': ['twenty-nine'], 24 | '3': ['three'], 25 | '30': ['thirty'], 26 | '31': ['thirty-one'], 27 | '32': ['thirty-two'], 28 | '33': ['thirty-three'], 29 | '34': ['thirty-four'], 30 | '35': ['thirty-five'], 31 | '36': ['thirty-six'], 32 | '37': ['thirty-seven'], 33 | '38': ['thirty-eight'], 34 | '39': ['thirty-nine'], 35 | '4': ['for', 'fore', 'forth', 'four', 'fourth'], 36 | '40': ['forty'], 37 | '41': ['forty-one'], 38 | '42': ['forty-two'], 39 | '43': ['forty-three'], 40 | '44': ['forty-four'], 41 | '45': ['forty-five'], 42 | '46': ['forty-six'], 43 | '47': ['forty-seven'], 44 | '48': ['forty-eight'], 45 | '49': ['forty-nine'], 46 | '5': ['five'], 47 | '50': ['fifty'], 48 | '51': ['fifty-one'], 49 | '52': ['fifty-two'], 50 | '53': ['fifty-three'], 51 | '54': ['fifty-four'], 52 | '55': ['fifty-five'], 53 | '56': ['fifty-six'], 54 | '57': ['fifty-seven'], 55 | '58': ['fifty-eight'], 56 | '59': ['fifty-nine'], 57 | '6': ['six'], 58 | '60': ['sixty'], 59 | '61': ['sixty-one'], 60 | '62': ['sixty-two'], 61 | '63': ['sixty-three'], 62 | '64': ['sixty-four'], 63 | '65': ['sixty-five'], 64 | '66': ['sixty-six'], 65 | '67': ['sixty-seven'], 66 | '68': ['sixty-eight'], 67 | '69': ['sixty-nine'], 68 | '7': ['seven'], 69 | '70': ['seventy'], 70 | '71': ['seventy-one'], 71 | '72': ['seventy-two'], 72 | '73': 
['seventy-three'], 73 | '74': ['seventy-four'], 74 | '75': ['seventy-five'], 75 | '76': ['seventy-six'], 76 | '77': ['seventy-seven'], 77 | '78': ['seventy-eight'], 78 | '79': ['seventy-nine'], 79 | '8': ['ate', 'eight'], 80 | '80': ['eighty'], 81 | '81': ['eighty-one'], 82 | '82': ['eighty-two'], 83 | '83': ['eighty-three'], 84 | '84': ['eighty-four'], 85 | '85': ['eighty-five'], 86 | '86': ['eighty-six'], 87 | '87': ['eighty-seven'], 88 | '88': ['eighty-eight'], 89 | '89': ['eighty-nine'], 90 | '9': ['nine'], 91 | '90': ['ninety'], 92 | '91': ['ninety-one'], 93 | '92': ['ninety-two'], 94 | '93': ['ninety-three'], 95 | '94': ['ninety-four'], 96 | '95': ['ninety-five'], 97 | '96': ['ninety-six'], 98 | '97': ['ninety-seven'], 99 | '98': ['ninety-eight'], 100 | '99': ['ninety-nine'], 101 | 'accede': ['exceed'], 102 | 'accept': ['except'], 103 | 'access': ['excess'], 104 | 'accessary': ['accessory'], 105 | 'accessory': ['accessary'], 106 | 'ad': ['add', 'at'], 107 | 'adapt': ['adept', 'adopt'], 108 | 'add': ['ad', 'at'], 109 | 'adept': ['adapt', 'adopt'], 110 | 'adopt': ['adapt', 'adept'], 111 | 'advice': ['advise'], 112 | 'advise': ['advice'], 113 | 'aerie': ['airy', 'eerie'], 114 | 'aid': ['aide'], 115 | 'aide': ['aid'], 116 | 'ail': ['ale'], 117 | 'air': ['ere', 'heir'], 118 | 'airy': ['aerie', 'eerie'], 119 | 'aisle': ["i'll", 'isle'], 120 | 'ale': ['ail'], 121 | 'all': ['awl'], 122 | 'alley': ['ally'], 123 | 'allowed': ['aloud'], 124 | 'allready': ['already'], 125 | 'allude': ['elude'], 126 | 'allusion': ['illusion'], 127 | 'ally': ['alley'], 128 | 'alms': ['arms'], 129 | 'aloud': ['allowed'], 130 | 'already': ['allready'], 131 | 'altar': ['alter'], 132 | 'alter': ['altar'], 133 | 'an': ['and', 'end'], 134 | 'and': ['an', 'end'], 135 | 'ant': ["aren't", 'aunt'], 136 | 'appraise': ['apprise'], 137 | 'apprise': ['appraise'], 138 | 'arc': ['ark'], 139 | 'are': ['r'], 140 | "aren't": ['ant', 'aunt'], 141 | 'ark': ['arc'], 142 | 'arms': ['alms'], 143 | 'ascent': 
['assent'], 144 | 'assay': ['essay'], 145 | 'assent': ['ascent'], 146 | 'at': ['ad', 'add'], 147 | 'ate': ['8', 'eight'], 148 | 'attendance': ['attendants'], 149 | 'attendants': ['attendance'], 150 | 'auger': ['augur'], 151 | 'aught': ['ought'], 152 | 'augur': ['auger'], 153 | 'auk': ['orc'], 154 | 'aunt': ['ant', "aren't"], 155 | 'aural': ['oral'], 156 | 'auricle': ['oracle'], 157 | 'average': ['median', 'normal'], 158 | 'away': ['aweigh'], 159 | 'awe': ['oar', 'oh', 'or', 'ore', 'owe'], 160 | 'aweigh': ['away'], 161 | 'awl': ['all'], 162 | 'axel': ['axle'], 163 | 'axes': ['axis'], 164 | 'axis': ['axes'], 165 | 'axle': ['axel'], 166 | 'aye': ['eye', 'i'], 167 | 'bail': ['bale'], 168 | 'bait': ['bate'], 169 | 'baited': ['bated'], 170 | 'baize': ['bays'], 171 | 'bald': ['bawled'], 172 | 'bale': ['bail'], 173 | 'ball': ['bawl'], 174 | 'band': ['banned'], 175 | 'banned': ['band'], 176 | 'bard': ['barred'], 177 | 'bare': ['bear'], 178 | 'bark': ['barque'], 179 | 'baron': ['barren'], 180 | 'barque': ['bark'], 181 | 'barred': ['bard'], 182 | 'barren': ['baron'], 183 | 'base': ['bass'], 184 | 'based': ['baste'], 185 | 'bases': ['basis'], 186 | 'basis': ['bases'], 187 | 'bass': ['base'], 188 | 'baste': ['based'], 189 | 'bate': ['bait'], 190 | 'bated': ['baited'], 191 | 'bawl': ['ball'], 192 | 'bawled': ['bald'], 193 | 'bay': ['bey'], 194 | 'bays': ['baize'], 195 | 'bazaar': ['bizarre'], 196 | 'be': ['bee'], 197 | 'beach': ['beech'], 198 | 'bean': ['been'], 199 | 'bear': ['bare'], 200 | 'beat': ['beet'], 201 | 'beau': ['bough', 'bow'], 202 | 'bee': ['be'], 203 | 'beech': ['beach'], 204 | 'been': ['bean'], 205 | 'beer': ['bier'], 206 | 'beet': ['beat'], 207 | 'bel': ['bell', 'belle'], 208 | 'bell': ['bel', 'belle'], 209 | 'belle': ['bel', 'bell'], 210 | 'berry': ['bury'], 211 | 'berth': ['birth'], 212 | 'bey': ['bay'], 213 | 'bier': ['beer'], 214 | 'bight': ['bite', 'byte'], 215 | 'billed': ['build'], 216 | 'birth': ['berth'], 217 | 'bite': ['bight', 'byte'], 218 | 'bitten': 
['bittern'], 219 | 'bittern': ['bitten'], 220 | 'bizarre': ['bazaar'], 221 | 'blew': ['blue'], 222 | 'bloc': ['block'], 223 | 'block': ['bloc'], 224 | 'blue': ['blew'], 225 | 'boar': ['bore'], 226 | 'board': ['bored'], 227 | 'boarder': ['border'], 228 | 'bold': ['bowled'], 229 | 'bolder': ['boulder'], 230 | 'boos': ['booze'], 231 | 'bootie': ['booty'], 232 | 'booty': ['bootie'], 233 | 'booze': ['boos'], 234 | 'border': ['boarder'], 235 | 'bore': ['boar'], 236 | 'bored': ['board'], 237 | 'born': ['borne'], 238 | 'borne': ['born'], 239 | 'borough': ['burro', 'burrow'], 240 | 'bough': ['beau', 'bow'], 241 | 'bouillon': ['bullion'], 242 | 'boulder': ['bolder'], 243 | 'bow': ['beau', 'bough'], 244 | 'bowled': ['bold'], 245 | 'boy': ['buoy'], 246 | 'brae': ['bray'], 247 | 'braid': ['brayed'], 248 | 'braise': ['brays', 'braze'], 249 | 'brake': ['break'], 250 | 'bray': ['brae'], 251 | 'brayed': ['braid'], 252 | 'brays': ['braise', 'braze'], 253 | 'braze': ['braise', 'brays'], 254 | 'breach': ['breech'], 255 | 'bread': ['bred'], 256 | 'break': ['brake'], 257 | 'bred': ['bread'], 258 | 'breech': ['breach'], 259 | 'brewed': ['brood'], 260 | 'brews': ['bruise'], 261 | 'bridal': ['bridle'], 262 | 'bridle': ['bridal'], 263 | 'bring': ['take'], 264 | 'broach': ['brooch'], 265 | 'brooch': ['broach'], 266 | 'brood': ['brewed'], 267 | 'brows': ['browse'], 268 | 'browse': ['brows'], 269 | 'bruise': ['brews'], 270 | 'build': ['billed'], 271 | 'bullion': ['bouillon'], 272 | 'buoy': ['boy'], 273 | 'bur': ['burr'], 274 | 'burr': ['bur'], 275 | 'burro': ['borough', 'burrow'], 276 | 'burrow': ['borough', 'burro'], 277 | 'bury': ['berry'], 278 | 'but': ['butt'], 279 | 'butt': ['but'], 280 | 'buy': ['by', 'bye'], 281 | 'buyer': ['byre'], 282 | 'by': ['buy', 'bye'], 283 | 'bye': ['buy', 'by'], 284 | 'byre': ['buyer'], 285 | 'byte': ['bight', 'bite'], 286 | 'caddie': ['caddy'], 287 | 'caddy': ['caddie'], 288 | 'calendar': ['calender'], 289 | 'calender': ['calendar'], 290 | 'call': ['caul'], 
291 | 'callous': ['callus'], 292 | 'callus': ['callous'], 293 | 'cannon': ['canon'], 294 | 'canon': ['cannon'], 295 | 'canter': ['cantor'], 296 | 'cantor': ['canter'], 297 | 'canvas': ['canvass'], 298 | 'canvass': ['canvas'], 299 | 'capital': ['capitol'], 300 | 'capitol': ['capital'], 301 | 'carat': ['carrot'], 302 | 'carol': ['carrel'], 303 | 'carrel': ['carol'], 304 | 'carrot': ['carat'], 305 | 'cast': ['caste'], 306 | 'caste': ['cast'], 307 | 'caster': ['castor'], 308 | 'castor': ['caster'], 309 | 'caught': ['court'], 310 | 'caul': ['call'], 311 | 'caw': ['core', 'corps'], 312 | 'cede': ['seed'], 313 | 'ceiling': ['sealing'], 314 | 'cell': ['sell'], 315 | 'cellar': ['seller'], 316 | 'censer': ['censor', 'censure', 'sensor'], 317 | 'censor': ['censer', 'censure', 'sensor'], 318 | 'censure': ['censer', 'censor', 'sensor'], 319 | 'census': ['sense'], 320 | 'cent': ['scent', 'sent'], 321 | 'cereal': ['serial'], 322 | 'cession': ['session'], 323 | 'chance': ['chants'], 324 | 'chantey': ['shanty'], 325 | 'chants': ['chance'], 326 | 'chased': ['chaste'], 327 | 'chaste': ['chased'], 328 | 'cheap': ['cheep'], 329 | 'check': ['cheque'], 330 | 'cheep': ['cheap'], 331 | 'cheque': ['check'], 332 | 'chews': ['choose'], 333 | 'chic': ['sheik'], 334 | 'chile': ['chili', 'chilli', 'chilly'], 335 | 'chili': ['chile', 'chilli', 'chilly'], 336 | 'chilli': ['chile', 'chili', 'chilly'], 337 | 'chilly': ['chile', 'chili', 'chilli'], 338 | 'choir': ['quire'], 339 | 'choose': ['chews'], 340 | 'choral': ['coral'], 341 | 'chord': ['cord', 'cored'], 342 | 'chute': ['shoot'], 343 | 'cite': ['sight', 'site'], 344 | 'clack': ['claque'], 345 | 'claque': ['clack'], 346 | 'clause': ['claws'], 347 | 'claws': ['clause'], 348 | 'clew': ['clue'], 349 | 'climb': ['clime'], 350 | 'clime': ['climb'], 351 | 'close': ['clothes', 'cloze'], 352 | 'clothes': ['close', 'cloze'], 353 | 'cloze': ['close', 'clothes'], 354 | 'clue': ['clew'], 355 | 'coal': ['kohl'], 356 | 'coarse': ['course'], 357 | 'coign': 
['coin'], 358 | 'coin': ['coign'], 359 | 'colonel': ['kernel'], 360 | 'complacent': ['complaisant'], 361 | 'complaisant': ['complacent'], 362 | 'complement': ['compliment'], 363 | 'compliment': ['complement'], 364 | 'confidant': ['confident'], 365 | 'confident': ['confidant'], 366 | 'coo': ['coup'], 367 | 'cops': ['copse'], 368 | 'copse': ['cops'], 369 | 'coral': ['choral'], 370 | 'cord': ['chord', 'cored'], 371 | 'core': ['caw', 'corps'], 372 | 'cored': ['chord', 'cord'], 373 | 'corps': ['caw', 'core'], 374 | 'council': ['counsel'], 375 | 'counsel': ['council'], 376 | 'coup': ['coo'], 377 | 'course': ['coarse'], 378 | 'court': ['caught'], 379 | 'cousin': ['cozen'], 380 | 'coward': ['cowered'], 381 | 'cowered': ['coward'], 382 | 'cozen': ['cousin'], 383 | 'crate': ['create'], 384 | 'creak': ['creek'], 385 | 'create': ['crate'], 386 | 'creek': ['creak'], 387 | 'crewel': ['cruel'], 388 | 'crews': ['cruise'], 389 | 'cruel': ['crewel'], 390 | 'cruise': ['crews'], 391 | 'cue': ['kyu', 'queue'], 392 | 'curb': ['kerb'], 393 | 'currant': ['current'], 394 | 'current': ['currant'], 395 | 'cygnet': ['signet'], 396 | 'cymbal': ['cymbol', 'symbol'], 397 | 'cymbol': ['cymbal', 'symbol'], 398 | 'dam': ['damn'], 399 | 'damn': ['dam'], 400 | 'days': ['daze'], 401 | 'daze': ['days'], 402 | 'dear': ['deer'], 403 | 'deer': ['dear'], 404 | 'dense': ['dents'], 405 | 'dents': ['dense'], 406 | 'depravation': ['deprivation'], 407 | 'deprivation': ['depravation'], 408 | 'descent': ['dissent'], 409 | 'desert': ['dessert'], 410 | 'desperate': ['disparate'], 411 | 'dessert': ['desert'], 412 | 'deviser': ['divisor'], 413 | 'dew': ['do', 'due'], 414 | 'die': ['dye'], 415 | 'disburse': ['disperse'], 416 | 'discreet': ['discrete'], 417 | 'discrete': ['discreet'], 418 | 'disparate': ['desperate'], 419 | 'disperse': ['disburse'], 420 | 'dissent': ['descent'], 421 | 'divisor': ['deviser'], 422 | 'do': ['dew', 'due'], 423 | 'doe': ['doh', 'dough'], 424 | 'does': ['doze'], 425 | 'doh': ['doe', 
'dough'], 426 | 'done': ['dun'], 427 | 'dough': ['doe', 'doh'], 428 | 'douse': ['dowse'], 429 | 'dowse': ['douse'], 430 | 'doze': ['does'], 431 | 'draft': ['draught'], 432 | 'draught': ['draft'], 433 | 'dual': ['duel'], 434 | 'due': ['dew', 'do'], 435 | 'duel': ['dual'], 436 | 'dun': ['done'], 437 | 'dye': ['die'], 438 | 'dyeing': ['dying'], 439 | 'dying': ['dyeing'], 440 | 'each': ['either'], 441 | 'earn': ['urn'], 442 | 'eave': ['eve'], 443 | 'ecology': ['environment'], 444 | 'eek': ['eke'], 445 | 'eerie': ['aerie', 'airy'], 446 | 'eery': ['eyrie'], 447 | 'eight': ['8', 'ate'], 448 | 'eighteen': ['18'], 449 | 'eighty': ['80'], 450 | 'eighty-eight': ['88'], 451 | 'eighty-five': ['85'], 452 | 'eighty-four': ['84'], 453 | 'eighty-nine': ['89'], 454 | 'eighty-one': ['81'], 455 | 'eighty-seven': ['87'], 456 | 'eighty-six': ['86'], 457 | 'eighty-three': ['83'], 458 | 'eighty-two': ['82'], 459 | 'either': ['each'], 460 | 'eke': ['eek'], 461 | 'eleven': ['11'], 462 | 'elicit': ['illicit'], 463 | 'elude': ['allude'], 464 | 'eminent': ['imminent'], 465 | 'end': ['an', 'and'], 466 | 'environment': ['ecology'], 467 | 'epic': ['epoch'], 468 | 'epoch': ['epic'], 469 | 'ere': ['air', 'heir'], 470 | 'essay': ['assay'], 471 | 'eve': ['eave'], 472 | 'ewe': ['yew', 'you'], 473 | 'ewes': ['use', 'yews'], 474 | 'exceed': ['accede'], 475 | 'except': ['accept'], 476 | 'excess': ['access'], 477 | 'extant': ['extent'], 478 | 'extent': ['extant'], 479 | 'eye': ['aye', 'i'], 480 | 'eyelet': ['islet'], 481 | 'eyrie': ['eery'], 482 | 'facts': ['fax'], 483 | 'fah': ['far'], 484 | 'fain': ['feign'], 485 | 'faint': ['feint'], 486 | 'fair': ['fare'], 487 | 'fairy': ['ferry'], 488 | 'far': ['fah'], 489 | 'fare': ['fair'], 490 | 'farther': ['father'], 491 | 'father': ['farther'], 492 | 'faun': ['fawn'], 493 | 'fawn': ['faun'], 494 | 'fax': ['facts'], 495 | 'fay': ['fey'], 496 | 'faze': ['phase'], 497 | 'feat': ['feet', 'fete'], 498 | 'feet': ['feat', 'fete'], 499 | 'feign': ['fain'], 500 | 
'feint': ['faint'], 501 | 'ferrule': ['ferule'], 502 | 'ferry': ['fairy'], 503 | 'ferule': ['ferrule'], 504 | 'fete': ['feat', 'feet'], 505 | 'few': ['phew'], 506 | 'fey': ['fay'], 507 | 'fie': ['phi'], 508 | 'fifteen': ['15'], 509 | 'fifty': ['50'], 510 | 'fifty-eight': ['58'], 511 | 'fifty-five': ['55'], 512 | 'fifty-four': ['54'], 513 | 'fifty-nine': ['59'], 514 | 'fifty-one': ['51'], 515 | 'fifty-seven': ['57'], 516 | 'fifty-six': ['56'], 517 | 'fifty-three': ['53'], 518 | 'fifty-two': ['52'], 519 | 'file': ['phial'], 520 | 'find': ['fined'], 521 | 'fined': ['find'], 522 | 'fir': ['fur'], 523 | 'fisher': ['fissure'], 524 | 'fissure': ['fisher'], 525 | 'five': ['5'], 526 | 'fizz': ['phiz'], 527 | 'flair': ['flare'], 528 | 'flare': ['flair'], 529 | 'flaw': ['floor'], 530 | 'flea': ['flee'], 531 | 'flecks': ['flex'], 532 | 'flee': ['flea'], 533 | 'flew': ['flu', 'flue'], 534 | 'flex': ['flecks'], 535 | 'floe': ['flow'], 536 | 'floor': ['flaw'], 537 | 'flour': ['flower'], 538 | 'flow': ['floe'], 539 | 'flower': ['flour'], 540 | 'flu': ['flew', 'flue'], 541 | 'flue': ['flew', 'flu'], 542 | 'foaled': ['fold'], 543 | 'fold': ['foaled'], 544 | 'for': ['4', 'fore', 'forth', 'four', 'fourth'], 545 | 'forbear': ['forebear'], 546 | 'fore': ['4', 'for', 'forth', 'four', 'fourth'], 547 | 'forebear': ['forbear'], 548 | 'foreword': ['forward'], 549 | 'formally': ['formerly'], 550 | 'formerly': ['formally'], 551 | 'fort': ['fought'], 552 | 'forth': ['4', 'for', 'fore', 'four', 'fourth'], 553 | 'forty': ['40'], 554 | 'forty-eight': ['48'], 555 | 'forty-five': ['45'], 556 | 'forty-four': ['44'], 557 | 'forty-nine': ['49'], 558 | 'forty-one': ['41'], 559 | 'forty-seven': ['47'], 560 | 'forty-six': ['46'], 561 | 'forty-three': ['43'], 562 | 'forty-two': ['42'], 563 | 'forward': ['foreword'], 564 | 'fought': ['fort'], 565 | 'foul': ['fowl'], 566 | 'four': ['4', 'for', 'fore', 'forth', 'fourth'], 567 | 'fourteen': ['14'], 568 | 'fourth': ['4', 'for', 'fore', 'forth', 'four'], 569 | 
'fowl': ['foul'], 570 | 'franc': ['frank'], 571 | 'frank': ['franc'], 572 | 'frays': ['phrase'], 573 | 'freeze': ['frieze'], 574 | 'friar': ['fryer'], 575 | 'frieze': ['freeze'], 576 | 'fryer': ['friar'], 577 | 'fur': ['fir'], 578 | 'furs': ['furze'], 579 | 'furze': ['furs'], 580 | 'gaff': ['gaffe'], 581 | 'gaffe': ['gaff'], 582 | 'gage': ['gauge'], 583 | 'gait': ['gate'], 584 | 'galipot': ['gallipot'], 585 | 'gallipot': ['galipot'], 586 | 'gallop': ['galop'], 587 | 'galop': ['gallop'], 588 | 'gamble': ['gambol'], 589 | 'gambol': ['gamble'], 590 | 'gate': ['gait'], 591 | 'gauge': ['gage'], 592 | 'gays': ['gaze'], 593 | 'gaze': ['gays'], 594 | 'gel': ['jell'], 595 | 'gene': ['jean'], 596 | 'genes': ['jeans'], 597 | 'genius': ['genus'], 598 | 'genus': ['genius'], 599 | 'gibe': ['jibe'], 600 | 'gild': ['guild'], 601 | 'gilt': ['guilt'], 602 | 'giro': ['gyro'], 603 | 'gist': ['jest'], 604 | 'glacier': ['glazier'], 605 | 'glazier': ['glacier'], 606 | 'gnaw': ['naw', 'nor'], 607 | 'gneiss': ['nice'], 608 | 'gnu': ['knew', 'new'], 609 | 'gofer': ['gopher'], 610 | 'gopher': ['gofer'], 611 | 'gored': ['gourd'], 612 | 'gorilla': ['guerilla', 'guerrilla'], 613 | 'gourd': ['gored'], 614 | 'grade': ['grate', 'great', 'grid'], 615 | 'grate': ['grade', 'great', 'grid'], 616 | 'graze': ['greys'], 617 | 'grease': ['greece'], 618 | 'great': ['grade', 'grate', 'grid'], 619 | 'greave': ['grieve'], 620 | 'greece': ['grease'], 621 | 'greys': ['graze'], 622 | 'grid': ['grade', 'grate', 'great'], 623 | 'grieve': ['greave'], 624 | 'grill': ['grille'], 625 | 'grille': ['grill'], 626 | 'grisly': ['grizzly'], 627 | 'grizzly': ['grisly'], 628 | 'groan': ['grown'], 629 | 'grown': ['groan'], 630 | 'guarantee': ['guaranty'], 631 | 'guaranty': ['guarantee'], 632 | 'guerilla': ['gorilla', 'guerrilla'], 633 | 'guerrilla': ['gorilla', 'guerilla'], 634 | 'guessed': ['guest'], 635 | 'guest': ['guessed'], 636 | 'guild': ['gild'], 637 | 'guilt': ['gilt'], 638 | 'guise': ['guys'], 639 | 'guys': ['guise'], 
640 | 'gyro': ['giro'], 641 | 'hail': ['hale'], 642 | 'hair': ['hare'], 643 | 'hairier': ['harrier'], 644 | 'hale': ['hail'], 645 | 'hall': ['haul'], 646 | 'halve': ['have'], 647 | 'handsome': ['hansom'], 648 | 'hangar': ['hanger'], 649 | 'hanger': ['hangar'], 650 | 'hansom': ['handsome'], 651 | 'hare': ['hair'], 652 | 'harrier': ['hairier'], 653 | 'hart': ['heart'], 654 | 'haul': ['hall'], 655 | 'have': ['halve'], 656 | 'haw': ['hoar', 'whore'], 657 | 'hay': ['hey'], 658 | "he'd": ['heed'], 659 | "he'll": ['heal', 'heel'], 660 | 'heal': ["he'll", 'heel'], 661 | 'hear': ['here'], 662 | 'heard': ['herd'], 663 | 'heart': ['hart'], 664 | 'heed': ["he'd"], 665 | 'heel': ["he'll", 'heal'], 666 | 'heir': ['air', 'ere'], 667 | 'herd': ['heard'], 668 | 'here': ['hear'], 669 | 'heroin': ['heroine'], 670 | 'heroine': ['heroin'], 671 | 'hew': ['hue'], 672 | 'hey': ['hay'], 673 | 'hi': ['high'], 674 | 'high': ['hi'], 675 | 'higher': ['hire'], 676 | 'him': ['hymn'], 677 | 'hire': ['higher'], 678 | 'ho': ['hoe'], 679 | 'hoar': ['haw', 'whore'], 680 | 'hoard': ['horde'], 681 | 'hoarse': ['horse'], 682 | 'hoe': ['ho'], 683 | 'hoes': ['hose'], 684 | 'hole': ['whole'], 685 | 'holey': ['holy', 'wholly'], 686 | 'holy': ['holey', 'wholly'], 687 | 'hoop': ['whoop'], 688 | 'horde': ['hoard'], 689 | 'horse': ['hoarse'], 690 | 'hose': ['hoes'], 691 | 'hostel': ['hostile'], 692 | 'hostile': ['hostel'], 693 | 'hour': ['our'], 694 | 'hue': ['hew'], 695 | 'humerus': ['humorous'], 696 | 'humorous': ['humerus'], 697 | 'hurdle': ['hurtle'], 698 | 'hurtle': ['hurdle'], 699 | 'hymn': ['him'], 700 | 'hypercritical': ['hypocritical'], 701 | 'hypocritical': ['hypercritical'], 702 | 'i': ['aye', 'eye'], 703 | "i'll": ['aisle', 'isle'], 704 | 'idle': ['idol', 'idyll'], 705 | 'idol': ['idle', 'idyll'], 706 | 'idyll': ['idle', 'idol'], 707 | 'illicit': ['elicit'], 708 | 'illusion': ['allusion'], 709 | 'imminent': ['eminent'], 710 | 'in': ['inn'], 711 | 'incidence': ['incidents'], 712 | 'incidents': 
['incidence'], 713 | 'incite': ['insight'], 714 | 'incredible': ['incredulous'], 715 | 'incredulous': ['incredible'], 716 | 'indict': ['indite'], 717 | 'indite': ['indict'], 718 | 'inequity': ['iniquity'], 719 | 'ingenious': ['ingenuous'], 720 | 'ingenuous': ['ingenious'], 721 | 'iniquity': ['inequity'], 722 | 'inn': ['in'], 723 | 'insight': ['incite'], 724 | 'intense': ['intents'], 725 | 'intents': ['intense'], 726 | 'interstate': ['intrastate'], 727 | 'intrastate': ['interstate'], 728 | 'isle': ['aisle', "i'll"], 729 | 'islet': ['eyelet'], 730 | "it's": ['its'], 731 | 'its': ["it's"], 732 | 'jalousie': ['jealousy'], 733 | 'jam': ['jamb'], 734 | 'jamb': ['jam'], 735 | 'jealousy': ['jalousie'], 736 | 'jean': ['gene'], 737 | 'jeans': ['genes'], 738 | 'jell': ['gel'], 739 | 'jest': ['gist'], 740 | 'jewel': ['joule'], 741 | 'jibe': ['gibe'], 742 | 'joule': ['jewel'], 743 | 'judicial': ['judicious'], 744 | 'judicious': ['judicial'], 745 | 'kerb': ['curb'], 746 | 'kernel': ['colonel'], 747 | 'key': ['quay'], 748 | 'kill': ['kiln'], 749 | 'kiln': ['kill'], 750 | 'knave': ['nave'], 751 | 'knead': ['kneed', 'need'], 752 | 'kneed': ['knead', 'need'], 753 | 'knew': ['gnu', 'new'], 754 | 'knight': ['night'], 755 | 'knit': ['nit'], 756 | 'knob': ['nob'], 757 | 'knock': ['nock'], 758 | 'knot': ['not'], 759 | 'know': ['no'], 760 | 'knows': ['nose'], 761 | 'kohl': ['coal'], 762 | 'kyu': ['cue', 'queue'], 763 | 'laager': ['lager'], 764 | 'lac': ['lack'], 765 | 'lack': ['lac'], 766 | 'lacks': ['lax'], 767 | 'lade': ['laid'], 768 | 'lager': ['laager'], 769 | 'laid': ['lade'], 770 | 'lain': ['lane'], 771 | 'lam': ['lamb'], 772 | 'lama': ['llama'], 773 | 'lamb': ['lam'], 774 | 'lane': ['lain'], 775 | 'laps': ['lapse'], 776 | 'lapse': ['laps'], 777 | 'larva': ['lava'], 778 | 'lase': ['laze'], 779 | 'lava': ['larva'], 780 | 'law': ['lore'], 781 | 'lax': ['lacks'], 782 | 'lay': ['lei', 'ley'], 783 | 'laze': ['lase'], 784 | 'lea': ['lee'], 785 | 'leach': ['leech'], 786 | 'lead': ['led'], 
787 | 'leak': ['leek'], 788 | 'lean': ['lien'], 789 | 'leased': ['least'], 790 | 'least': ['leased'], 791 | 'led': ['lead'], 792 | 'lee': ['lea'], 793 | 'leech': ['leach'], 794 | 'leek': ['leak'], 795 | 'lei': ['lay', 'ley'], 796 | 'lessen': ['lesson'], 797 | 'lesser': ['lessor'], 798 | 'lesson': ['lessen'], 799 | 'lessor': ['lesser'], 800 | 'levee': ['levy'], 801 | 'levy': ['levee'], 802 | 'ley': ['lay', 'lei'], 803 | 'liable': ['libel'], 804 | 'liar': ['lyre'], 805 | 'libel': ['liable'], 806 | 'licence': ['license'], 807 | 'license': ['licence'], 808 | 'lichen': ['liken'], 809 | 'licker': ['liquor'], 810 | 'lie': ['lye'], 811 | 'lien': ['lean'], 812 | 'lieu': ['loo'], 813 | 'liken': ['lichen'], 814 | 'links': ['lynx'], 815 | 'liquor': ['licker'], 816 | 'literal': ['littoral'], 817 | 'littoral': ['literal'], 818 | 'llama': ['lama'], 819 | 'lo': ['low'], 820 | 'load': ['lode'], 821 | 'loan': ['lone'], 822 | 'locks': ['lox'], 823 | 'lode': ['load'], 824 | 'lone': ['loan'], 825 | 'loo': ['lieu'], 826 | 'loop': ['loupe'], 827 | 'loot': ['lute'], 828 | 'lore': ['law'], 829 | 'loupe': ['loop'], 830 | 'low': ['lo'], 831 | 'lox': ['locks'], 832 | 'lute': ['loot'], 833 | 'lye': ['lie'], 834 | 'lynx': ['links'], 835 | 'lyre': ['liar'], 836 | 'macintosh': ['mackintosh', 'mcintosh'], 837 | 'mackintosh': ['macintosh', 'mcintosh'], 838 | 'made': ['maid'], 839 | 'magnate': ['magnet'], 840 | 'magnet': ['magnate'], 841 | 'magnificent': ['munificent'], 842 | 'maid': ['made'], 843 | 'mail': ['male'], 844 | 'main': ['mane'], 845 | 'maize': ['maze'], 846 | 'male': ['mail'], 847 | 'mall': ['maul'], 848 | 'mane': ['main'], 849 | 'manikin': ['mannequin'], 850 | 'manna': ['manner', 'manor'], 851 | 'mannequin': ['manikin'], 852 | 'manner': ['manna', 'manor'], 853 | 'manor': ['manna', 'manner'], 854 | 'mantel': ['mantle'], 855 | 'mantle': ['mantel'], 856 | 'mare': ['mayor'], 857 | 'marital': ['marshal', 'marshall', 'martial'], 858 | 'mark': ['marque'], 859 | 'marque': ['mark'], 860 | 
'marry': ['material', 'materiel', 'merry'], 861 | 'marshal': ['marital', 'marshall', 'martial'], 862 | 'marshall': ['marital', 'marshal', 'martial'], 863 | 'marten': ['martian', 'martin'], 864 | 'martial': ['marital', 'marshal', 'marshall'], 865 | 'martian': ['marten', 'martin'], 866 | 'martin': ['marten', 'martian'], 867 | 'mask': ['masque'], 868 | 'masque': ['mask'], 869 | 'massed': ['mast'], 870 | 'mast': ['massed'], 871 | 'material': ['marry', 'materiel', 'merry'], 872 | 'materiel': ['marry', 'material', 'merry'], 873 | 'maul': ['mall'], 874 | 'maw': ['moor', 'more'], 875 | 'mayor': ['mare'], 876 | 'maze': ['maize'], 877 | 'mcintosh': ['macintosh', 'mackintosh'], 878 | 'me': ['mi'], 879 | 'mean': ['mien'], 880 | 'meat': ['meet', 'mete'], 881 | 'medal': ['meddle', 'metal', 'mettle'], 882 | 'meddle': ['medal', 'metal', 'mettle'], 883 | 'median': ['average', 'normal'], 884 | 'meet': ['meat', 'mete'], 885 | 'merry': ['marry', 'material', 'materiel'], 886 | 'metal': ['medal', 'meddle', 'mettle'], 887 | 'mete': ['meat', 'meet'], 888 | 'meter': ['metre'], 889 | 'metre': ['meter'], 890 | 'mettle': ['medal', 'meddle', 'metal'], 891 | 'mewl': ['mule'], 892 | 'mews': ['muse'], 893 | 'mi': ['me'], 894 | 'mien': ['mean'], 895 | 'might': ['mite'], 896 | 'mil': ['mill'], 897 | 'mill': ['mil'], 898 | 'millinary': ['millinery'], 899 | 'millinery': ['millinary'], 900 | 'mince': ['mints'], 901 | 'mind': ['mined'], 902 | 'mined': ['mind'], 903 | 'miner': ['minor', 'mynah'], 904 | 'minor': ['miner', 'mynah'], 905 | 'mints': ['mince'], 906 | 'missal': ['missile'], 907 | 'missed': ['mist'], 908 | 'missile': ['missal'], 909 | 'mist': ['missed'], 910 | 'mite': ['might'], 911 | 'moan': ['mown'], 912 | 'moat': ['mote'], 913 | 'mode': ['mowed'], 914 | 'moor': ['maw', 'more'], 915 | 'moose': ['mousse'], 916 | 'more': ['maw', 'moor'], 917 | 'morn': ['mourn'], 918 | 'morning': ['mourning'], 919 | 'mote': ['moat'], 920 | 'mourn': ['morn'], 921 | 'mourning': ['morning'], 922 | 'mousse': 
['moose'], 923 | 'mouton': ['mutton'], 924 | 'mowed': ['mode'], 925 | 'mown': ['moan'], 926 | 'mule': ['mewl'], 927 | 'munificent': ['magnificent'], 928 | 'muscle': ['mussel', 'muzzle'], 929 | 'muse': ['mews'], 930 | 'mussel': ['muscle', 'muzzle'], 931 | 'mustard': ['mustered'], 932 | 'mustered': ['mustard'], 933 | 'mutton': ['mouton'], 934 | 'muzzle': ['muscle', 'mussel'], 935 | 'mynah': ['miner', 'minor'], 936 | 'naval': ['navel'], 937 | 'nave': ['knave'], 938 | 'navel': ['naval'], 939 | 'naw': ['gnaw', 'nor'], 940 | 'nay': ['neigh'], 941 | 'need': ['knead', 'kneed'], 942 | 'neigh': ['nay'], 943 | 'new': ['gnu', 'knew'], 944 | 'nice': ['gneiss'], 945 | 'nicks': ['nix'], 946 | 'nigh': ['nye'], 947 | 'night': ['knight'], 948 | 'nine': ['9'], 949 | 'nineteen': ['19'], 950 | 'ninety': ['90'], 951 | 'ninety-eight': ['98'], 952 | 'ninety-five': ['95'], 953 | 'ninety-four': ['94'], 954 | 'ninety-nine': ['99'], 955 | 'ninety-one': ['91'], 956 | 'ninety-seven': ['97'], 957 | 'ninety-six': ['96'], 958 | 'ninety-three': ['93'], 959 | 'ninety-two': ['92'], 960 | 'nit': ['knit'], 961 | 'nix': ['nicks'], 962 | 'no': ['know'], 963 | 'nob': ['knob'], 964 | 'nock': ['knock'], 965 | 'none': ['nun'], 966 | 'nor': ['gnaw', 'naw'], 967 | 'normal': ['average', 'median'], 968 | 'nose': ['knows'], 969 | 'not': ['knot'], 970 | 'nun': ['none'], 971 | 'nye': ['nigh'], 972 | 'oar': ['awe', 'oh', 'or', 'ore', 'owe'], 973 | 'od': ['odd'], 974 | 'odd': ['od'], 975 | 'ode': ['owed'], 976 | 'official': ['officious'], 977 | 'officious': ['official'], 978 | 'oh': ['awe', 'oar', 'or', 'ore', 'owe'], 979 | 'one': ['1', 'won'], 980 | 'one hundred': ['100'], 981 | 'or': ['awe', 'oar', 'oh', 'ore', 'owe'], 982 | 'oracle': ['auricle'], 983 | 'oral': ['aural'], 984 | 'orc': ['auk'], 985 | 'ore': ['awe', 'oar', 'oh', 'or', 'owe'], 986 | 'oscillate': ['osculate'], 987 | 'osculate': ['oscillate'], 988 | 'ought': ['aught'], 989 | 'our': ['hour'], 990 | 'overdo': ['overdue'], 991 | 'overdue': ['overdo'], 992 
| 'overseas': ['oversees'], 993 | 'oversees': ['overseas'], 994 | 'owe': ['awe', 'oar', 'oh', 'or', 'ore'], 995 | 'owed': ['ode'], 996 | 'paced': ['paste'], 997 | 'packed': ['pact'], 998 | 'packs': ['pax'], 999 | 'pact': ['packed'], 1000 | 'paean': ['peon'], 1001 | 'pail': ['pale'], 1002 | 'pain': ['pane'], 1003 | 'pair': ['pare', 'pear'], 1004 | 'palate': ['palette', 'pallet'], 1005 | 'pale': ['pail'], 1006 | 'palette': ['palate', 'pallet'], 1007 | 'pall': ['pawl'], 1008 | 'pallet': ['palate', 'palette'], 1009 | 'paltry': ['poultry'], 1010 | 'pane': ['pain'], 1011 | 'parameter': ['perimeter'], 1012 | 'pare': ['pair', 'pear'], 1013 | 'parish': ['perish'], 1014 | 'pascal': ['paschal'], 1015 | 'paschal': ['pascal'], 1016 | 'passed': ['past'], 1017 | 'past': ['passed'], 1018 | 'paste': ['paced'], 1019 | 'paten': ['patten', 'pattern'], 1020 | 'patience': ['patients'], 1021 | 'patients': ['patience'], 1022 | 'patten': ['paten', 'pattern'], 1023 | 'pattern': ['paten', 'patten'], 1024 | 'paul': ['pole', 'poll', 'pull'], 1025 | 'pause': ['paws', 'pores', 'pours'], 1026 | 'pawl': ['pall'], 1027 | 'pawn': ['porn'], 1028 | 'paws': ['pause', 'pores', 'pours'], 1029 | 'pax': ['packs'], 1030 | 'pea': ['pee'], 1031 | 'peace': ['piece'], 1032 | 'peak': ['peek', 'peke', 'pique'], 1033 | 'peal': ['peel'], 1034 | 'pear': ['pair', 'pare'], 1035 | 'pearl': ['purl'], 1036 | 'pedal': ['peddle'], 1037 | 'peddle': ['pedal'], 1038 | 'pee': ['pea'], 1039 | 'peek': ['peak', 'peke', 'pique'], 1040 | 'peel': ['peal'], 1041 | 'peer': ['pier', 'pure'], 1042 | 'peke': ['peak', 'peek', 'pique'], 1043 | 'peon': ['paean'], 1044 | 'peremptory': ['pre-emptory'], 1045 | 'perimeter': ['parameter'], 1046 | 'perish': ['parish'], 1047 | 'perquisite': ['prerequisite'], 1048 | 'persecute': ['prosecute'], 1049 | 'personal': ['personnel'], 1050 | 'personnel': ['personal'], 1051 | 'perspective': ['prospective'], 1052 | 'petit': ['petite', 'petty'], 1053 | 'petite': ['petit', 'petty'], 1054 | 'petty': ['petit', 
'petite'], 1055 | 'phase': ['faze'], 1056 | 'phew': ['few'], 1057 | 'phi': ['fie'], 1058 | 'phial': ['file'], 1059 | 'phiz': ['fizz'], 1060 | 'phrase': ['frays'], 1061 | 'physic': ['physique', 'psychic'], 1062 | 'physique': ['physic', 'psychic'], 1063 | 'pi': ['pie'], 1064 | 'pica': ['pika'], 1065 | 'pie': ['pi'], 1066 | 'piece': ['peace'], 1067 | 'pier': ['peer', 'pure'], 1068 | 'pika': ['pica'], 1069 | 'pique': ['peak', 'peek', 'peke'], 1070 | 'place': ['plaice'], 1071 | 'plaice': ['place'], 1072 | 'plain': ['plane'], 1073 | 'plait': ['plate'], 1074 | 'plane': ['plain'], 1075 | 'plate': ['plait'], 1076 | 'pleas': ['please'], 1077 | 'please': ['pleas'], 1078 | 'plum': ['plumb'], 1079 | 'plumb': ['plum'], 1080 | 'pole': ['paul', 'poll', 'pull'], 1081 | 'policy': ['polity'], 1082 | 'polity': ['policy'], 1083 | 'poll': ['paul', 'pole', 'pull'], 1084 | 'poof': ['pouffe'], 1085 | 'poor': ['pore', 'pour'], 1086 | 'poplar': ['popular'], 1087 | 'populace': ['populous'], 1088 | 'popular': ['poplar'], 1089 | 'populous': ['populace'], 1090 | 'pore': ['poor', 'pour'], 1091 | 'pores': ['pause', 'paws', 'pours'], 1092 | 'porn': ['pawn'], 1093 | 'pouffe': ['poof'], 1094 | 'poultry': ['paltry'], 1095 | 'pour': ['poor', 'pore'], 1096 | 'pours': ['pause', 'paws', 'pores'], 1097 | 'practice': ['practise'], 1098 | 'practise': ['practice'], 1099 | 'praise': ['prays', 'preys'], 1100 | 'pray': ['prey'], 1101 | 'prays': ['praise', 'preys'], 1102 | 'pre-emptory': ['peremptory'], 1103 | 'precede': ['proceed'], 1104 | 'prerequisite': ['perquisite'], 1105 | 'prescribe': ['proscribe'], 1106 | 'presence': ['presents'], 1107 | 'presentiment': ['presentment'], 1108 | 'presentment': ['presentiment'], 1109 | 'presents': ['presence'], 1110 | 'prey': ['pray'], 1111 | 'preys': ['praise', 'prays'], 1112 | 'pride': ['pried'], 1113 | 'pried': ['pride'], 1114 | 'pries': ['prize'], 1115 | 'primer': ['primmer'], 1116 | 'primmer': ['primer'], 1117 | 'prince': ['prints'], 1118 | 'principal': ['principle'], 
1119 | 'principle': ['principal'], 1120 | 'prints': ['prince'], 1121 | 'prize': ['pries'], 1122 | 'proceed': ['precede'], 1123 | 'profit': ['prophet'], 1124 | 'prone': ['supine'], 1125 | 'prophecy': ['prophesy'], 1126 | 'prophesy': ['prophecy'], 1127 | 'prophet': ['profit'], 1128 | 'propose': ['purpose'], 1129 | 'proscribe': ['prescribe'], 1130 | 'prosecute': ['persecute'], 1131 | 'prospective': ['perspective'], 1132 | 'prostate': ['prostrate'], 1133 | 'prostrate': ['prostate'], 1134 | 'psychic': ['physic', 'physique'], 1135 | 'pull': ['paul', 'pole', 'poll'], 1136 | 'pure': ['peer', 'pier'], 1137 | 'purl': ['pearl'], 1138 | 'purpose': ['propose'], 1139 | 'put': ['putt'], 1140 | 'putt': ['put'], 1141 | 'quarts': ['quartz'], 1142 | 'quartz': ['quarts'], 1143 | 'quay': ['key'], 1144 | 'quean': ['queen'], 1145 | 'queen': ['quean'], 1146 | 'queue': ['cue', 'kyu'], 1147 | 'quire': ['choir'], 1148 | 'r': ['are'], 1149 | 'rabbet': ['rabbit'], 1150 | 'rabbit': ['rabbet'], 1151 | 'rack': ['wrack'], 1152 | 'rain': ['reign', 'rein'], 1153 | 'raise': ['rays', 'raze'], 1154 | 'rap': ['rapped', 'rapt', 'wrap', 'wrapped'], 1155 | 'rapped': ['rap', 'rapt', 'wrap', 'wrapped'], 1156 | 'rapt': ['rap', 'rapped', 'wrap', 'wrapped'], 1157 | 'rate': ['right', 'rite', 'wright', 'write'], 1158 | 'raw': ['roar'], 1159 | 'rays': ['raise', 'raze'], 1160 | 'raze': ['raise', 'rays'], 1161 | 'read': ['red', 'reed'], 1162 | 'real': ['reel'], 1163 | 'reality': ['realty'], 1164 | 'realty': ['reality'], 1165 | 'red': ['read', 'reed'], 1166 | 'reed': ['read', 'red'], 1167 | 'reek': ['wreak'], 1168 | 'reel': ['real'], 1169 | 'register': ['registrar'], 1170 | 'registrar': ['register'], 1171 | 'reign': ['rain', 'rein'], 1172 | 'rein': ['rain', 'reign'], 1173 | 'reluctant': ['reticent'], 1174 | 'residence': ['residents'], 1175 | 'residents': ['residence'], 1176 | 'rest': ['rust', 'wrest'], 1177 | 'retch': ['wretch'], 1178 | 'reticent': ['reluctant'], 1179 | 'review': ['revue'], 1180 | 'revue': 
['review'], 1181 | 'rheum': ['room'], 1182 | 'rho': ['roe', 'row'], 1183 | 'riffle': ['rifle'], 1184 | 'rifle': ['riffle'], 1185 | 'rigger': ['rigor'], 1186 | 'right': ['rate', 'rite', 'wright', 'write'], 1187 | 'rigor': ['rigger'], 1188 | 'ring': ['wring'], 1189 | 'rite': ['rate', 'right', 'wright', 'write'], 1190 | 'road': ['rode', 'rowed'], 1191 | 'roar': ['raw'], 1192 | 'rode': ['road', 'rowed'], 1193 | 'roe': ['rho', 'row'], 1194 | 'roil': ['royal'], 1195 | 'role': ['roll'], 1196 | 'roll': ['role'], 1197 | 'roo': ['roux', 'rue'], 1198 | 'rood': ['rude', 'rued'], 1199 | 'room': ['rheum'], 1200 | 'roomer': ['rumour'], 1201 | 'root': ['route'], 1202 | 'rose': ['rouse', 'rows'], 1203 | 'rota': ['rotor'], 1204 | 'rote': ['wrote'], 1205 | 'rotor': ['rota'], 1206 | 'rough': ['ruff'], 1207 | 'rouse': ['rose', 'rows'], 1208 | 'route': ['root'], 1209 | 'roux': ['roo', 'rue'], 1210 | 'row': ['rho', 'roe'], 1211 | 'rowed': ['road', 'rode'], 1212 | 'rows': ['rose', 'rouse'], 1213 | 'royal': ['roil'], 1214 | 'rude': ['rood', 'rued'], 1215 | 'rue': ['roo', 'roux'], 1216 | 'rued': ['rood', 'rude'], 1217 | 'ruff': ['rough'], 1218 | 'ruin': ['rune'], 1219 | 'rumour': ['roomer'], 1220 | 'rune': ['ruin'], 1221 | 'rung': ['wrung'], 1222 | 'rust': ['rest', 'wrest'], 1223 | 'rye': ['wry'], 1224 | 'sac': ['sack'], 1225 | 'sachet': ['sashay'], 1226 | 'sack': ['sac'], 1227 | 'sail': ['sale'], 1228 | 'sale': ['sail'], 1229 | 'sane': ['seine'], 1230 | 'sanitarium': ['sanitorium'], 1231 | 'sanitorium': ['sanitarium'], 1232 | 'sashay': ['sachet'], 1233 | 'satire': ['satyr'], 1234 | 'satyr': ['satire'], 1235 | 'sauce': ['source'], 1236 | 'saver': ['savour'], 1237 | 'savour': ['saver'], 1238 | 'saw': ['sew', 'so', 'soar', 'sore', 'sow'], 1239 | 'scene': ['seen'], 1240 | 'scent': ['cent', 'sent'], 1241 | 'scull': ['skull'], 1242 | 'sea': ['see'], 1243 | 'sealing': ['ceiling'], 1244 | 'seam': ['seem'], 1245 | 'seaman': ['semen'], 1246 | 'sear': ['seer', 'sere'], 1247 | 'seas': ['sees', 
'seize'], 1248 | 'see': ['sea'], 1249 | 'seed': ['cede'], 1250 | 'seem': ['seam'], 1251 | 'seen': ['scene'], 1252 | 'seer': ['sear', 'sere'], 1253 | 'sees': ['seas', 'seize'], 1254 | 'seine': ['sane'], 1255 | 'seize': ['seas', 'sees'], 1256 | 'sell': ['cell'], 1257 | 'seller': ['cellar'], 1258 | 'semen': ['seaman'], 1259 | 'sense': ['census'], 1260 | 'sensor': ['censer', 'censor', 'censure'], 1261 | 'sent': ['cent', 'scent'], 1262 | 'sere': ['sear', 'seer'], 1263 | 'serf': ['surf'], 1264 | 'serge': ['surge'], 1265 | 'serial': ['cereal'], 1266 | 'session': ['cession'], 1267 | 'seven': ['7'], 1268 | 'seventeen': ['17'], 1269 | 'seventy': ['70'], 1270 | 'seventy-eight': ['78'], 1271 | 'seventy-five': ['75'], 1272 | 'seventy-four': ['74'], 1273 | 'seventy-nine': ['79'], 1274 | 'seventy-one': ['71'], 1275 | 'seventy-seven': ['77'], 1276 | 'seventy-six': ['76'], 1277 | 'seventy-three': ['73'], 1278 | 'seventy-two': ['72'], 1279 | 'sew': ['saw', 'so', 'soar', 'sore', 'sow'], 1280 | 'shake': ['sheikh'], 1281 | 'shanty': ['chantey'], 1282 | 'shear': ['shearn', 'sheer'], 1283 | 'shearn': ['shear', 'sheer'], 1284 | 'sheer': ['shear', 'shearn'], 1285 | 'sheik': ['chic'], 1286 | 'sheikh': ['shake'], 1287 | 'shoe': ['shoo'], 1288 | 'shone': ['shown'], 1289 | 'shoo': ['shoe'], 1290 | 'shoot': ['chute'], 1291 | 'shown': ['shone'], 1292 | 'sic': ['sick'], 1293 | 'sick': ['sic'], 1294 | 'side': ['sighed'], 1295 | 'sighed': ['side'], 1296 | 'sighs': ['size'], 1297 | 'sight': ['cite', 'site'], 1298 | 'sign': ['sine'], 1299 | 'signet': ['cygnet'], 1300 | 'sine': ['sign'], 1301 | 'sink': ['synch'], 1302 | 'site': ['cite', 'sight'], 1303 | 'six': ['6'], 1304 | 'sixteen': ['16'], 1305 | 'sixty': ['60'], 1306 | 'sixty-eight': ['68'], 1307 | 'sixty-five': ['65'], 1308 | 'sixty-four': ['64'], 1309 | 'sixty-nine': ['69'], 1310 | 'sixty-one': ['61'], 1311 | 'sixty-seven': ['67'], 1312 | 'sixty-six': ['66'], 1313 | 'sixty-three': ['63'], 1314 | 'sixty-two': ['62'], 1315 | 'size': ['sighs'], 
1316 | 'skull': ['scull'], 1317 | 'slay': ['sleigh'], 1318 | 'sleigh': ['slay'], 1319 | 'sleight': ['slight'], 1320 | 'slight': ['sleight'], 1321 | 'sloe': ['slow'], 1322 | 'slow': ['sloe'], 1323 | 'so': ['saw', 'sew', 'soar', 'sore', 'sow'], 1324 | 'soar': ['saw', 'sew', 'so', 'sore', 'sow'], 1325 | 'soared': ['sward', 'sword'], 1326 | 'sol': ['sole', 'soul'], 1327 | 'sold': ['soled'], 1328 | 'sole': ['sol', 'soul'], 1329 | 'soled': ['sold'], 1330 | 'some': ['sum'], 1331 | 'son': ['sun'], 1332 | 'sore': ['saw', 'sew', 'so', 'soar', 'sow'], 1333 | 'sort': ['sought'], 1334 | 'sought': ['sort'], 1335 | 'soul': ['sol', 'sole'], 1336 | 'source': ['sauce'], 1337 | 'sow': ['saw', 'sew', 'so', 'soar', 'sore'], 1338 | 'spa': ['spar'], 1339 | 'spade': ['spayed'], 1340 | 'spar': ['spa'], 1341 | 'spayed': ['spade'], 1342 | 'spoor': ['spore'], 1343 | 'spore': ['spoor'], 1344 | 'staid': ['stayed'], 1345 | 'stair': ['stare'], 1346 | 'stairs': ['stares'], 1347 | 'stake': ['steak'], 1348 | 'stalk': ['stork'], 1349 | 'stare': ['stair'], 1350 | 'stares': ['stairs'], 1351 | 'stationary': ['stationery'], 1352 | 'stationery': ['stationary'], 1353 | 'stayed': ['staid'], 1354 | 'steak': ['stake'], 1355 | 'steal': ['steel'], 1356 | 'steel': ['steal'], 1357 | 'step': ['steppe'], 1358 | 'steppe': ['step'], 1359 | 'stile': ['sty', 'style'], 1360 | 'storey': ['story'], 1361 | 'stork': ['stalk'], 1362 | 'story': ['storey'], 1363 | 'straight': ['strait'], 1364 | 'strait': ['straight'], 1365 | 'sty': ['stile', 'style'], 1366 | 'style': ['stile', 'sty'], 1367 | 'succour': ['sucker'], 1368 | 'sucker': ['succour'], 1369 | 'suit': ['suite', 'sweet'], 1370 | 'suite': ['suit', 'sweet'], 1371 | 'sum': ['some'], 1372 | 'summary': ['summery'], 1373 | 'summery': ['summary'], 1374 | 'sun': ['son'], 1375 | 'supine': ['prone'], 1376 | 'surf': ['serf'], 1377 | 'surge': ['serge'], 1378 | 'sward': ['soared', 'sword'], 1379 | 'swat': ['swot'], 1380 | 'sweet': ['suit', 'suite'], 1381 | 'sword': ['soared', 
'sward'], 1382 | 'swot': ['swat'], 1383 | 'symbol': ['cymbal', 'cymbol'], 1384 | 'synch': ['sink'], 1385 | 'tacet': ['tacit'], 1386 | 'tacit': ['tacet'], 1387 | 'tacked': ['tact'], 1388 | 'tacks': ['tax'], 1389 | 'tact': ['tacked'], 1390 | 'tail': ['tale'], 1391 | 'take': ['bring'], 1392 | 'tale': ['tail'], 1393 | 'talesman': ['talisman'], 1394 | 'talisman': ['talesman'], 1395 | 'talk': ['torque'], 1396 | 'taper': ['tapir'], 1397 | 'tapir': ['taper'], 1398 | 'tare': ['tear', 'tier'], 1399 | 'tasteful': ['tasty'], 1400 | 'tasty': ['tasteful'], 1401 | 'taught': ['taut', 'tort'], 1402 | 'taupe': ['tope'], 1403 | 'taut': ['taught', 'tort'], 1404 | 'tax': ['tacks'], 1405 | 'te': ['tea', 'tee'], 1406 | 'tea': ['te', 'tee'], 1407 | 'team': ['teem'], 1408 | 'tear': ['tare', 'tier'], 1409 | 'teas': ['tease'], 1410 | 'tease': ['teas'], 1411 | 'tee': ['te', 'tea'], 1412 | 'teem': ['team'], 1413 | 'ten': ['10'], 1414 | 'tense': ['tents'], 1415 | 'tents': ['tense'], 1416 | 'terce': ['terse'], 1417 | 'tern': ['turn'], 1418 | 'terse': ['terce'], 1419 | 'than': ['then'], 1420 | 'their': ['there', "they're"], 1421 | 'then': ['than'], 1422 | 'there': ['their', "they're"], 1423 | "they're": ['their', 'there'], 1424 | 'thirteen': ['13'], 1425 | 'thirty': ['30'], 1426 | 'thirty-eight': ['38'], 1427 | 'thirty-five': ['35'], 1428 | 'thirty-four': ['34'], 1429 | 'thirty-nine': ['39'], 1430 | 'thirty-one': ['31'], 1431 | 'thirty-seven': ['37'], 1432 | 'thirty-six': ['36'], 1433 | 'thirty-three': ['33'], 1434 | 'thirty-two': ['32'], 1435 | 'three': ['3'], 1436 | 'threw': ['through'], 1437 | 'throe': ['throw'], 1438 | 'throes': ['throws'], 1439 | 'throne': ['thrown'], 1440 | 'through': ['threw'], 1441 | 'throw': ['throe'], 1442 | 'thrown': ['throne'], 1443 | 'throws': ['throes'], 1444 | 'thyme': ['time'], 1445 | 'tic': ['tick'], 1446 | 'tick': ['tic'], 1447 | 'tide': ['tied'], 1448 | 'tied': ['tide'], 1449 | 'tier': ['tare', 'tear'], 1450 | 'time': ['thyme'], 1451 | 'tire': ['tyre'], 1452 | 
'to': ['2', 'toe', 'too', 'tow', 'two'], 1453 | 'toad': ['toed', 'towed'], 1454 | 'tocsin': ['toxin'], 1455 | 'toe': ['2', 'to', 'too', 'tow', 'two'], 1456 | 'toed': ['toad', 'towed'], 1457 | 'told': ['tolled'], 1458 | 'tole': ['toll'], 1459 | 'toll': ['tole'], 1460 | 'tolled': ['told'], 1461 | 'ton': ['tun'], 1462 | 'too': ['2', 'to', 'toe', 'tow', 'two'], 1463 | 'tool': ['tulle'], 1464 | 'tope': ['taupe'], 1465 | 'tor': ['tore'], 1466 | 'tore': ['tor'], 1467 | 'torque': ['talk'], 1468 | 'tort': ['taught', 'taut'], 1469 | 'tortuous': ['torturous'], 1470 | 'torturous': ['tortuous'], 1471 | 'tough': ['tuff'], 1472 | 'tow': ['2', 'to', 'toe', 'too', 'two'], 1473 | 'towed': ['toad', 'toed'], 1474 | 'toxin': ['tocsin'], 1475 | 'track': ['tracked', 'tract'], 1476 | 'tracked': ['track', 'tract'], 1477 | 'tract': ['track', 'tracked'], 1478 | 'tray': ['trey'], 1479 | 'trey': ['tray'], 1480 | 'troop': ['troupe'], 1481 | 'troupe': ['troop'], 1482 | 'trussed': ['trust'], 1483 | 'trust': ['trussed'], 1484 | 'trustee': ['trusty'], 1485 | 'trusty': ['trustee'], 1486 | 'tuba': ['tuber'], 1487 | 'tuber': ['tuba'], 1488 | 'tuff': ['tough'], 1489 | 'tulle': ['tool'], 1490 | 'tun': ['ton'], 1491 | 'turban': ['turbine'], 1492 | 'turbine': ['turban'], 1493 | 'turn': ['tern'], 1494 | 'twelve': ['12'], 1495 | 'twenty': ['20'], 1496 | 'twenty-eight': ['28'], 1497 | 'twenty-five': ['25'], 1498 | 'twenty-four': ['24'], 1499 | 'twenty-nine': ['29'], 1500 | 'twenty-one': ['21'], 1501 | 'twenty-seven': ['27'], 1502 | 'twenty-six': ['26'], 1503 | 'twenty-three': ['23'], 1504 | 'twenty-two': ['22'], 1505 | 'two': ['2', 'to', 'toe', 'too', 'tow'], 1506 | 'tyre': ['tire'], 1507 | 'undo': ['undue'], 1508 | 'undue': ['undo'], 1509 | 'up': ['upped'], 1510 | 'upped': ['up'], 1511 | 'urn': ['earn'], 1512 | 'use': ['ewes', 'yews'], 1513 | 'vain': ['vane', 'vein'], 1514 | 'valance': ['valence'], 1515 | 'vale': ['veil'], 1516 | 'valence': ['valance'], 1517 | 'vane': ['vain', 'vein'], 1518 | 'vary': 
['very'], 1519 | 'veil': ['vale'], 1520 | 'vein': ['vain', 'vane'], 1521 | 'veracious': ['voracious'], 1522 | 'very': ['vary'], 1523 | 'vial': ['vile', 'viol'], 1524 | 'vice': ['vise'], 1525 | 'vicious': ['viscous', 'viscus'], 1526 | 'vile': ['vial', 'viol'], 1527 | 'villain': ['villein'], 1528 | 'villein': ['villain'], 1529 | 'viol': ['vial', 'vile'], 1530 | 'virtu': ['virtue'], 1531 | 'virtue': ['virtu'], 1532 | 'viscous': ['vicious', 'viscus'], 1533 | 'viscus': ['vicious', 'viscous'], 1534 | 'vise': ['vice'], 1535 | 'voracious': ['veracious'], 1536 | 'wade': ['weighed'], 1537 | 'wail': ['wale', 'whale'], 1538 | 'wain': ['wane'], 1539 | 'waist': ['waste'], 1540 | 'wait': ['weight'], 1541 | 'waive': ['wave'], 1542 | 'wale': ['wail', 'whale'], 1543 | 'wall': ['waul'], 1544 | 'wane': ['wain'], 1545 | 'want': ['wont'], 1546 | 'war': ['wore'], 1547 | 'ware': ['wear', 'where'], 1548 | 'wares': ['wears'], 1549 | 'warn': ['worn'], 1550 | 'wart': ['wort'], 1551 | 'waste': ['waist'], 1552 | 'watt': ['what'], 1553 | 'waul': ['wall'], 1554 | 'wave': ['waive'], 1555 | 'wax': ['whacks'], 1556 | 'way': ['weigh', 'whey'], 1557 | 'we': ['wee', 'whee'], 1558 | "we'd": ['weed'], 1559 | "we'll": ['weal', 'wheel'], 1560 | "we're": ['weir'], 1561 | 'weak': ['week'], 1562 | 'weal': ["we'll", 'wheel'], 1563 | 'wean': ['ween'], 1564 | 'wear': ['ware', 'where'], 1565 | 'wears': ['wares'], 1566 | 'weather': ['wether', 'whether'], 1567 | 'weaver': ['weever'], 1568 | 'wee': ['we', 'whee'], 1569 | 'weed': ["we'd"], 1570 | 'week': ['weak'], 1571 | 'ween': ['wean'], 1572 | 'weever': ['weaver'], 1573 | 'weigh': ['way', 'whey'], 1574 | 'weighed': ['wade'], 1575 | 'weight': ['wait'], 1576 | 'weir': ["we're"], 1577 | 'were': ['whirr'], 1578 | 'wet': ['whet'], 1579 | 'wether': ['weather', 'whether'], 1580 | 'whacks': ['wax'], 1581 | 'whale': ['wail', 'wale'], 1582 | 'what': ['watt'], 1583 | 'wheald': ['wheeled'], 1584 | 'whee': ['we', 'wee'], 1585 | 'wheel': ["we'll", 'weal'], 1586 | 'wheeled': 
['wheald'], 1587 | 'where': ['ware', 'wear'], 1588 | 'whet': ['wet'], 1589 | 'whether': ['weather', 'wether'], 1590 | 'whey': ['way', 'weigh'], 1591 | 'which': ['witch'], 1592 | 'whig': ['wig'], 1593 | 'while': ['wile'], 1594 | 'whine': ['wine'], 1595 | 'whirl': ['whorl'], 1596 | 'whirled': ['world'], 1597 | 'whirr': ['were'], 1598 | 'whit': ['wit'], 1599 | 'white': ['wight'], 1600 | 'whither': ['wither'], 1601 | "who''s": ["who's", 'whose'], 1602 | "who's": ["who''s", 'whose'], 1603 | 'whoa': ['woe'], 1604 | 'whole': ['hole'], 1605 | 'wholly': ['holey', 'holy'], 1606 | 'whoop': ['hoop'], 1607 | 'whore': ['haw', 'hoar'], 1608 | 'whorl': ['whirl'], 1609 | 'whose': ["who''s", "who's"], 1610 | 'wig': ['whig'], 1611 | 'wight': ['white'], 1612 | 'wile': ['while'], 1613 | 'wine': ['whine'], 1614 | 'wit': ['whit'], 1615 | 'witch': ['which'], 1616 | 'wither': ['whither'], 1617 | 'woe': ['whoa'], 1618 | 'won': ['1', 'one'], 1619 | 'wont': ['want'], 1620 | 'wood': ['would'], 1621 | 'wore': ['war'], 1622 | 'world': ['whirled'], 1623 | 'worn': ['warn'], 1624 | 'worst': ['wurst'], 1625 | 'wort': ['wart'], 1626 | 'would': ['wood'], 1627 | 'wrack': ['rack'], 1628 | 'wrap': ['rap', 'rapped', 'rapt', 'wrapped'], 1629 | 'wrapped': ['rap', 'rapped', 'rapt', 'wrap'], 1630 | 'wreak': ['reek'], 1631 | 'wrest': ['rest', 'rust'], 1632 | 'wretch': ['retch'], 1633 | 'wright': ['rate', 'right', 'rite', 'write'], 1634 | 'wring': ['ring'], 1635 | 'write': ['rate', 'right', 'rite', 'wright'], 1636 | 'wrote': ['rote'], 1637 | 'wrung': ['rung'], 1638 | 'wry': ['rye'], 1639 | 'wurst': ['worst'], 1640 | 'yaw': ['yore', "you''re", "you're", 'your'], 1641 | 'yew': ['ewe', 'you'], 1642 | 'yews': ['ewes', 'use'], 1643 | 'yoke': ['yolk'], 1644 | 'yolk': ['yoke'], 1645 | 'yore': ['yaw', "you''re", "you're", 'your'], 1646 | 'you': ['ewe', 'yew'], 1647 | "you''re": ['yaw', 'yore', "you're", 'your'], 1648 | "you'll": ['yule'], 1649 | "you're": ['yaw', 'yore', "you''re", 'your'], 1650 | 'your': ['yaw', 
'yore', "you''re", "you're"], 1651 | 'yule': ["you'll"]} --------------------------------------------------------------------------------