├── README.md
├── speech_text_whisper_offline.py
├── templates
│   ├── conversation.html
│   └── ai_assistant_button.html
├── speech_text_whisper.py
├── terminal_print_elements.py
├── app_flask_basic.py
├── geo_location_point.py
├── audio_play.py
├── audio_get_channels.py
├── terminal_spectrum_viz.py
├── terminal_print.py
├── app.flask_speak.py
├── audio_record.py
├── speech_text_offline.py
├── geo_google.py
├── ai_doc_creator.py
├── pilot.py
├── pilot_functions.py
├── conversation.ipynb
├── terminal_chat_func.py
├── terminal_audio_spectrum.ipynb
├── app_functions_map.py
├── conversation.py
├── pilot_terminal.py
└── nlp_labelling.ipynb

/README.md:
--------------------------------------------------------------------------------
1 | # ai_assistent
2 | This repository contains scripts that use AI to assist you.

--------------------------------------------------------------------------------
/speech_text_whisper_offline.py:
--------------------------------------------------------------------------------
1 | #%%
2 | # Offline transcription with the open-source Whisper package
3 | import whisper
4 | 
5 | model = whisper.load_model("base")
6 | result = model.transcribe("output.wav")
7 | print(result)
8 | #%%
9 | 
--------------------------------------------------------------------------------
/templates/conversation.html:
--------------------------------------------------------------------------------
1 | 
2 | 
3 | 
4 | 
5 | Conversation
6 | 
12 | 
13 | 

14 | Conversation Page
15 | 16 | 17 | 18 | -------------------------------------------------------------------------------- /speech_text_whisper.py: -------------------------------------------------------------------------------- 1 | # import openai 2 | import openai 3 | import json 4 | import pandas as pd 5 | import credentials 6 | import os 7 | 8 | script_dir = os.path.dirname(os.path.abspath(__file__)) 9 | filename = os.path.join(script_dir, "audio_output.wav") 10 | 11 | #%% 12 | def get_transcript_whisper(): 13 | openai.api_key = credentials.api_key 14 | file = open(filename, "rb") 15 | transcription = openai.Audio.transcribe("whisper-1", file, response_format="json") 16 | text = transcription["text"] 17 | return text 18 | 19 | # Main code 20 | output = get_transcript_whisper() 21 | print(output) 22 | print(type(output)) 23 | 24 | #%% 25 | -------------------------------------------------------------------------------- /terminal_print_elements.py: -------------------------------------------------------------------------------- 1 | # Rich text function to display list or dictionarys in panel form 2 | 3 | from rich import print 4 | from rich.console import Console 5 | from rich.columns import Columns 6 | from rich.panel import Panel 7 | import json 8 | 9 | # Test data with three columns 'Name' 'Age' 'City' and 10 persons 10 | 11 | data = [["John Smith", 33, "New York"], 12 | ["Jane Doe", 32, "Paris"], 13 | ["Sam Doe", 35, "London"], 14 | ["Susan", 33, "New York"], 15 | ["John Smith", 33, "Sydney"], 16 | ["Jane Doe", 32, "Amsterdam"], 17 | ["Sam Doe", 35, "London"], 18 | ["Susan", 33, "New York"], 19 | ["John Smith", 33, "Sydney"]] 20 | 21 | json_data = json.dumps(data) -------------------------------------------------------------------------------- /app_flask_basic.py: -------------------------------------------------------------------------------- 1 | # app.py 2 | 3 | '''This is a basic Flask app that uses the terminal_chat_func.py file to run the chatbot functions. It also uses the gTTS library to convert the chatbot's answer to speech and the pygame library to play the audio. 
The speak_answer function is called in a new thread so that the chatbot can continue to run while the audio is playing.''' 4 | 5 | from flask import Flask, render_template, request 6 | from terminal_chat_func import run_all_functions 7 | 8 | app = Flask(__name__) 9 | 10 | @app.route('/', methods=['GET', 'POST']) 11 | def index(): 12 | if request.method == 'POST': 13 | transcript, answer = run_all_functions() 14 | return render_template('index.html', transcript=transcript, answer=answer) 15 | return render_template('index.html') 16 | 17 | 18 | if __name__ == '__main__': 19 | app.run(debug=True) 20 | 21 | #%% 22 | 23 | #%% 24 | -------------------------------------------------------------------------------- /geo_location_point.py: -------------------------------------------------------------------------------- 1 | #%% 2 | # importing geopy library 3 | from geopy.geocoders import Nominatim 4 | import json 5 | from urllib.request import urlopen 6 | import pandas as pd 7 | 8 | 9 | #%% 10 | def get_geo_location(city_name): 11 | # calling the Nominatim tool 12 | loc = Nominatim(user_agent="GetLoc") 13 | 14 | # entering the location name 15 | getLoc = loc.geocode(city_name) 16 | 17 | # printing address 18 | print(getLoc.address) 19 | 20 | # printing latitude and longitude 21 | print("Latitude = ", getLoc.latitude, "\n") 22 | print("Longitude = ", getLoc.longitude) 23 | 24 | return getLoc 25 | 26 | 27 | def get_location(): 28 | url = "http://ipinfo.io/json" 29 | response = urlopen(url) 30 | data = json.load(response) 31 | # Get location 32 | lng = data['loc'].split(',')[1] 33 | lat = data['loc'].split(',')[0] 34 | location = {'lat': lat, 'lng': lng} 35 | return location 36 | 37 | -------------------------------------------------------------------------------- /audio_play.py: -------------------------------------------------------------------------------- 1 | # %% 2 | import pyaudio 3 | import wave 4 | from audio_get_channels import get_speaker 5 | import os 6 | 7 | script_dir = os.path.dirname(os.path.abspath(__file__)) 8 | 9 | def play_recording(): 10 | filename = os.path.join(script_dir, "audio_output.wav") 11 | sound = wave.open(filename) 12 | p = pyaudio.PyAudio() 13 | print(f"Start playing {sound.getnchannels()} channels at {sound.getframerate()} Hz") 14 | chunk = 1024 15 | stream = p.open(format=p.get_format_from_width(sound.getsampwidth()), 16 | channels=sound.getnchannels(), 17 | rate=sound.getframerate(), 18 | output=True, 19 | output_device_index=get_speaker()) 20 | 21 | data = sound.readframes(chunk) 22 | while True: 23 | if data != '': 24 | stream.write(data) 25 | data = sound.readframes(chunk) 26 | 27 | if data == b'': 28 | break 29 | 30 | stream.stop_stream() 31 | stream.close() 32 | p.terminate() 33 | 34 | print("Finished playing") 35 | 36 | play_recording() 37 | 38 | #%% 39 | -------------------------------------------------------------------------------- /audio_get_channels.py: -------------------------------------------------------------------------------- 1 | # pyaudio get channels and device index 2 | import pyaudio 3 | import pandas as pd 4 | 5 | # Get all channels printed 6 | def get_all_channels(): 7 | p = pyaudio.PyAudio() 8 | channels = {} 9 | for i in range(p.get_device_count()): 10 | dev = p.get_device_info_by_index(i) 11 | rate = p.get_device_info_by_index(0)['defaultSampleRate'] 12 | 13 | print((i, dev['name'], dev['maxInputChannels']), rate) 14 | 15 | # Get all channels printed in a df 16 | def get_all_channels_df(): 17 | p = pyaudio.PyAudio() 18 | channels = {} 19 | 
for i in range(p.get_device_count()): 20 | dev = p.get_device_info_by_index(i) 21 | channels[i] = i, dev['name'], dev['maxInputChannels'] 22 | 23 | return pd.DataFrame(channels).T 24 | 25 | # Get channel Macbook Pro Microphone 26 | def get_cur_mic(): 27 | p = pyaudio.PyAudio() 28 | for i in range(p.get_device_count()): 29 | dev = p.get_device_info_by_index(i) 30 | if 'pro microphone' in dev['name'].lower(): 31 | return i 32 | return None 33 | 34 | def get_speaker(): 35 | p = pyaudio.PyAudio() 36 | for i in range(p.get_device_count()): 37 | dev = p.get_device_info_by_index(i) 38 | if 'speaker' in dev['name'].lower(): 39 | return i 40 | return None 41 | 42 | #%% 43 | -------------------------------------------------------------------------------- /terminal_spectrum_viz.py: -------------------------------------------------------------------------------- 1 | #%% 2 | import pyaudio 3 | import numpy as np 4 | import matplotlib.pyplot as plt 5 | import time 6 | import struct 7 | import tkinter as tk 8 | from tkinter import TclError 9 | 10 | # https://www.youtube.com/watch?v=AShHJdSIxkY 11 | 12 | #%% 13 | chunk = 4410 14 | sample_format = pyaudio.paInt16 15 | channels = 1 # Settings with screen = 1 | Settings without screen = 1 16 | fs = 44100 17 | seconds = 10 18 | device_index = 1 # Settings with screen = 2 | Settings without screen = 1 | Settings uwithout Wifi = 0 19 | filename = "audio_spectrum.wav" 20 | 21 | p = pyaudio.PyAudio() # Create an interface to PortAudio 22 | # Implement a linebreak inn the print 23 | 24 | 25 | print(f'\n... Recording {seconds} seconds of audio initialized ...\n') 26 | 27 | stream = p.open(format=sample_format, 28 | channels=channels, 29 | rate=fs, 30 | input_device_index = device_index, 31 | frames_per_buffer=chunk, 32 | output=True, 33 | input=True) 34 | 35 | data = stream.read(chunk) 36 | #print(data) 37 | 38 | print(len(data)) 39 | data_int = np.array(struct.unpack(str(2*chunk) + 'B', data), dtype= 'b')[::2] + 128 40 | 41 | fix, ax = plt.subplots() 42 | ax.plot(data_int, '-') 43 | plt.show() 44 | 45 | #%% 46 | -------------------------------------------------------------------------------- /terminal_print.py: -------------------------------------------------------------------------------- 1 | # Print function to slowly print the text except when the user presses Enter 2 | # With pressing enter, the full answer is printed instantly 3 | from rich import print 4 | from rich.console import Console 5 | from pynput import keyboard 6 | import time 7 | import sys 8 | 9 | console = Console() 10 | 11 | def print_answer(answer): 12 | print_complete = False 13 | break_program = False 14 | 15 | def on_press(key): 16 | nonlocal break_program 17 | if key == keyboard.Key.enter: 18 | console.print('Printout activated', style='bold red') 19 | break_program = True 20 | return False 21 | 22 | listener_thread = keyboard.Listener(on_press=on_press) 23 | listener_thread.start() 24 | 25 | try: 26 | for line in answer.splitlines(): 27 | for word in line.split(): 28 | console.print(word, end=' ') 29 | sys.stdout.flush() 30 | time.sleep(0.30) 31 | if break_program: 32 | break 33 | 34 | sys.stdout.write('\n') 35 | 36 | if line == answer.splitlines()[-1] and word == line.split()[-1]: 37 | console.print('\nPrintout completed', style='bold green') 38 | print_complete = True 39 | break_program = True 40 | if print_complete: 41 | break 42 | 43 | finally: 44 | listener_thread.join() 45 | 46 | -------------------------------------------------------------------------------- /app.flask_speak.py: 
-------------------------------------------------------------------------------- 1 | # app.py 2 | 3 | '''This is a basic Flask app that uses the terminal_chat_func.py file to run the chatbot functions. It also uses the gTTS library to convert the chatbot's answer to speech and the pygame library to play the audio. The speak_answer function is called in a new thread so that the chatbot can continue to run while the audio is playing.''' 4 | 5 | from flask import Flask, render_template, request 6 | from terminal_chat_func import run_all_functions 7 | from gtts import gTTS 8 | import pygame 9 | import threading 10 | import tempfile 11 | 12 | # Initialize pygame mixer 13 | pygame.mixer.init() 14 | 15 | def speak_answer(answer): 16 | tts = gTTS(text=answer, lang='en') 17 | with tempfile.NamedTemporaryFile(delete=True) as f: 18 | tts.save(f.name) 19 | pygame.mixer.music.load(f.name) 20 | pygame.mixer.music.play() 21 | while pygame.mixer.music.get_busy(): 22 | pygame.time.Clock().tick(10) 23 | 24 | app = Flask(__name__) 25 | 26 | @app.route('/', methods=['GET', 'POST']) 27 | def index(): 28 | if request.method == 'POST': 29 | transcript, answer = run_all_functions() 30 | # Call the speak_answer function in a new thread 31 | t = threading.Thread(target=speak_answer, args=(answer,)) 32 | t.start() 33 | return render_template('index.html', transcript=transcript, answer=answer) 34 | return render_template('index.html') 35 | 36 | if __name__ == '__main__': 37 | app.run(debug=True) -------------------------------------------------------------------------------- /audio_record.py: -------------------------------------------------------------------------------- 1 | #%% 2 | import pyaudio 3 | import wave 4 | from audio_get_channels import get_cur_mic 5 | import os 6 | 7 | # Audio channels device_index need to be adjusted to the current settings: 8 | # chanel settings with screen = 1 | Settings without screen = 1 9 | # device_settings with screen = 2 | Settings without screen = 1 | Settings without Wifi = 0 10 | 11 | # (0, 'IPhone 14NJ Microphone', 1) 12 | # (1, 'External Microphone', 1) 13 | # (2, 'External Headphones', 0) 14 | # (3, 'MacBook Pro Microphone', 1) 15 | # (4, 'MacBook Pro Speakers', 0) 16 | # (5, 'Microsoft Teams Audio', 2) 17 | 18 | script_dir = os.path.dirname(os.path.abspath(__file__)) 19 | 20 | def audio_rec(num_seconds): 21 | chunk = 4410 22 | fs = 44100 23 | channels = 1 # Adjust as mentioned above 24 | seconds = num_seconds 25 | device_index = get_cur_mic() # Adjust as mentioned above 26 | sample_format = pyaudio.paInt16 27 | filename = os.path.join(script_dir, "audio_output.wav") 28 | 29 | p = pyaudio.PyAudio() # Create an interface to PortAudio 30 | 31 | print(f'\n... Recording {seconds} seconds of audio initialized ...\n') 32 | 33 | stream = p.open(format=sample_format, 34 | channels=channels, 35 | rate=fs, 36 | input_device_index=device_index, 37 | frames_per_buffer=chunk, 38 | input=True) 39 | 40 | frames = [] # Initialize array to store frames 41 | 42 | # While the for loop is running and recording, print countdown in seconds 43 | second_tracking = 0 44 | second_count = 0 45 | for i in range(0, int(fs/chunk*seconds)): 46 | data = stream.read(chunk) 47 | frames.append(data) 48 | second_tracking += 1 49 | if second_tracking == fs/chunk: 50 | second_count += 1 51 | second_tracking = 0 52 | print(f'... 
Time left: {seconds - second_count} seconds') 53 | # Stop and close the stream 54 | stream.stop_stream() 55 | stream.close() 56 | # Terminate the PortAudio interface 57 | p.terminate() 58 | 59 | print('\n... Finished recording ...') 60 | 61 | # Save the recorded data as a WAV file 62 | wf = wave.open(filename, 'wb') 63 | wf.setnchannels(channels) 64 | wf.setsampwidth(p.get_sample_size(sample_format)) 65 | wf.setframerate(fs) 66 | wf.writeframes(b''.join(frames)) 67 | wf.close() 68 | 69 | audio_rec(5) 70 | 71 | #%% 72 | -------------------------------------------------------------------------------- /speech_text_offline.py: -------------------------------------------------------------------------------- 1 | import pyaudio 2 | import wave 3 | 4 | chunk = 1024 5 | sample_format = pyaudio.paInt16 6 | channels = 1 7 | fs = 44100 8 | seconds = 3 9 | device_index = 2 10 | filename = "data/output.wav" 11 | 12 | p = pyaudio.PyAudio() 13 | 14 | stream = p.open(format=sample_format, 15 | channels=channels, 16 | rate=fs, 17 | frames_per_buffer=chunk, 18 | input_device_index=device_index, 19 | input=True) 20 | 21 | frames = [] 22 | 23 | for i in range(0, int(fs / chunk * seconds)): 24 | data = stream.read(chunk) 25 | frames.append(data) 26 | 27 | stream.stop_stream() 28 | stream.close() 29 | p.terminate() 30 | 31 | wf = wave.open(filename, 'wb') 32 | wf.setnchannels(channels) 33 | wf.setsampwidth(p.get_sample_size(sample_format)) 34 | wf.setframerate(fs) 35 | wf.writeframes(b''.join(frames)) 36 | wf.close() 37 | #%% 38 | # Path: speach-to-text.py 39 | import speech_recognition as sr 40 | 41 | r = sr.Recognizer() 42 | with sr.AudioFile('data/output.wav') as source: 43 | audio = r.record(source) 44 | 45 | try: 46 | print("Text: " + r.recognize_google(audio)) 47 | except Exception as e: 48 | print("Exception: " + str(e)) 49 | 50 | 51 | # Path: text-to-speech.py 52 | from gtts import gTTS 53 | import os 54 | 55 | #%% 56 | import pyaudio 57 | p = pyaudio.PyAudio() 58 | for i in range(p.get_device_count()): 59 | dev = p.get_device_info_by_index(i) 60 | print((i,dev['name'],dev['maxInputChannels'])) 61 | 62 | #%% SECOND TRY 63 | #%% 64 | # speech recognition 65 | import speech_recognition as sr 66 | # transcribe audio file 67 | AUDIO_FILE = "data/output.wav" 68 | 69 | # use the audio file as the audio source 70 | 71 | r = sr.Recognizer() 72 | with sr.AudioFile(AUDIO_FILE) as source: 73 | audio = r.record(source) # read the entire audio file 74 | 75 | # recognize speech using Google Speech Recognition 76 | try: 77 | recognised = r.recognize_google(audio, language="de-DE") 78 | # print recognised text and confidence 79 | print(recognised) 80 | 81 | except sr.UnknownValueError: 82 | print("Google Speech Recognition could not understand audio") 83 | except sr.RequestError as e: 84 | print("Could not request results from Google Speech Recognition service; {0}".format(e)) 85 | 86 | #%% 87 | print(recognised) 88 | 89 | # If recognised text contains the word "Barcelona", then play the pilot_functions.py script 90 | if "Barcelona" in recognised: 91 | print("Barcelona") 92 | import pilot_functions 93 | #pilot.get_story() 94 | -------------------------------------------------------------------------------- /geo_google.py: -------------------------------------------------------------------------------- 1 | #%% 2 | # Libraries 3 | import requests 4 | import credentials 5 | from geo_location_point import get_location 6 | import pandas as pd 7 | import time 8 | 9 | # Get surroundings by google maps api 10 | api_key = 
credentials.google_api_key 11 | 12 | lat = 41.3828 13 | lng = 2.1824 14 | radius = 1000 # -33.8670522,151.1957362&radius=500& 15 | types = '' 16 | search_name = '' 17 | 18 | #%% Get location function 19 | 20 | def get_surroundings(lat, lng, radius, types, search_name): 21 | api_key = credentials.google_api_key 22 | # Google Maps directions API endpoint 23 | prompt = f'https://maps.googleapis.com/maps/api/place/nearbysearch/json?location={lat},{lng}&radius={radius}&types={types}&name={search_name}&key={api_key}' 24 | # Send request and get response 25 | response = requests.get(prompt) 26 | # Get response data as Python object 27 | data = response.json() 28 | results = data['results'] 29 | # Parse the results to a dataframe 30 | df = pd.DataFrame.from_dict(results) 31 | df = df[['geometry', 'name', 'place_id', 'types', 'vicinity', 'business_status', 'rating', 'user_ratings_total', 'opening_hours']] 32 | df['lat'] = df['geometry'].apply(lambda x: x['location']['lat']) 33 | df['lng'] = df['geometry'].apply(lambda x: x['location']['lng']) 34 | df = df.drop(columns=['geometry']) 35 | return df 36 | 37 | get_surroundings(lat, lng, radius, types, search_name) 38 | 39 | #%% 40 | # Get surroundings with pagination 3*20 41 | 42 | 43 | 44 | def get_surroundings_pagination(lat, lng, radius, types, search_name): 45 | api_key = credentials.google_api_key 46 | # Paginated request 47 | df_list = [] 48 | for i in range(0, 3): 49 | # Google Maps directions API endpoint 50 | prompt = f'https://maps.googleapis.com/maps/api/place/nearbysearch/json?location={lat},{lng}&radius={radius}&types={types}&name={search_name}&key={api_key}&pagetoken={i}' 51 | # Send request and get response 52 | response = requests.get(prompt) 53 | # Get response data as Python object 54 | data = response.json() 55 | results = data['results'] 56 | # Parse the results to a dataframe 57 | df_list.append(pd.DataFrame.from_dict(results)) 58 | time.sleep(1) # Add a 1-second delay before the next request 59 | df = pd.concat(df_list, ignore_index=True) 60 | df = df[['geometry', 'name', 'place_id', 'types', 'vicinity', 'business_status', 'rating', 'user_ratings_total', 'opening_hours']] 61 | df['lat'] = df['geometry'].apply(lambda x: x['location']['lat']) 62 | df['lng'] = df['geometry'].apply(lambda x: x['location']['lng']) 63 | df = df.drop(columns=['geometry']) 64 | return df 65 | 66 | 67 | #%% 68 | -------------------------------------------------------------------------------- /ai_doc_creator.py: -------------------------------------------------------------------------------- 1 | 2 | # --- MANUAL TEMPLATE --- 3 | # Import libraries 4 | from docx import Document 5 | from docx.shared import Inches 6 | import openai 7 | import credentials 8 | import os 9 | 10 | script_dir = os.path.dirname(os.path.abspath(__file__)) 11 | startfile = os.path.join(script_dir, "template.docx") 12 | 13 | #%% 14 | # --- CHATGPT PROMPT --- 15 | header = input("\nTitle of the document: ") 16 | openai.api_key = credentials.api_key 17 | number_paragraphs = int(input("Number of Paragraphs?: ")) 18 | 19 | docu_list = [] 20 | 21 | for i in range(number_paragraphs): 22 | prompt = input(f"Question {i+1}/{number_paragraphs}: ") 23 | docu_list.append(prompt) 24 | 25 | def gpt_docu(prompt): 26 | try: 27 | print(f"----- {prompt} -----") 28 | completion = openai.ChatCompletion.create( 29 | model="gpt-4", 30 | messages=[ 31 | {"role": "user", "content": prompt} 32 | ] 33 | ) 34 | 35 | answer = completion.choices[0].message.content 36 | for i in range(2): 37 | try: 38 | if 
answer[0] == "\n": 39 | answer = answer[1:] 40 | except: 41 | pass 42 | 43 | 44 | return answer 45 | except: 46 | print("Something went wrong. Please try again.") 47 | 48 | 49 | # append all answers to a list 50 | answer_list = [] 51 | try: 52 | for i in range(len(docu_list)): 53 | print(f"\n----- Generating answer for: Question {i+1}/{len(docu_list)} -----") 54 | answer = gpt_docu(docu_list[i]) 55 | answer_list.append(answer) 56 | print(f"----- Answer : {answer} -----\n") 57 | except: 58 | print("Something went wrong. Please try again.") 59 | 60 | #%% 61 | # --- CREATE DOCUMENT --- 62 | # Open template document `hello_world.docx` 63 | document = Document(startfile) 64 | # Clear document 65 | document._body.clear_content() 66 | 67 | # Add title 68 | document.add_heading(header, 1) 69 | 70 | for i in range(len(answer_list)): 71 | # Add header first 72 | document.add_heading(docu_list[i], 2) 73 | # Add paragraph 74 | p = document.add_paragraph(answer_list[i]) 75 | 76 | # Save document with the first 4 words from the header if the exist. 77 | 78 | try: 79 | document.save('/Users/erictak/Desktop/' + header.split()[0] +' '+ header.split()[1] +' '+ header.split()[2] + header.split()[3] + '.docx') 80 | except: 81 | try: 82 | document.save('/Users/erictak/Desktop/' + header.split()[0] +' '+ header.split()[1] +' '+ header.split()[2] + '.docx') 83 | except: 84 | try: 85 | document.save('/Users/erictak/Desktop/' + header.split()[0] +' '+ header.split()[1] + '.docx') 86 | except: 87 | try: 88 | document.save('/Users/erictak/Desktop/' + header.split()[0] + '.docx') 89 | except: 90 | document.save('/Users/erictak/Desktop/Untitled.docx') 91 | 92 | -------------------------------------------------------------------------------- /pilot.py: -------------------------------------------------------------------------------- 1 | # GEOSPATIALLY SUPPORTED STORYTELLER 2 | # possible names: fun_fact, storymapper, ... 3 | 4 | # Based on the current location, the storyteller will tell a fun fact or anecdote about nearby places 5 | # Possible sources: Wikipedia, Google, ... 
6 | # Possine output: country, city, street information; historical events; future events and local ; stores and restaurants; 7 | # famous people; myths and legends; weather incidents; 8 | 9 | 10 | 11 | #%% IMPORTING LIBRARIES 12 | import pandas as pd 13 | import numpy as np 14 | import matplotlib.pyplot as plt 15 | import folium as fl 16 | import wikipedia 17 | import gtts 18 | from numpy import random 19 | from playsound import playsound 20 | import pyttsx3 21 | import numpy.random 22 | 23 | 24 | # SETTINGS 25 | 26 | #%% CHECK GPS 27 | 28 | # Define GPS Coordinates of Barcelona 29 | lat_input = 11.390 30 | log_input = 11.154 31 | 32 | # Define the radius of the circle 33 | radius = 0.5 34 | 35 | # Load worldcities dataset zip 'https://simplemaps.com/data/world-cities' 36 | worldcities = pd.read_csv('simplemaps_worldcities_basicv1.75/worldcities.csv') 37 | 38 | print(worldcities.tail(10)) 39 | 40 | 41 | #%% MATCH LOCATION 42 | 43 | # Find closest city to the input coordinates 44 | # Calculate the distance between the input coordinates and the coordinates of the cities 45 | worldcities['distance'] = np.sqrt((worldcities['lat'] - lat_input)**2 + (worldcities['lng'] - log_input)**2) 46 | 47 | # Find the closest cit 48 | closest_cities = worldcities.sort_values(by='distance').head(10) 49 | closest_city = worldcities.loc[worldcities['distance'].idxmin()] 50 | 51 | # Print the closest city 52 | print(closest_city) 53 | 54 | #%% INFORMATION SEARCH 55 | 56 | # Search for the closest city on wikipedia 57 | try: 58 | 59 | page = wikipedia.page(closest_city['city']) 60 | wikipedia.set_lang("de") 61 | print(page.summary) 62 | except: 63 | print('No information found') 64 | 65 | # Search for the closest city with country on wikipedia 66 | try: 67 | page = wikipedia.page(closest_city['city'], ',' , closest_city['country']) 68 | print(page.summary) 69 | except: 70 | print('No information found') 71 | 72 | # Possible source: https://dataverse.harvard.edu/dataset.xhtml?persistentId=doi:10.7910/DVN/6ZFC0V 73 | 74 | #%% PLOT CITY MAP (FOLIUM as html in directory 75 | 76 | # City Map with folium 77 | # https://python-visualization.github.io/folium/ 78 | 79 | # Create a map of the city 80 | city_map = fl.Map(location=[closest_city['lat'], closest_city['lng']], zoom_start=10) 81 | 82 | # Add a marker to the map 83 | fl.Marker([closest_city['lat'], closest_city['lng']], popup=closest_city['city']).add_to(city_map) 84 | 85 | # Display the map 86 | 87 | city_map.save(f"data/{closest_city['city']}_map.html") # <- HTML file in directory 88 | 89 | #%% Synthesize the story verbally 90 | 91 | from gtts import gTTS 92 | 93 | lang = gtts.lang.tts_langs() 94 | rand_lang = random.choice(list(lang.keys())) # random.randint(0, 9) 95 | print(type(lang)) 96 | story = f"The closest city is {closest_city}{page.summary}" 97 | my_tts = story 98 | tts = gTTS(text=my_tts, lang=rand_lang, slow=False) 99 | tts.save(f"data/{closest_city['city']}_story.mp3") 100 | print(lang) 101 | print(rand_lang) 102 | -------------------------------------------------------------------------------- /pilot_functions.py: -------------------------------------------------------------------------------- 1 | # Location Based Storyteller 2 | 3 | # %% IMPORTING LIBRARIES 4 | import pandas as pd 5 | import numpy as np 6 | import wikipedia 7 | import pyttsx3 8 | import random 9 | 10 | # %% CHECK GPS 11 | 12 | def get_story(): 13 | ''' Parameters: lat_input, log_input 14 | Returns: closest_city, page.summary ''' 15 | lat_input = random.uniform(40, 45) 16 | 
log_input = random.uniform(0, 5) 17 | radius = 0.5 18 | 19 | # Load worldcities dataset and calculate closest city 20 | worldcities = pd.read_csv('data/worldcities.csv') 21 | worldcities['distance'] = np.sqrt((worldcities['lat'] - lat_input) ** 2 + (worldcities['lng'] - log_input) ** 2) 22 | 23 | # Selection of one or more cities 24 | closest_cities = worldcities.sort_values(by='distance').head(10) 25 | closest_city = worldcities.loc[worldcities['distance'].idxmin()] 26 | 27 | # Wikipedia search 28 | try: 29 | page = wikipedia.page(closest_city['city'], ',', closest_city['country']) 30 | print(page.summary) 31 | except: 32 | try: 33 | page = wikipedia.page(closest_city['city']) 34 | print(page.summary) 35 | except: 36 | print('No information found') 37 | 38 | # Create the story 39 | story = 'The closest city to your location is ' + closest_city['city'] + ' in ' + closest_city['country'] + '. ' + page.summary 40 | shortstory = str(story.split('.', 4)[0:4]) # Cut story after 4th sentence if possible and convert to string 41 | shortstory = shortstory.replace('[', '').replace(']', '').replace("'", '') 42 | 43 | # Synthesize story with pyttsx3 44 | tts = pyttsx3.init() 45 | tts.setProperty('rate', 80) 46 | tts.say(shortstory) 47 | tts.runAndWait() 48 | 49 | get_story() 50 | #%% 51 | import pandas as pd 52 | import wikipedia 53 | import pyttsx3 54 | 55 | def get_location_story(city_name): 56 | ''' Parameters: city_name 57 | Returns: closest_city, page.summary ''' 58 | radius = 0.5 59 | 60 | # Load worldcities dataset and retrieve latitude and longitude values of the city 61 | worldcities = pd.read_csv('data/worldcities.csv') 62 | city_data = worldcities[worldcities['city_ascii'] == city_name] 63 | if city_data.empty: 64 | print(f"No data found for city: {city_name}") 65 | return 66 | 67 | lat_input = city_data['lat'].values[0] 68 | log_input = city_data['lng'].values[0] 69 | 70 | # Calculate closest city 71 | worldcities['distance'] = ((worldcities['lat'] - lat_input) ** 2 + (worldcities['lng'] - log_input) ** 2).apply(np.sqrt) 72 | closest_city = worldcities.loc[worldcities['distance'].idxmin()] 73 | 74 | # Wikipedia search 75 | try: 76 | page = wikipedia.page(closest_city['city'], ',', closest_city['country']) 77 | print(page.summary) 78 | except: 79 | try: 80 | page = wikipedia.page(closest_city['city']) 81 | print(page.summary) 82 | except: 83 | print('No information found') 84 | 85 | # Create the story 86 | story = 'The closest city to your location is ' + closest_city['city'] + ' in ' + closest_city['country'] + '. ' + page.summary 87 | shortstory = str(story.split('.', 4)[0:4]) # Cut story after 4th sentence if possible and convert to string 88 | shortstory = shortstory.replace('[', '').replace(']', '').replace("'", '') 89 | 90 | # Synthesize story with pyttsx3 91 | tts = pyttsx3.init() 92 | tts.setProperty('rate', 80) 93 | tts.say(shortstory) 94 | tts.runAndWait() 95 | #%% 96 | -------------------------------------------------------------------------------- /templates/ai_assistant_button.html: -------------------------------------------------------------------------------- 1 | // this is the html file that will be rendered and give a button to make a conversation with gpt-4 model. 2 | 3 | 4 | 5 | 6 | 7 | Conversational AI 8 | 66 | 67 | 68 |

Conversational AI
69 | How may I assist you today?
70 | 
71 | 
72 | 
73 | 
74 | {% if request.method == 'POST' %}
75 | 
76 | Transcript:
77 | {{ transcript }}
78 | Answer:
79 | {{ answer }}
80 | 
81 | {% endif %} 82 | 83 | 103 | 104 | 105 | 106 | 107 | -------------------------------------------------------------------------------- /conversation.ipynb: -------------------------------------------------------------------------------- 1 | { 2 | "cells": [ 3 | { 4 | "cell_type": "code", 5 | "execution_count": 1, 6 | "metadata": { 7 | "collapsed": true 8 | }, 9 | "outputs": [ 10 | { 11 | "ename": "IndentationError", 12 | "evalue": "expected an indented block after 'if' statement on line 78 (606879098.py, line 80)", 13 | "output_type": "error", 14 | "traceback": [ 15 | "\u001B[0;36m Cell \u001B[0;32mIn[1], line 80\u001B[0;36m\u001B[0m\n\u001B[0;31m print(f\"\\n------------------------- Storyteller assistant stopped -----------------------------------\")\u001B[0m\n\u001B[0m ^\u001B[0m\n\u001B[0;31mIndentationError\u001B[0m\u001B[0;31m:\u001B[0m expected an indented block after 'if' statement on line 78\n" 16 | ] 17 | } 18 | ], 19 | "source": [ 20 | "# Import libraries\n", 21 | "import os\n", 22 | "import openai\n", 23 | "import credentials\n", 24 | "import sys\n", 25 | "import pyttsx3\n", 26 | "from audio_record import audio_rec\n", 27 | "from speech_text_whisper import get_transcript_whisper\n", 28 | "\n", 29 | "openai.api_key = credentials.api_key\n", 30 | "import time\n", 31 | "\n", 32 | "\n", 33 | "def get_transcript_whisper():\n", 34 | " '''Get transcript of audio file with whisper api'''\n", 35 | " openai.api_key = credentials.api_key\n", 36 | " file = open(\"audio_output.wav\", \"rb\")\n", 37 | " transcription = openai.Audio.transcribe(\"whisper-1\", file, response_format=\"json\")\n", 38 | " text = transcription[\"text\"]\n", 39 | " return text\n", 40 | "\n", 41 | "\n", 42 | "def run_GPT3(prompt):\n", 43 | " '''Run GPT-3 with the prompt and return the response'''\n", 44 | " response = openai.Completion.create(\n", 45 | " engine=\"davinci\",\n", 46 | " prompt=prompt,\n", 47 | " temperature=0.7,\n", 48 | " max_tokens=256,\n", 49 | " top_p=1,\n", 50 | " frequency_penalty=0,\n", 51 | " presence_penalty=0\n", 52 | " )\n", 53 | " print(response)\n", 54 | " return response\n", 55 | "\n", 56 | "\n", 57 | "def run_chatGPT():\n", 58 | " '''Run chatGPT with the prompt and return the response'''\n", 59 | " completion = openai.ChatCompletion.create(\n", 60 | " model=\"gpt-3.5-turbo\",\n", 61 | " messages=[\n", 62 | " {\"role\": \"user\", \"content\": text_output}\n", 63 | " ]\n", 64 | " )\n", 65 | "\n", 66 | " return completion.choices[0].message.content\n", 67 | "\n", 68 | "\n", 69 | "print(f\"\\n------------------------- Storyteller assistant started -----------------------------------\")\n", 70 | "# Record audio file with function improted from audio_record.py\n", 71 | "audio_rec(10)\n", 72 | "\n", 73 | "# Get transcript of audio file with whisper api\n", 74 | "print(f\"\\n... Transcribing audio file ...\")\n", 75 | "\n", 76 | "text_output = get_transcript_whisper()\n", 77 | "\n", 78 | "print(f\"\\n... Text recognized: {text_output}\")\n", 79 | "\n", 80 | "print(f\"\\n... Asking ChatGPT ...\")\n", 81 | "answer = run_chatGPT()\n", 82 | "\n", 83 | "print(f\"\\n... Answer from ChatGPT: {answer}\")\n", 84 | "\n", 85 | "print(f\"\\n... Synthesizing answer ...\")\n", 86 | "tts = pyttsx3.init()\n", 87 | "tts.setProperty('rate', 120)\n", 88 | "tts.say(answer)\n", 89 | "tts.runAndWait()\n", 90 | "\n", 91 | "print(f\"\\n... Listening to answer for 3 seconds ...\")\n", 92 | "audio_rec(3)\n", 93 | "\n", 94 | "text_output = get_transcript_whisper()\n", 95 | "print(f\"\\n... 
Text recognized: {text_output}\")\n", 96 | "\n", 97 | "if \"yes\" in text_output:\n", 98 | "\n", 99 | "print(f\"\\n------------------------- Storyteller assistant stopped -----------------------------------\")" 100 | ] 101 | }, 102 | { 103 | "cell_type": "code", 104 | "execution_count": null, 105 | "outputs": [], 106 | "source": [], 107 | "metadata": { 108 | "collapsed": false 109 | } 110 | } 111 | ], 112 | "metadata": { 113 | "kernelspec": { 114 | "display_name": "Python 3", 115 | "language": "python", 116 | "name": "python3" 117 | }, 118 | "language_info": { 119 | "codemirror_mode": { 120 | "name": "ipython", 121 | "version": 2 122 | }, 123 | "file_extension": ".py", 124 | "mimetype": "text/x-python", 125 | "name": "python", 126 | "nbconvert_exporter": "python", 127 | "pygments_lexer": "ipython2", 128 | "version": "2.7.6" 129 | } 130 | }, 131 | "nbformat": 4, 132 | "nbformat_minor": 0 133 | } 134 | -------------------------------------------------------------------------------- /terminal_chat_func.py: -------------------------------------------------------------------------------- 1 | #%% 2 | import plotext 3 | import numpy as np 4 | import pyaudio 5 | import struct 6 | import wave 7 | import time 8 | from audio_get_channels import get_cur_mic 9 | from scipy.fftpack import fft 10 | import openai 11 | import credentials 12 | import os 13 | import pyttsx3 14 | import threading 15 | import sys 16 | from audio_get_channels import get_speaker 17 | from geopy.geocoders import Nominatim 18 | import json 19 | from urllib.request import urlopen 20 | 21 | script_dir = os.path.dirname(os.path.abspath(__file__)) 22 | filename = os.path.join(script_dir, "audio_output.wav") 23 | preprompt = "You are a Ai audio guide. in the following prompt, look for the name of a city or a location, and give a one line discription of this place. Start with the location as a header." 
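# Note on the prompt pattern above: `preprompt` is simply concatenated with the
# user's transcript inside run_chatGPT() below. The legacy openai ChatCompletion
# API used here also accepts a dedicated "system" message, which keeps the
# instruction separate from the user input; a minimal sketch of that alternative
# (an assumption, not code from this project):
#
#   completion = openai.ChatCompletion.create(
#       model="gpt-4",
#       messages=[
#           {"role": "system", "content": preprompt},
#           {"role": "user", "content": prompt},
#       ],
#   )
#   answer = completion.choices[0].message.content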
24 | 25 | def get_geo_location(city_name): 26 | # calling the Nominatim tool 27 | loc = Nominatim(user_agent="GetLoc") 28 | 29 | # entering the location name 30 | getLoc = loc.geocode(city_name) 31 | 32 | # printing address 33 | print(getLoc.address) 34 | 35 | # printing latitude and longitude 36 | print("Latitude = ", getLoc.latitude, "\n") 37 | print("Longitude = ", getLoc.longitude) 38 | 39 | return getLoc 40 | 41 | 42 | def get_location(): 43 | url = "http://ipinfo.io/json" 44 | response = urlopen(url) 45 | data = json.load(response) 46 | # Get location 47 | lng = data['loc'].split(',')[1] 48 | lat = data['loc'].split(',')[0] 49 | location = {'lat': lat, 'lng': lng} 50 | return location 51 | 52 | 53 | 54 | def run_chatGPT(prompt): 55 | '''Run chatGPT with the prompt and return the response''' 56 | completion = openai.ChatCompletion.create( 57 | model="gpt-4", 58 | messages=[ 59 | {"role": "user", "content": preprompt + prompt}, 60 | ] 61 | ) 62 | answer = completion.choices[0].message.content 63 | 64 | return answer 65 | 66 | 67 | def speak_answer(answer): 68 | engine = pyttsx3.init() 69 | engine.setProperty('rate', 110) 70 | engine.say(answer) 71 | engine.runAndWait() 72 | 73 | 74 | def print_answer(answer): 75 | for word in answer.split(): 76 | print(word, end=' ', flush=True) 77 | 78 | 79 | def print_transcript(transcript): 80 | for word in transcript.split(): 81 | time.sleep(0.27) 82 | print(word, end=' ', flush=True) 83 | 84 | 85 | def get_transcript_whisper(): 86 | openai.api_key = credentials.api_key 87 | file = open(filename, "rb") 88 | transcription = openai.Audio.transcribe("whisper-1", file, response_format="json") 89 | transcribed_text = transcription["text"] 90 | return transcribed_text 91 | 92 | 93 | def audio_spectrum(num_seconds): 94 | script_dir = os.path.dirname(os.path.abspath(__file__)) 95 | 96 | chunk = 2205 97 | channels = 1 98 | fs = 44100 99 | seconds = max(num_seconds, 0.1) 100 | sample_format = pyaudio.paInt16 101 | filename = os.path.join(script_dir, "audio_output.wav") 102 | 103 | print(f'\n... Recording {seconds} seconds of audio initialized ...\n') 104 | 105 | p = pyaudio.PyAudio() 106 | stream = p.open(format=sample_format, 107 | channels=channels, 108 | rate=fs, 109 | input_device_index=get_cur_mic(), 110 | frames_per_buffer=chunk, 111 | input=True) 112 | 113 | 114 | frames = [] 115 | for i in range(0, int(fs / chunk * seconds)): 116 | data = stream.read(chunk, False) 117 | frames.append(data) 118 | 119 | 120 | # Stop and close the stream 121 | stream.stop_stream() 122 | stream.close() 123 | p.terminate() 124 | 125 | # Save the recorded data as a WAV file 126 | wf = wave.open(filename, 'wb') 127 | wf.setnchannels(channels) 128 | wf.setsampwidth(p.get_sample_size(sample_format)) 129 | wf.setframerate(fs) 130 | wf.writeframes(b''.join(frames)) 131 | wf.close() 132 | 133 | 134 | def run_all_functions(): 135 | try: 136 | audio_spectrum(6) 137 | except KeyboardInterrupt: 138 | pass 139 | 140 | transcript = get_transcript_whisper() 141 | 142 | # If text contains one word of a stopwordlist then the script will stop 143 | if any(word in transcript for word in ['stop', 'Stop', 'exit', 'quit', 'end']): 144 | print('... 
Script stopped by user') 145 | exit() 146 | 147 | transcript = f' {transcript}' 148 | 149 | #print_transcript(transcript) 150 | 151 | answer = run_chatGPT(transcript) 152 | # Split answer into answer and location 153 | 154 | #print_answer(answer) 155 | 156 | #speak_answer(answer) 157 | 158 | return transcript, answer 159 | 160 | 161 | 162 | #run_all_functions() 163 | # ---------------------------------------------------------------- 164 | if __name__ == "__main__": 165 | script_start = time.time() 166 | script_dir = os.path.dirname(os.path.abspath(__file__)) 167 | filename = os.path.join(script_dir, "audio_output.wav") 168 | run_all_functions() 169 | 170 | 171 | 172 | # Create threads for speaking and printing the transcript 173 | #speak_thread = threading.Thread(target=speak_answer) 174 | #print_thread = threading.Thread(target=print_transcript) 175 | 176 | # Start both threads 177 | #print_thread.start() 178 | #speak_thread.start() 179 | 180 | # Wait for both threads to finish 181 | #threading.wait_for(lambda: not speak_thread.is_alive()and not print_thread.is_alive()) 182 | 183 | # Wait for both threads to finish 184 | #speak_thread.join() 185 | #print_thread.join() 186 | #print_answer() 187 | 188 | # ---------------------------------------------------------------- 189 | # Restart the script 190 | 191 | 192 | -------------------------------------------------------------------------------- /terminal_audio_spectrum.ipynb: -------------------------------------------------------------------------------- 1 | { 2 | "cells": [ 3 | { 4 | "cell_type": "code", 5 | "execution_count": null, 6 | "metadata": { 7 | "collapsed": true 8 | }, 9 | "outputs": [], 10 | "source": [ 11 | "# Version 1\n", 12 | "import plotext\n", 13 | "import numpy as np\n", 14 | "import pyaudio\n", 15 | "import struct\n", 16 | "import wave\n", 17 | "import time\n", 18 | "\n", 19 | "chunk = 4410\n", 20 | "sample_format = pyaudio.paInt16\n", 21 | "channels = 1\n", 22 | "fs = 44100\n", 23 | "seconds = 10\n", 24 | "device_index = 2\n", 25 | "filename = \"audio_spectrum.wav\"\n", 26 | "\n", 27 | "print(f'\\n... 
Recording {seconds} seconds of audio initialized ...\\n')\n", 28 | "print(\n", 29 | " f'\\n\\n>>> RECORDING PLEASE SPEAK CLEARLY <<< >>> RECORDING PLEASE SPEAK CLEARLY <<< >>> RECORDING PLEASE SPEAK CLEARLY <<<\\n\\n')\n", 30 | "\n", 31 | "p = pyaudio.PyAudio()\n", 32 | "stream = p.open(format=sample_format,\n", 33 | " channels=channels,\n", 34 | " rate=fs,\n", 35 | " input_device_index=device_index,\n", 36 | " frames_per_buffer=chunk,\n", 37 | " input=True,\n", 38 | " output=True,)\n", 39 | "\n", 40 | "plotext.title(\"Spectrum\")\n", 41 | "plotext.clc()\n", 42 | "\n", 43 | "x = np.arange(0, chunk, 1)\n", 44 | "\n", 45 | "frames = []\n", 46 | "start_time = time.time()\n", 47 | "\n", 48 | "while time.time() - start_time < seconds:\n", 49 | " plotext.clt()\n", 50 | " plotext.cld()\n", 51 | "\n", 52 | " y = np.array(struct.unpack(str(2 * chunk) + 'B', stream.read(chunk)), dtype='b')[::2] + 128\n", 53 | " plotext.plot(x, y, color=\"green\", marker=\"_\", label=\"Spectrum\")\n", 54 | " plotext.sleep(0.01)\n", 55 | " plotext.xlabel(f'Frequency (Hz) - {round(time.time() - start_time, 2)} seconds')\n", 56 | " plotext.ylim(0, 260)\n", 57 | " plotext.xlim(0, 4500)\n", 58 | " plotext.show()\n", 59 | "\n", 60 | " # Append audio frames to the list\n", 61 | " frames.append(y.tobytes())\n", 62 | "\n", 63 | "# Stop and close the stream\n", 64 | "stream.stop_stream()\n", 65 | "stream.close()\n", 66 | "p.terminate()\n", 67 | "\n", 68 | "# Save the recorded data as a WAV file\n", 69 | "wf = wave.open(filename, 'wb')\n", 70 | "wf.setnchannels(channels)\n", 71 | "wf.setsampwidth(p.get_sample_size(sample_format))\n", 72 | "wf.setframerate(fs)\n", 73 | "wf.writeframes(b''.join(frames))\n", 74 | "wf.close()\n", 75 | "\n", 76 | "plotext.clear_data()\n" 77 | ] 78 | }, 79 | { 80 | "cell_type": "code", 81 | "execution_count": null, 82 | "outputs": [], 83 | "source": [ 84 | "# Version 2\n", 85 | "import plotext\n", 86 | "import numpy as np\n", 87 | "import pyaudio\n", 88 | "import struct\n", 89 | "import wave\n", 90 | "\n", 91 | "chunk = 4410\n", 92 | "sample_format = pyaudio.paInt16\n", 93 | "channels = 1\n", 94 | "fs = 44100\n", 95 | "seconds = 10\n", 96 | "device_index = 2\n", 97 | "filename = \"audio_spectrum.wav\"\n", 98 | "\n", 99 | "print(f'\\n... 
Recording {seconds} seconds of audio initialized ...\\n')\n", 100 | "print(f'\\n\\n>>> RECORDING PLEASE SPEAK CLEARLY <<< >>> RECORDING PLEASE SPEAK CLEARLY <<< >>> RECORDING PLEASE SPEAK CLEARLY <<<\\n\\n')\n", 101 | "\n", 102 | "p = pyaudio.PyAudio()\n", 103 | "stream = p.open(format=sample_format,\n", 104 | " channels=channels,\n", 105 | " rate=fs,\n", 106 | " input_device_index=device_index,\n", 107 | " frames_per_buffer=chunk,\n", 108 | " input=True,\n", 109 | " output=True,)\n", 110 | "\n", 111 | "plotext.title(\"Spectrum\")\n", 112 | "plotext.clc()\n", 113 | "\n", 114 | "x = np.arange(0, chunk, 1)\n", 115 | "\n", 116 | "frames = []\n", 117 | "for i in range(fs):\n", 118 | " plotext.clt()\n", 119 | " plotext.cld()\n", 120 | "\n", 121 | " y = np.array(struct.unpack(str(2 * chunk) + 'B', stream.read(chunk)), dtype='b')[::2] + 128\n", 122 | " plotext.plot(x, y, color=\"green\", marker=\"_\", label=\"Spectrum\")\n", 123 | " plotext.sleep(0.01)\n", 124 | " plotext.xlabel(\"Frequency\")\n", 125 | " plotext.ylabel(\"Amplitude\")\n", 126 | " plotext.ylim(0, 260)\n", 127 | " plotext.xlim(0, 4500)\n", 128 | " plotext.show()\n", 129 | "\n", 130 | " # Append audio frames to the list\n", 131 | " frames.append(y.tobytes())\n", 132 | "\n", 133 | "# Stop and close the stream\n", 134 | "stream.stop_stream()\n", 135 | "stream.close()\n", 136 | "p.terminate()\n", 137 | "\n", 138 | "# Save the recorded data as a WAV file\n", 139 | "wf = wave.open(filename, 'wb')\n", 140 | "wf.setnchannels(channels)\n", 141 | "wf.setsampwidth(p.get_sample_size(sample_format))\n", 142 | "wf.setframerate(fs)\n", 143 | "wf.writeframes(b''.join(frames))\n", 144 | "wf.close()\n", 145 | "\n", 146 | "plotext.clear_data()" 147 | ], 148 | "metadata": { 149 | "collapsed": false 150 | } 151 | } 152 | ], 153 | "metadata": { 154 | "kernelspec": { 155 | "display_name": "Python 3", 156 | "language": "python", 157 | "name": "python3" 158 | }, 159 | "language_info": { 160 | "codemirror_mode": { 161 | "name": "ipython", 162 | "version": 2 163 | }, 164 | "file_extension": ".py", 165 | "mimetype": "text/x-python", 166 | "name": "python", 167 | "nbconvert_exporter": "python", 168 | "pygments_lexer": "ipython2", 169 | "version": "2.7.6" 170 | } 171 | }, 172 | "nbformat": 4, 173 | "nbformat_minor": 0 174 | } 175 | -------------------------------------------------------------------------------- /app_functions_map.py: -------------------------------------------------------------------------------- 1 | #%% 2 | import folium 3 | from gtts import gTTS 4 | import pygame 5 | import tempfile 6 | import pyaudio 7 | import wave 8 | import time 9 | from audio_get_channels import get_cur_mic 10 | import openai 11 | import credentials 12 | import os 13 | from geopy.geocoders import Nominatim 14 | import json 15 | from urllib.request import urlopen 16 | import pandas as pd 17 | from geo_google import get_surroundings 18 | 19 | 20 | '''these functions are used to run the chatbot and audio functions in the flask app''' 21 | 22 | script_dir = os.path.dirname(os.path.abspath(__file__)) 23 | filename = os.path.join(script_dir, "audio_output.wav") 24 | preprompt = "You are a Ai audio guide. in the following prompt, look for the name of a city or a location, and give a one line discription of this place. Start with the location as a header." 
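# Note on speak_answer() further down: gTTS saves the mp3 into a
# NamedTemporaryFile(delete=True), which is removed as soon as the `with` block
# exits and, on Windows, cannot be reopened by gTTS or pygame while the original
# handle is still open. A sketch of a more defensive variant (an assumption, not
# this project's tested code; pygame.mixer.music.unload() requires pygame >= 2.0):
#
#   import os, tempfile
#
#   def speak_answer_safe(answer):
#       if not pygame.mixer.get_init():
#           pygame.mixer.init()
#       fd, path = tempfile.mkstemp(suffix=".mp3")
#       os.close(fd)                      # release the OS handle before gTTS writes
#       gTTS(text=answer, lang="en").save(path)
#       pygame.mixer.music.load(path)
#       pygame.mixer.music.play()
#       while pygame.mixer.music.get_busy():
#           pygame.time.Clock().tick(10)  # poll at ~10 Hz until playback ends
#       pygame.mixer.music.unload()
#       os.remove(path)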
25 | 26 | 27 | #%% AUDIO FUNCTIONS 28 | def audio_spectrum(num_seconds): 29 | ''' Record audio for num_seconds and save it to a wav file''' 30 | 31 | script_dir = os.path.dirname(os.path.abspath(__file__)) 32 | 33 | chunk = 2205 34 | channels = 1 35 | fs = 44100 36 | seconds = max(num_seconds, 0.1) 37 | sample_format = pyaudio.paInt16 38 | filename = os.path.join(script_dir, "audio_output.wav") 39 | 40 | print(f'\n... Recording {seconds} seconds of audio initialized ...\n') 41 | 42 | p = pyaudio.PyAudio() 43 | stream = p.open(format=sample_format, 44 | channels=channels, 45 | rate=fs, 46 | input_device_index=get_cur_mic(), 47 | frames_per_buffer=chunk, 48 | input=True) 49 | 50 | 51 | frames = [] 52 | for i in range(0, int(fs / chunk * seconds)): 53 | data = stream.read(chunk, False) 54 | frames.append(data) 55 | 56 | 57 | # Stop and close the stream 58 | stream.stop_stream() 59 | stream.close() 60 | p.terminate() 61 | 62 | # Save the recorded data as a WAV file 63 | wf = wave.open(filename, 'wb') 64 | wf.setnchannels(channels) 65 | wf.setsampwidth(p.get_sample_size(sample_format)) 66 | wf.setframerate(fs) 67 | wf.writeframes(b''.join(frames)) 68 | wf.close() 69 | 70 | #%% TRANSCRIPT FUNCTIONS 71 | def get_transcript_whisper(): 72 | '''Get the transcript of the audio file''' 73 | openai.api_key = credentials.api_key 74 | file = open(filename, "rb") 75 | transcription = openai.Audio.transcribe("whisper-1", file, response_format="json") 76 | transcribed_text = transcription["text"] 77 | 78 | return transcribed_text 79 | 80 | #%% TEXT RECOGNITION FUNCTIONS 81 | def recognize_infos(transcribed_text): 82 | ''' If transcribed text contains a city name from worldcities.csv, return the city name''' 83 | df = pd.read_csv('worldcities.csv') 84 | df = df.dropna() 85 | df = df.drop_duplicates(subset=['city_ascii']) 86 | df = df.reset_index(drop=True) 87 | df['city_ascii'] = df['city_ascii'].str.lower() 88 | 89 | # Convert transcribed_text to lowercase for proper comparison 90 | transcribed_text = transcribed_text.lower() 91 | 92 | for city in df['city_ascii']: 93 | if city in transcribed_text: 94 | city = df[df['city'] == city.lower()]['city'].values[0] 95 | lng = df[df['city_ascii'] == city.lower()]['lng'].values[0] 96 | lat = df[df['city_ascii'] == city.lower()]['lat'].values[0] 97 | location = {'lat': lat, 'lng': lng} 98 | return city, location 99 | 100 | 101 | #%% CHATGPT FUNCTIONS 102 | def run_chatGPT(prompt): 103 | '''Run chatGPT with the prompt and return the response''' 104 | completion = openai.ChatCompletion.create( 105 | model="gpt-4", 106 | messages=[ 107 | {"role": "user", "content": preprompt + prompt}, 108 | ] 109 | ) 110 | answer = completion.choices[0].message.content 111 | 112 | return answer 113 | 114 | #%% SPEAK FUNCTIONS 115 | def speak_answer(answer): 116 | '''Speak the answer''' 117 | tts = gTTS(text=answer, lang='en') 118 | with tempfile.NamedTemporaryFile(delete=True) as f: 119 | tts.save(f.name) 120 | pygame.mixer.music.load(f.name) 121 | pygame.mixer.music.play() 122 | while pygame.mixer.music.get_busy(): 123 | pygame.time.Clock().tick(10) 124 | 125 | 126 | #%% CREATE MAP 127 | #load map in browser 128 | def create_map(location, df): 129 | map = folium.Map(location=[location['lat'], location['lng']], zoom_start=15, tiles='Stamen Toner') 130 | for i in range(0, len(df)): 131 | button_html = f'' 132 | marker_popup = folium.Popup(f''' 133 | Name: {df.iloc[i]['name']} 134 | Vicinity: {df.iloc[i]['vicinity']} 135 | Business status: {df.iloc[i]['business_status']} 136 | Rating: 
{df.iloc[i]['rating']} 137 | User ratings total: {df.iloc[i]['user_ratings_total']} 138 | Opening hours: {df.iloc[i]['opening_hours']} 139 | {button_html} 140 | ''') 141 | folium.Marker([df.iloc[i]['lat'], df.iloc[i]['lng']], popup=marker_popup, 142 | icon=folium.Icon(color='red', icon='')).add_to(map) 143 | return map._repr_html_() 144 | 145 | 146 | def run_all_functions(): 147 | try: 148 | audio_spectrum(6) 149 | except KeyboardInterrupt: 150 | pass 151 | 152 | transcript = get_transcript_whisper() 153 | recognized_city = recognize_infos(transcript) 154 | city = recognized_city[0] 155 | location = recognized_city[1] 156 | df = get_surroundings(location['lat'], location['lng'], 500, 'tourist_attraction', '') 157 | map = create_map(location, df) 158 | 159 | 160 | # If text contains one word of a stopwordlist then the script will stop 161 | if any(word in transcript for word in ['stop', 'Stop', 'exit', 'quit', 'end']): 162 | print('... Script stopped by user') 163 | exit() 164 | 165 | transcript = f' {transcript}' 166 | 167 | answer = run_chatGPT(transcript) 168 | speak_answer(answer) 169 | 170 | return transcript, answer, city, map 171 | 172 | 173 | #run_all_functions() 174 | # ---------------------------------------------------------------- 175 | if __name__ == "__main__": 176 | script_start = time.time() 177 | script_dir = os.path.dirname(os.path.abspath(__file__)) 178 | filename = os.path.join(script_dir, "audio_output.wav") 179 | run_all_functions() 180 | 181 | -------------------------------------------------------------------------------- /conversation.py: -------------------------------------------------------------------------------- 1 | # Import libraries 2 | import os 3 | import openai 4 | import credentials 5 | import sys 6 | import pyttsx3 7 | from speech_text_whisper import get_transcript_whisper 8 | openai.api_key = credentials.api_key 9 | import time 10 | import plotext 11 | import numpy as np 12 | import pyaudio 13 | import struct 14 | import wave 15 | from audio_get_channels import get_cur_mic 16 | from scipy.fftpack import fft 17 | 18 | 19 | #%% FUNCTIONS TO BE STORED AWAY 20 | 21 | def audio_spectrum(num_seconds): 22 | script_dir = os.path.dirname(os.path.abspath(__file__)) 23 | 24 | chunk = 4410 25 | channels = 1 26 | fs = 44100 27 | seconds = num_seconds 28 | sample_format = pyaudio.paInt16 29 | filename = os.path.join(script_dir, "audio_output.wav") 30 | 31 | print(f'\n... 
Recording {seconds} seconds of audio initialized ...\n') 32 | 33 | p = pyaudio.PyAudio() 34 | stream = p.open(format=sample_format, 35 | channels=channels, 36 | rate=fs, 37 | input_device_index=get_cur_mic(), 38 | frames_per_buffer=chunk, 39 | input=True) 40 | 41 | 42 | x = np.arange(0, chunk) 43 | x_fft = np.linspace(0, fs / 2, chunk // 2 + 1) 44 | 45 | frames = [] 46 | start_time = time.time() 47 | 48 | while time.time() - start_time < seconds: 49 | plotext.clt() 50 | plotext.cld() 51 | plotext.clc() 52 | 53 | data = stream.read(chunk, False) 54 | frames.append(data) 55 | data_int = struct.unpack(str(2 * chunk) + 'B', data) 56 | data_np = np.array(data_int, dtype='b')[::2] + 128 57 | 58 | y_freq = data_np 59 | spec = fft(data_int) 60 | y_spec = np.abs(np.fft.rfft(data_int)) / chunk 61 | 62 | # plotext.subplots(2, 1) 63 | # plotext.subplot(1, 1) 64 | plotext.plot(x, y_freq, color="white", marker="braille") 65 | # marker braille, fhd, hd, sd, dot, dollar,euro, bitcoin, at, heart, smile, queen, king, 66 | 67 | plotext.plot_size(200, 15) 68 | plotext.ylim(0, 300) 69 | plotext.xlabel(f' {seconds} seconds recording | Elapsed time: {round(time.time() - start_time, 1)} seconds, Time left: {round(seconds - (time.time() - start_time), 1)} seconds') 70 | plotext.yfrequency(2) 71 | plotext.xfrequency(0) 72 | plotext.xlim(0, 4410) 73 | plotext.horizontal_line(128, color="red", yside="top") 74 | 75 | # plotext.subplot(2, 1) 76 | # plotext.plot_size(200, 15) 77 | # plotext.plot(x_fft, y_spec, color="white", marker="braille") 78 | # plotext.ylim(0, 1) 79 | # plotext.xfrequency(2) 80 | # plotext.yfrequency(2) 81 | # plotext.xaxes("log") 82 | plotext.show() 83 | 84 | 85 | # Stop and close the stream 86 | stream.stop_stream() 87 | stream.close() 88 | p.terminate() 89 | 90 | # Save the recorded data as a WAV file 91 | wf = wave.open(filename, 'wb') 92 | wf.setnchannels(channels) 93 | wf.setsampwidth(p.get_sample_size(sample_format)) 94 | wf.setframerate(fs) 95 | wf.writeframes(b''.join(frames)) 96 | wf.close() 97 | 98 | print('\n... Finished recording ...') 99 | 100 | 101 | def get_transcript_whisper(): 102 | '''Get transcript of audio file with whisper api''' 103 | openai.api_key = credentials.api_key 104 | file = open("audio_output.wav", "rb") 105 | transcription = openai.Audio.transcribe("whisper-1", file, response_format="json") 106 | text = transcription["text"] 107 | return text 108 | 109 | def run_GPT3(prompt): 110 | '''Run GPT-3 with the prompt and return the response''' 111 | response = openai.Completion.create( 112 | engine="davinci", 113 | prompt=prompt, 114 | temperature=0.7, 115 | max_tokens=256, 116 | top_p=1, 117 | frequency_penalty=0, 118 | presence_penalty=0 119 | ) 120 | print(response) 121 | return response 122 | 123 | def run_chatGPT(prompt): 124 | '''Run chatGPT with the prompt and return the response''' 125 | completion = openai.ChatCompletion.create( 126 | model="gpt-3.5-turbo", 127 | messages=[ 128 | {"role": "user", "content": prompt} 129 | ] 130 | ) 131 | answer = completion.choices[0].message.content 132 | return answer 133 | 134 | 135 | 136 | #%% CONVERSATION FUNCTIONS 137 | 138 | def start_conversation(): 139 | # Record audio file with function imported from audio_record.py 140 | audio_spectrum(10) 141 | # Get transcript of audio file with whisper api 142 | print(f"\n... Audio transcription ...") 143 | text_output = get_transcript_whisper() 144 | time.sleep(1) 145 | print(f"\n... Text recognition ... \n Text recongized: {text_output}") 146 | print(f"\n... 
ChatGPT prompt ...") 147 | answer = run_chatGPT(text_output) 148 | print(f"\n... ChatGPT answer ... {answer}") 149 | print(f"\n... Text to speech ...") 150 | tts = pyttsx3.init() 151 | tts.setProperty('rate', 110) 152 | tts.say(answer) 153 | tts.runAndWait() 154 | 155 | def feedback_question(): 156 | print(f'... Feedback question ...') 157 | question = f"Do you want to know more about this topic or another one?" 158 | tts = pyttsx3.init() 159 | tts.setProperty('rate', 110) 160 | tts.say(question) 161 | tts.runAndWait() 162 | 163 | def stop_sequence(): 164 | print('... Stop sequence ...') 165 | stop_phrase = f'Well, if you have more questions, you know where to find me. And next time prepare your questions a little better. Goodbye!' 166 | tts = pyttsx3.init() 167 | tts.setProperty('rate', 110) 168 | tts.say(stop_phrase) 169 | tts.runAndWait() 170 | 171 | 172 | def recognize_answer(): 173 | print(f"\n... Listening to answer for 3 seconds ...") 174 | audio_spectrum(3) 175 | text_output = get_transcript_whisper() 176 | print(f"\n... Text recognition \nText recognized: {text_output}") 177 | # if text contains yes restart conversation else stop assistant 178 | restart_keywords = ["yes", "another", "topic", "more", "Yes", "Another", "Topic", "More"] 179 | if any(x in text_output for x in restart_keywords): 180 | print('... Feedback sequence ...') 181 | feedback_phrase = f'Seems like you are interested today. What do you want to know more about?' 182 | tts = pyttsx3.init() 183 | tts.setProperty('rate', 110) 184 | tts.say(feedback_phrase) 185 | tts.runAndWait() 186 | 187 | start_conversation() 188 | feedback_question() 189 | recognize_answer() 190 | else: 191 | stop_sequence() 192 | 193 | 194 | 195 | #%% Start assistant 196 | 197 | print(f"\n--------------------------------- Storyteller assistant started ----------------------------------------- \n") 198 | start_conversation() 199 | time.sleep(1) 200 | feedback_question() 201 | time.sleep(1) 202 | recognize_answer() 203 | print(f"\nxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxx Storyteller assistant stopped xxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxx\n") 204 | 205 | #%% Stop assistant 206 | -------------------------------------------------------------------------------- /pilot_terminal.py: -------------------------------------------------------------------------------- 1 | import plotext 2 | import numpy as np 3 | import pyaudio 4 | import struct 5 | import wave 6 | import time 7 | 8 | from audio_get_channels import get_cur_mic 9 | from audio_get_channels import get_speaker 10 | from scipy.fftpack import fft 11 | import openai 12 | import credentials 13 | import os 14 | import pyttsx3 15 | import threading 16 | import sys 17 | 18 | from rich import print 19 | from rich.progress import track 20 | from rich.console import Console 21 | from rich.columns import Columns 22 | from rich.panel import Panel 23 | 24 | console = Console() 25 | 26 | # ---------------------------------------------------------------- 27 | console.print(f'''\n... RECORDING AUDIO \n\n''', style="bold red") 28 | print(f'''... Testline1\n''') 29 | print(f'''... Testline2\n''') 30 | print(f'''... 
Testline3\n''') 31 | 32 | script_start = time.time() 33 | script_dir = os.path.dirname(os.path.abspath(__file__)) 34 | filename = os.path.join(script_dir, "audio_output.wav") 35 | 36 | # ---------------------------------------------------------------- 37 | def audio_spectrum(num_seconds): 38 |     script_dir = os.path.dirname(os.path.abspath(__file__)) 39 | 40 |     chunk = 2205 41 |     channels = 1 42 |     fs = 44100 43 |     seconds = num_seconds 44 |     sample_format = pyaudio.paInt16 45 |     filename = os.path.join(script_dir, "audio_output.wav") 46 | 47 |     console.print(f'\n... Recording {seconds} seconds of audio initialized ...\n') 48 | 49 |     p = pyaudio.PyAudio() 50 |     stream = p.open(format=sample_format, 51 |                     channels=channels, 52 |                     rate=fs, 53 |                     input_device_index=get_cur_mic(), 54 |                     frames_per_buffer=chunk, 55 |                     input=True) 56 | 57 | 58 |     x = np.arange(0, chunk) 59 |     x_fft = np.linspace(0, fs / 2, chunk // 2 + 1) 60 | 61 |     frames = [] 62 |     start_time = time.time() 63 | 64 | 65 |     while time.time() - start_time < seconds: 66 |         plotext.clear_terminal(lines=10) 67 |         plotext.clear_data() 68 |         plotext.clear_figure() 69 |         plotext.clear_color() 70 | 71 |         # plotext.clt() # to clear the terminal 72 |         # plotext.cld() # to clear the data only 73 |         # plotext.clf() # to clear the figure 74 |         # plotext.clc() # to clear color 75 | 76 |         data = stream.read(chunk, False) 77 |         frames.append(data) 78 |         data_int = struct.unpack(str(2 * chunk) + 'B', data) 79 |         data_np = np.array(data_int, dtype='b')[::2] + 128 80 | 81 |         y_freq = data_np 82 |         spec = fft(data_int) 83 |         y_spec = np.abs(np.fft.rfft(data_int)) / chunk 84 | 85 |         # plotext.subplots(2, 1) 86 |         # plotext.subplot(1, 1) 87 |         plotext.plot(x, y_freq, color="white", marker="braille") 88 |         plotext.title(f'[ {round(seconds - (time.time() - start_time), 1)}s | {seconds}s ]') 89 |         # marker braille, fhd, hd, sd, dot, dollar, euro, bitcoin, at, heart, smile, queen, king, 90 | 91 |         plotext.plot_size(200, 10) 92 |         plotext.ylim(0, 300) 93 | 94 |         plotext.yfrequency(2) 95 |         plotext.xfrequency(0) 96 |         plotext.xlim(0, 2205) 97 |         plotext.horizontal_line(128, color="red", yside="top") 98 | 99 |         # plotext.subplot(2, 1) 100 |         # plotext.plot_size(200, 15) 101 |         # plotext.plot(x_fft, y_spec, color="white", marker="braille") 102 |         # plotext.ylim(0, 1) 103 |         # plotext.xfrequency(2) 104 |         # plotext.yfrequency(2) 105 |         # plotext.xaxes("log") 106 |         plotext.show() 107 | 108 | 109 |     # Stop and close the stream 110 |     stream.stop_stream() 111 |     stream.close() 112 |     p.terminate() 113 | 114 |     # Save the recorded data as a WAV file 115 |     wf = wave.open(filename, 'wb') 116 |     wf.setnchannels(channels) 117 |     wf.setsampwidth(p.get_sample_size(sample_format)) 118 |     wf.setframerate(fs) 119 |     wf.writeframes(b''.join(frames)) 120 |     wf.close() 121 | 122 | 123 | try: 124 |     audio_spectrum(6) 125 | except KeyboardInterrupt: 126 |     pass 127 | 128 | # ----------------------------------------------------------------------------------------- 129 | script_check_1 = time.time() 130 | check_1 = script_check_1 - script_start 131 | console.print(f'\n... Time: {round(check_1, 3)} seconds | Recording finished successfully! 
\n') 132 | # ----------------------------------------------------------------------------------------- 133 | 134 | def get_transcript_whisper(): 135 |     openai.api_key = credentials.api_key 136 |     with open(filename, "rb") as file: 137 |         transcription = openai.Audio.transcribe("whisper-1", file, response_format="json") 138 |     transcribed_text = transcription["text"] 139 |     return transcribed_text 140 | 141 | 142 | text = get_transcript_whisper() 143 | 144 | # Simple substring check: if the text contains a word from the stopword list, the script stops 145 | if any(word in text.lower() for word in ['stop', 'exit', 'quit', 'end', 'no']): 146 |     print(f'''\n... SCRIPT STOPPED BY STOPWORD\n''') 147 |     print(f'''__________________________________________________________________________________________________\n\n''') 148 |     exit() 149 | 150 | 151 | 152 | # ----------------------------------------------------------------------------------------- 153 | script_check_2 = time.time() 154 | check_2 = script_check_2 - script_start 155 | console.print(f'\n... Time: {round(check_2, 3)} seconds | Registered text: \n') 156 | # ---------------------------------------------------------------- 157 | text = f' {text}'  # leading space for a nicer printout 158 | 159 | def print_transcript(): 160 |     for word in text.split(): 161 |         time.sleep(0.27) 162 |         print(word, end=' ', flush=True) 163 | 164 | print_thread = threading.Thread(target=print_transcript)  # pass the function itself, do not call it 165 | print_thread.start() 166 | 167 | def run_chatGPT(prompt): 168 |     '''Run chatGPT with the prompt and return the response''' 169 |     completion = openai.ChatCompletion.create( 170 |         model="gpt-3.5-turbo", 171 |         messages=[ 172 |             {"role": "user", "content": prompt} 173 |         ] 174 |     ) 175 |     answer = completion.choices[0].message.content 176 | 177 |     return answer 178 | 179 | answer = run_chatGPT(text) 180 | print_thread.join()  # make sure the transcript printout has finished before the answer is shown 181 | 182 | # ----------------------------------------------------------------------------------------- 183 | script_check_3 = time.time() 184 | check_3 = script_check_3 - script_start 185 | console.print(f'\n\n... 
Time: {round(check_3, 3)} seconds | ChatGPT Answer: \n') 186 | # ----------------------------------------------------------------------------------------- 187 | 188 | 189 | # Initialize the pyttsx3 engine 190 | engine = pyttsx3.init() 191 | engine.setProperty('rate', 110) 192 | 193 | 194 | # Define a function for speaking the answer 195 | def speak_answer(): 196 |     engine.say(answer) 197 |     engine.runAndWait() 198 | 199 | # Define a function for printing the answer 200 | # It prints the answer word by word; pressing Enter prints the rest of the answer instantly 201 | # (rich, time and sys are already imported at the top of the script) 202 | from pynput import keyboard 203 | 204 | def print_answer(answer): 205 |     break_program = False 206 | 207 |     def on_press(key): 208 |         nonlocal break_program 209 |         if key == keyboard.Key.enter: 210 |             console.print('Printout activated', style='bold red') 211 |             break_program = True 212 |             return False 213 | 214 |     listener = keyboard.Listener(on_press=on_press) 215 |     listener.start() 216 | 217 |     try: 218 |         words = answer.split() 219 |         for i, word in enumerate(words): 220 |             if break_program: 221 |                 # Enter was pressed: print the rest of the answer at once 222 |                 console.print(' '.join(words[i:])) 223 |                 break 224 |             console.print(word, end=' ') 225 |             sys.stdout.flush() 226 |             time.sleep(0.30) 227 |         console.print('\nPrintout completed', style='bold green') 228 |     finally: 229 |         listener.stop() 230 |         listener.join() 231 | 232 | 233 | # Speak the answer in a background thread while it is printed in the foreground 234 | speak_thread = threading.Thread(target=speak_answer) 235 | speak_thread.start() 236 | 237 | print_answer(answer) 238 | speak_thread.join()  # wait until the spoken answer has finished 239 | 240 | # ----------------------------------------------------------------------------------------- 241 | script_check_4 = time.time() 242 | check_4 = script_check_4 - script_start 243 | console.print(f'''\n\n... Time: {round(check_4, 3)} seconds | Chat finished! 
\n''') 267 | 268 | # ----------------------------------------------------------------------------------------- 269 | time.sleep(2) 270 | 271 | # Restart the script 272 | # while True: 273 | 274 | # Restart the program 275 | # python = sys.executable 276 | #os.execl(python, python, *sys.argv, ) 277 | 278 | 279 | -------------------------------------------------------------------------------- /nlp_labelling.ipynb: -------------------------------------------------------------------------------- 1 | { 2 | "cells": [ 3 | { 4 | "cell_type": "code", 5 | "execution_count": 3, 6 | "id": "032fea65", 7 | "metadata": {}, 8 | "outputs": [], 9 | "source": [ 10 | "import spacy" 11 | ] 12 | }, 13 | { 14 | "cell_type": "code", 15 | "execution_count": 9, 16 | "id": "ac1e8c4d", 17 | "metadata": {}, 18 | "outputs": [], 19 | "source": [ 20 | "nlp = spacy.load(\"en_core_web_sm\")" 21 | ] 22 | }, 23 | { 24 | "cell_type": "code", 25 | "execution_count": 15, 26 | "id": "f61ed47b", 27 | "metadata": {}, 28 | "outputs": [ 29 | { 30 | "data": { 31 | "text/plain": [ 32 | "spacy.tokens.doc.Doc" 33 | ] 34 | }, 35 | "execution_count": 15, 36 | "metadata": {}, 37 | "output_type": "execute_result" 38 | } 39 | ], 40 | "source": [ 41 | "story=\"The closest city to your location is Wajir in Kenya. Wajir (Somali: Wajeer) is the capital of the Wajir County of Kenya. It is situated in the former North Eastern Province\"\n", 42 | "doc = nlp(story)\n", 43 | "type(doc)" 44 | ] 45 | }, 46 | { 47 | "cell_type": "code", 48 | "execution_count": 16, 49 | "id": "81cf56c2", 50 | "metadata": {}, 51 | "outputs": [ 52 | { 53 | "name": "stdout", 54 | "output_type": "stream", 55 | "text": [ 56 | "The DET det\n", 57 | "closest ADJ amod\n", 58 | "city NOUN nsubj\n", 59 | "to ADP prep\n", 60 | "your PRON poss\n", 61 | "location NOUN pobj\n", 62 | "is AUX ROOT\n", 63 | "Wajir PROPN attr\n", 64 | "in ADP prep\n", 65 | "Kenya PROPN pobj\n", 66 | ". PUNCT punct\n", 67 | "Wajir PROPN nsubj\n", 68 | "( PUNCT punct\n", 69 | "Somali PROPN nmod\n", 70 | ": PUNCT punct\n", 71 | "Wajeer PROPN appos\n", 72 | ") PUNCT punct\n", 73 | "is AUX ROOT\n", 74 | "the DET det\n", 75 | "capital NOUN attr\n", 76 | "of ADP prep\n", 77 | "the DET det\n", 78 | "Wajir PROPN compound\n", 79 | "County PROPN pobj\n", 80 | "of ADP prep\n", 81 | "Kenya PROPN pobj\n", 82 | ". PUNCT punct\n", 83 | "It PRON nsubjpass\n", 84 | "is AUX auxpass\n", 85 | "situated VERB ROOT\n", 86 | "in ADP prep\n", 87 | "the DET det\n", 88 | "former ADJ amod\n", 89 | "North PROPN compound\n", 90 | "Eastern PROPN compound\n", 91 | "Province PROPN pobj\n" 92 | ] 93 | } 94 | ], 95 | "source": [ 96 | "for token in doc:\n", 97 | " print(token.text, token.pos_, token.dep_)" 98 | ] 99 | }, 100 | { 101 | "cell_type": "code", 102 | "execution_count": 17, 103 | "id": "05288415", 104 | "metadata": {}, 105 | "outputs": [ 106 | { 107 | "data": { 108 | "text/plain": [ 109 | "'determiner'" 110 | ] 111 | }, 112 | "execution_count": 17, 113 | "metadata": {}, 114 | "output_type": "execute_result" 115 | } 116 | ], 117 | "source": [ 118 | "spacy.explain(\"det\")" 119 | ] 120 | }, 121 | { 122 | "cell_type": "code", 123 | "execution_count": 20, 124 | "id": "131f158a", 125 | "metadata": {}, 126 | "outputs": [ 127 | { 128 | "data": { 129 | "text/html": [ 130 | "
\n", 131 | "\n", 144 | "\n", 145 | " \n", 146 | " \n", 147 | " \n", 148 | " \n", 149 | " \n", 150 | " \n", 151 | " \n", 152 | " \n", 153 | " \n", 154 | " \n", 155 | " \n", 156 | " \n", 157 | " \n", 158 | " \n", 159 | " \n", 160 | " \n", 161 | " \n", 162 | " \n", 163 | " \n", 164 | " \n", 165 | " \n", 166 | " \n", 167 | " \n", 168 | " \n", 169 | " \n", 170 | " \n", 171 | " \n", 172 | " \n", 173 | " \n", 174 | " \n", 175 | " \n", 176 | " \n", 177 | " \n", 178 | " \n", 179 | " \n", 180 | " \n", 181 | " \n", 182 | " \n", 183 | " \n", 184 | " \n", 185 | " \n", 186 | " \n", 187 | " \n", 188 | " \n", 189 | " \n", 190 | " \n", 191 | " \n", 192 | " \n", 193 | " \n", 194 | " \n", 195 | " \n", 196 | " \n", 197 | " \n", 198 | " \n", 199 | " \n", 200 | " \n", 201 | " \n", 202 | " \n", 203 | " \n", 204 | " \n", 205 | " \n", 206 | " \n", 207 | " \n", 208 | " \n", 209 | " \n", 210 | " \n", 211 | " \n", 212 | " \n", 213 | " \n", 214 | " \n", 215 | " \n", 216 | " \n", 217 | " \n", 218 | " \n", 219 | " \n", 220 | " \n", 221 | " \n", 222 | " \n", 223 | " \n", 224 | " \n", 225 | " \n", 226 | " \n", 227 | " \n", 228 | " \n", 229 | " \n", 230 | " \n", 231 | " \n", 232 | " \n", 233 | " \n", 234 | " \n", 235 | " \n", 236 | " \n", 237 | " \n", 238 | " \n", 239 | " \n", 240 | " \n", 241 | " \n", 242 | " \n", 243 | " \n", 244 | " \n", 245 | " \n", 246 | " \n", 247 | " \n", 248 | " \n", 249 | " \n", 250 | " \n", 251 | " \n", 252 | " \n", 253 | " \n", 254 | " \n", 255 | " \n", 256 | " \n", 257 | " \n", 258 | " \n", 259 | " \n", 260 | " \n", 261 | " \n", 262 | " \n", 263 | " \n", 264 | " \n", 265 | " \n", 266 | " \n", 267 | " \n", 268 | " \n", 269 | " \n", 270 | " \n", 271 | " \n", 272 | " \n", 273 | " \n", 274 | " \n", 275 | " \n", 276 | " \n", 277 | " \n", 278 | " \n", 279 | " \n", 280 | " \n", 281 | " \n", 282 | " \n", 283 | " \n", 284 | " \n", 285 | " \n", 286 | " \n", 287 | " \n", 288 | " \n", 289 | " \n", 290 | " \n", 291 | " \n", 292 | " \n", 293 | " \n", 294 | " \n", 295 | " \n", 296 | " \n", 297 | " \n", 298 | " \n", 299 | " \n", 300 | " \n", 301 | " \n", 302 | " \n", 303 | " \n", 304 | " \n", 305 | " \n", 306 | " \n", 307 | " \n", 308 | " \n", 309 | " \n", 310 | " \n", 311 | " \n", 312 | " \n", 313 | " \n", 314 | " \n", 315 | " \n", 316 | " \n", 317 | " \n", 318 | " \n", 319 | " \n", 320 | " \n", 321 | " \n", 322 | " \n", 323 | " \n", 324 | " \n", 325 | " \n", 326 | " \n", 327 | " \n", 328 | " \n", 329 | " \n", 330 | " \n", 331 | " \n", 332 | " \n", 333 | " \n", 334 | " \n", 335 | " \n", 336 | " \n", 337 | " \n", 338 | " \n", 339 | " \n", 340 | " \n", 341 | " \n", 342 | " \n", 343 | " \n", 344 | " \n", 345 | " \n", 346 | " \n", 347 | " \n", 348 | " \n", 349 | " \n", 350 | " \n", 351 | " \n", 352 | " \n", 353 | " \n", 354 | " \n", 355 | " \n", 356 | " \n", 357 | " \n", 358 | " \n", 359 | " \n", 360 | " \n", 361 | " \n", 362 | " \n", 363 | " \n", 364 | " \n", 365 | " \n", 366 | " \n", 367 | " \n", 368 | " \n", 369 | " \n", 370 | " \n", 371 | " \n", 372 | " \n", 373 | " \n", 374 | " \n", 375 | " \n", 376 | " \n", 377 | " \n", 378 | " \n", 379 | " \n", 380 | " \n", 381 | " \n", 382 | " \n", 383 | " \n", 384 | " \n", 385 | " \n", 386 | " \n", 387 | " \n", 388 | " \n", 389 | " \n", 390 | " \n", 391 | " \n", 392 | " \n", 393 | " \n", 394 | " \n", 395 | " \n", 396 | " \n", 397 | " \n", 398 | " \n", 399 | " \n", 400 | " \n", 401 | " \n", 402 | " \n", 403 | " \n", 404 | " \n", 405 | " \n", 406 | " \n", 407 | " \n", 408 | " \n", 409 | " \n", 410 | " \n", 411 | " \n", 412 | " \n", 413 | " \n", 414 | " \n", 415 | " \n", 
416 | " \n", 417 | " \n", 418 | " \n", 419 | " \n", 420 | " \n", 421 | " \n", 422 | " \n", 423 | " \n", 424 | " \n", 425 | " \n", 426 | " \n", 427 | " \n", 428 | " \n", 429 | " \n", 430 | " \n", 431 | " \n", 432 | " \n", 433 | " \n", 434 | " \n", 435 | " \n", 436 | " \n", 437 | " \n", 438 | " \n", 439 | " \n", 440 | " \n", 441 | " \n", 442 | " \n", 443 | " \n", 444 | " \n", 445 | " \n", 446 | " \n", 447 | " \n", 448 | " \n", 449 | " \n", 450 | " \n", 451 | " \n", 452 | " \n", 453 | " \n", 454 | " \n", 455 | " \n", 456 | " \n", 457 | " \n", 458 | " \n", 459 | " \n", 460 | " \n", 461 | " \n", 462 | " \n", 463 | " \n", 464 | " \n", 465 | " \n", 466 | " \n", 467 | " \n", 468 | " \n", 469 | " \n", 470 | " \n", 471 | " \n", 472 | " \n", 473 | " \n", 474 | " \n", 475 | " \n", 476 | " \n", 477 | " \n", 478 | " \n", 479 | " \n", 480 | " \n", 481 | " \n", 482 | " \n", 483 | " \n", 484 | " \n", 485 | " \n", 486 | " \n", 487 | " \n", 488 | " \n", 489 | " \n", 490 | " \n", 491 | " \n", 492 | " \n", 493 | " \n", 494 | " \n", 495 | " \n", 496 | " \n", 497 | " \n", 498 | " \n", 499 | " \n", 500 | " \n", 501 | " \n", 502 | " \n", 503 | " \n", 504 | " \n", 505 | " \n", 506 | " \n", 507 | " \n", 508 | " \n", 509 | " \n", 510 | " \n", 511 | " \n", 512 | " \n", 513 | " \n", 514 | " \n", 515 | " \n", 516 | " \n", 517 | " \n", 518 | " \n", 519 | " \n", 520 | " \n", 521 | " \n", 522 | " \n", 523 | " \n", 524 | " \n", 525 | " \n", 526 | " \n", 527 | " \n", 528 | " \n", 529 | " \n", 530 | " \n", 531 | " \n", 532 | " \n", 533 | " \n", 534 | " \n", 535 | " \n", 536 | " \n", 537 | " \n", 538 | " \n", 539 | " \n", 540 | " \n", 541 | " \n", 542 | " \n", 543 | " \n", 544 | " \n", 545 | " \n", 546 | " \n", 547 | " \n", 548 | " \n", 549 | " \n", 550 | " \n", 551 | " \n", 552 | " \n", 553 | " \n", 554 | " \n", 555 | " \n", 556 | " \n", 557 | " \n", 558 | " \n", 559 | " \n", 560 | " \n", 561 | " \n", 562 | " \n", 563 | " \n", 564 | " \n", 565 | " \n", 566 | " \n", 567 | " \n", 568 | " \n", 569 | " \n", 570 | " \n", 571 | " \n", 572 | " \n", 573 | " \n", 574 | " \n", 575 | " \n", 576 | " \n", 577 | " \n", 578 | " \n", 579 | " \n", 580 | " \n", 581 | " \n", 582 | " \n", 583 | " \n", 584 | " \n", 585 | " \n", 586 | " \n", 587 | " \n", 588 | " \n", 589 | " \n", 590 | " \n", 591 | " \n", 592 | " \n", 593 | "
TEXTLEMMAPOSDESCTAGDEPSHAPEALPHASTOP
0ThetheDETdeterminerDTdetXxxTrueTrue
1closestcloseADJadjectiveJJSamodxxxxTrueFalse
2citycityNOUNnounNNnsubjxxxxTrueFalse
3totoADPadpositionINprepxxTrueTrue
4youryourPRONpronounPRP$possxxxxTrueTrue
5locationlocationNOUNnounNNpobjxxxxTrueFalse
6isbeAUXauxiliaryVBZROOTxxTrueTrue
7WajirWajirPROPNproper nounNNPattrXxxxxTrueFalse
8ininADPadpositionINprepxxTrueTrue
9KenyaKenyaPROPNproper nounNNPpobjXxxxxTrueFalse
10..PUNCTpunctuation.punct.FalseFalse
11WajirWajirPROPNproper nounNNPnsubjXxxxxTrueFalse
12((PUNCTpunctuation-LRB-punct(FalseFalse
13SomaliSomaliPROPNproper nounNNPnmodXxxxxTrueFalse
14::PUNCTpunctuation:punct:FalseFalse
15WajeerWajeerPROPNproper nounNNPapposXxxxxTrueFalse
16))PUNCTpunctuation-RRB-punct)FalseFalse
17isbeAUXauxiliaryVBZROOTxxTrueTrue
18thetheDETdeterminerDTdetxxxTrueTrue
19capitalcapitalNOUNnounNNattrxxxxTrueFalse
20ofofADPadpositionINprepxxTrueTrue
21thetheDETdeterminerDTdetxxxTrueTrue
22WajirWajirPROPNproper nounNNPcompoundXxxxxTrueFalse
23CountyCountyPROPNproper nounNNPpobjXxxxxTrueFalse
24ofofADPadpositionINprepxxTrueTrue
25KenyaKenyaPROPNproper nounNNPpobjXxxxxTrueFalse
26..PUNCTpunctuation.punct.FalseFalse
27ItitPRONpronounPRPnsubjpassXxTrueTrue
28isbeAUXauxiliaryVBZauxpassxxTrueTrue
29situatedsituateVERBverbVBNROOTxxxxTrueFalse
30ininADPadpositionINprepxxTrueTrue
31thetheDETdeterminerDTdetxxxTrueTrue
32formerformerADJadjectiveJJamodxxxxTrueTrue
33NorthNorthPROPNproper nounNNPcompoundXxxxxTrueFalse
34EasternEasternPROPNproper nounNNPcompoundXxxxxTrueFalse
35ProvinceProvincePROPNproper nounNNPpobjXxxxxTrueFalse
\n", 594 | "
" 595 | ], 596 | "text/plain": [ 597 | " TEXT LEMMA POS DESC TAG DEP SHAPE ALPHA \\\n", 598 | "0 The the DET determiner DT det Xxx True \n", 599 | "1 closest close ADJ adjective JJS amod xxxx True \n", 600 | "2 city city NOUN noun NN nsubj xxxx True \n", 601 | "3 to to ADP adposition IN prep xx True \n", 602 | "4 your your PRON pronoun PRP$ poss xxxx True \n", 603 | "5 location location NOUN noun NN pobj xxxx True \n", 604 | "6 is be AUX auxiliary VBZ ROOT xx True \n", 605 | "7 Wajir Wajir PROPN proper noun NNP attr Xxxxx True \n", 606 | "8 in in ADP adposition IN prep xx True \n", 607 | "9 Kenya Kenya PROPN proper noun NNP pobj Xxxxx True \n", 608 | "10 . . PUNCT punctuation . punct . False \n", 609 | "11 Wajir Wajir PROPN proper noun NNP nsubj Xxxxx True \n", 610 | "12 ( ( PUNCT punctuation -LRB- punct ( False \n", 611 | "13 Somali Somali PROPN proper noun NNP nmod Xxxxx True \n", 612 | "14 : : PUNCT punctuation : punct : False \n", 613 | "15 Wajeer Wajeer PROPN proper noun NNP appos Xxxxx True \n", 614 | "16 ) ) PUNCT punctuation -RRB- punct ) False \n", 615 | "17 is be AUX auxiliary VBZ ROOT xx True \n", 616 | "18 the the DET determiner DT det xxx True \n", 617 | "19 capital capital NOUN noun NN attr xxxx True \n", 618 | "20 of of ADP adposition IN prep xx True \n", 619 | "21 the the DET determiner DT det xxx True \n", 620 | "22 Wajir Wajir PROPN proper noun NNP compound Xxxxx True \n", 621 | "23 County County PROPN proper noun NNP pobj Xxxxx True \n", 622 | "24 of of ADP adposition IN prep xx True \n", 623 | "25 Kenya Kenya PROPN proper noun NNP pobj Xxxxx True \n", 624 | "26 . . PUNCT punctuation . punct . False \n", 625 | "27 It it PRON pronoun PRP nsubjpass Xx True \n", 626 | "28 is be AUX auxiliary VBZ auxpass xx True \n", 627 | "29 situated situate VERB verb VBN ROOT xxxx True \n", 628 | "30 in in ADP adposition IN prep xx True \n", 629 | "31 the the DET determiner DT det xxx True \n", 630 | "32 former former ADJ adjective JJ amod xxxx True \n", 631 | "33 North North PROPN proper noun NNP compound Xxxxx True \n", 632 | "34 Eastern Eastern PROPN proper noun NNP compound Xxxxx True \n", 633 | "35 Province Province PROPN proper noun NNP pobj Xxxxx True \n", 634 | "\n", 635 | " STOP \n", 636 | "0 True \n", 637 | "1 False \n", 638 | "2 False \n", 639 | "3 True \n", 640 | "4 True \n", 641 | "5 False \n", 642 | "6 True \n", 643 | "7 False \n", 644 | "8 True \n", 645 | "9 False \n", 646 | "10 False \n", 647 | "11 False \n", 648 | "12 False \n", 649 | "13 False \n", 650 | "14 False \n", 651 | "15 False \n", 652 | "16 False \n", 653 | "17 True \n", 654 | "18 True \n", 655 | "19 False \n", 656 | "20 True \n", 657 | "21 True \n", 658 | "22 False \n", 659 | "23 False \n", 660 | "24 True \n", 661 | "25 False \n", 662 | "26 False \n", 663 | "27 True \n", 664 | "28 True \n", 665 | "29 False \n", 666 | "30 True \n", 667 | "31 True \n", 668 | "32 True \n", 669 | "33 False \n", 670 | "34 False \n", 671 | "35 False " 672 | ] 673 | }, 674 | "execution_count": 20, 675 | "metadata": {}, 676 | "output_type": "execute_result" 677 | } 678 | ], 679 | "source": [ 680 | "import pandas as pd\n", 681 | "d = []\n", 682 | "for token in doc:\n", 683 | " d.append({'TEXT': token.text, 'LEMMA': token.lemma_, \n", 684 | " 'POS': token.pos_, 'DESC':spacy.explain(token.pos_),\n", 685 | " 'TAG': token.tag_,\n", 686 | " 'DEP': token.dep_, 'SHAPE': token.shape_,\n", 687 | " 'ALPHA': token.is_alpha, 'STOP': token.is_stop})\n", 688 | "\n", 689 | "spacy_dataframe = pd.DataFrame(d)\n", 690 | "spacy_dataframe" 691 | ] 692 | }, 
693 | { 694 | "cell_type": "code", 695 | "execution_count": 21, 696 | "id": "1cfe12a1", 697 | "metadata": {}, 698 | "outputs": [ 699 | { 700 | "data": { 701 | "text/html": [ 702 | "(displacy dependency-parse SVG omitted: its markup was stripped during export; it visualises the POS tags and dependency arcs already listed in the token table above)\n", 1081 | "" 1082 | ], 1083 | "text/plain": [ 1084 | "<IPython.core.display.HTML object>" 1085 | ] 1086 | }, 1087 | "metadata": {}, 1088 | "output_type": "display_data" 1089 | } 1090 | ], 1091 | "source": [ 1092 | "from spacy import displacy\n", 1093 | "\n", 1094 | "# Show POS tags and syntactic dependencies\n", 1095 | "displacy.render(doc, style=\"dep\", jupyter=True, options={'distance': 100})" 1096 | ] 1097 | }, 1098 | { 1099 | "cell_type": "markdown", 1100 | "id": "67356e31", 1101 | "metadata": {}, 1102 | "source": [ 1103 | "# Categorised Words" 1104 | ] 1105 | }, 1106 | { 1107 | "cell_type": "code", 1108 | "execution_count": 22, 1109 | "id": "73f46389", 1110 | "metadata": {}, 1111 | "outputs": [ 1112 | { 1113 | "name": "stdout", 1114 | "output_type": "stream", 1115 | "text": [ 1116 | "Wajir 37 42 ORG\n", 1117 | "Kenya 46 51 GPE\n", 1118 | "Wajir 53 58 PERSON\n", 1119 | "the Wajir County 94 110 GPE\n", 1120 | "Kenya 114 119 GPE\n", 1121 | "North Eastern Province 150 172 GPE\n" 1122 | ] 1123 | } 1124 | ], 1125 | "source": [ 1126 | "for ent in doc.ents:\n", 1127 | "    print(ent.text, ent.start_char, ent.end_char, ent.label_)" 1128 | ] 1129 | }, 1130 | { 1131 | "cell_type": "code", 1132 | "execution_count": 23, 1133 | "id": "5614619f", 1134 | "metadata": {}, 1135 | "outputs": [ 1136 | { 1137 | "data": { 1138 | "text/html": [ 1139 | "(displacy entity rendering omitted: its markup was stripped during export; it highlights the same ORG, GPE and PERSON spans that the previous cell prints)\n", 1169 | "
" 1170 | ], 1171 | "text/plain": [ 1172 | "" 1173 | ] 1174 | }, 1175 | "metadata": {}, 1176 | "output_type": "display_data" 1177 | } 1178 | ], 1179 | "source": [ 1180 | "displacy.render(doc, style=\"ent\", jupyter=True)" 1181 | ] 1182 | }, 1183 | { 1184 | "cell_type": "code", 1185 | "execution_count": 27, 1186 | "id": "7bd1e6de", 1187 | "metadata": {}, 1188 | "outputs": [], 1189 | "source": [ 1190 | "import spacy\n", 1191 | "nlp2 = spacy.load(\"en_core_web_md\")\n" 1192 | ] 1193 | }, 1194 | { 1195 | "cell_type": "code", 1196 | "execution_count": 38, 1197 | "id": "9923cb4c", 1198 | "metadata": {}, 1199 | "outputs": [], 1200 | "source": [ 1201 | "#Needed Functions\n", 1202 | "from collections import Counter\n", 1203 | "import spacy\n", 1204 | "from spacy.lang.en.stop_words import STOP_WORDS\n", 1205 | "\n", 1206 | "def lemmatize(doc):\n", 1207 | " return [token.lemma_ for token in doc if not\n", 1208 | " (token.is_punct or token.is_space or token.lower_ in STOP_WORDS)]\n", 1209 | "\n", 1210 | "def tf(w, doc):\n", 1211 | " c = 0\n", 1212 | " for token in doc:\n", 1213 | " if token.lemma_ == w:\n", 1214 | " c = c + 1\n", 1215 | " return c\n", 1216 | "\n", 1217 | "def idf(w,docs):\n", 1218 | " c = 0\n", 1219 | " num_docs = len(docs)\n", 1220 | " for doc in docs:\n", 1221 | " if tf(w, doc) > 0:\n", 1222 | " c = c + 1\n", 1223 | " return c / num_docs" 1224 | ] 1225 | }, 1226 | { 1227 | "cell_type": "code", 1228 | "execution_count": 39, 1229 | "id": "c5373530", 1230 | "metadata": {}, 1231 | "outputs": [ 1232 | { 1233 | "name": "stdout", 1234 | "output_type": "stream", 1235 | "text": [ 1236 | "The closest city to your location is Wajir in Kenya. Wajir (Somali: Wajeer) is the capital of the Wajir County of Kenya. It is situated in the former North Eastern Province\n" 1237 | ] 1238 | } 1239 | ], 1240 | "source": [ 1241 | "print(doc)" 1242 | ] 1243 | }, 1244 | { 1245 | "cell_type": "code", 1246 | "execution_count": 44, 1247 | "id": "3f8aec89", 1248 | "metadata": {}, 1249 | "outputs": [ 1250 | { 1251 | "data": { 1252 | "text/plain": [ 1253 | "2" 1254 | ] 1255 | }, 1256 | "execution_count": 44, 1257 | "metadata": {}, 1258 | "output_type": "execute_result" 1259 | } 1260 | ], 1261 | "source": [ 1262 | "#lemmatize(doc)\n", 1263 | "tf(\"Kenya\",doc)" 1264 | ] 1265 | }, 1266 | { 1267 | "cell_type": "code", 1268 | "execution_count": 56, 1269 | "id": "0cf32902", 1270 | "metadata": {}, 1271 | "outputs": [], 1272 | "source": [ 1273 | "from string import punctuation\n", 1274 | "from collections import Counter\n", 1275 | "from heapq import nlargest" 1276 | ] 1277 | }, 1278 | { 1279 | "cell_type": "code", 1280 | "execution_count": 61, 1281 | "id": "17da1522", 1282 | "metadata": {}, 1283 | "outputs": [ 1284 | { 1285 | "data": { 1286 | "text/plain": [ 1287 | "3" 1288 | ] 1289 | }, 1290 | "execution_count": 61, 1291 | "metadata": {}, 1292 | "output_type": "execute_result" 1293 | } 1294 | ], 1295 | "source": [ 1296 | "#How many Sentences\n", 1297 | "len(list(doc.sents))" 1298 | ] 1299 | }, 1300 | { 1301 | "cell_type": "code", 1302 | "execution_count": 63, 1303 | "id": "db1a54dd", 1304 | "metadata": {}, 1305 | "outputs": [], 1306 | "source": [ 1307 | "keyword = [ ]\n", 1308 | "stopwords = list(STOP_WORDS)\n", 1309 | "pos_tag = [ 'PROPN','ADJ', 'NOUN', 'VERB']\n", 1310 | "for token in doc:\n", 1311 | " if(token.text in stopwords or token.text in punctuation):\n", 1312 | " continue\n", 1313 | " if(token.pos_ in pos_tag):\n", 1314 | " keyword. append (token. 
text)" 1315 | ] 1316 | }, 1317 | { 1318 | "cell_type": "code", 1319 | "execution_count": 68, 1320 | "id": "1e5bc7f0", 1321 | "metadata": {}, 1322 | "outputs": [ 1323 | { 1324 | "data": { 1325 | "text/plain": [ 1326 | "Counter({The: 1,\n", 1327 | " closest: 1,\n", 1328 | " city: 1,\n", 1329 | " to: 1,\n", 1330 | " your: 1,\n", 1331 | " location: 1,\n", 1332 | " is: 1,\n", 1333 | " Wajir: 1,\n", 1334 | " in: 1,\n", 1335 | " Kenya: 1,\n", 1336 | " .: 1,\n", 1337 | " Wajir: 1,\n", 1338 | " (: 1,\n", 1339 | " Somali: 1,\n", 1340 | " :: 1,\n", 1341 | " Wajeer: 1,\n", 1342 | " ): 1,\n", 1343 | " is: 1,\n", 1344 | " the: 1,\n", 1345 | " capital: 1,\n", 1346 | " of: 1,\n", 1347 | " the: 1,\n", 1348 | " Wajir: 1,\n", 1349 | " County: 1,\n", 1350 | " of: 1,\n", 1351 | " Kenya: 1,\n", 1352 | " .: 1,\n", 1353 | " It: 1,\n", 1354 | " is: 1,\n", 1355 | " situated: 1,\n", 1356 | " in: 1,\n", 1357 | " the: 1,\n", 1358 | " former: 1,\n", 1359 | " North: 1,\n", 1360 | " Eastern: 1,\n", 1361 | " Province: 1})" 1362 | ] 1363 | }, 1364 | "execution_count": 68, 1365 | "metadata": {}, 1366 | "output_type": "execute_result" 1367 | } 1368 | ], 1369 | "source": [ 1370 | "freq=Counter(doc)\n", 1371 | "freq" 1372 | ] 1373 | }, 1374 | { 1375 | "cell_type": "code", 1376 | "execution_count": null, 1377 | "id": "877feb87", 1378 | "metadata": {}, 1379 | "outputs": [], 1380 | "source": [] 1381 | } 1382 | ], 1383 | "metadata": { 1384 | "kernelspec": { 1385 | "display_name": "Python 3 (ipykernel)", 1386 | "language": "python", 1387 | "name": "python3" 1388 | }, 1389 | "language_info": { 1390 | "codemirror_mode": { 1391 | "name": "ipython", 1392 | "version": 3 1393 | }, 1394 | "file_extension": ".py", 1395 | "mimetype": "text/x-python", 1396 | "name": "python", 1397 | "nbconvert_exporter": "python", 1398 | "pygments_lexer": "ipython3", 1399 | "version": "3.10.7" 1400 | } 1401 | }, 1402 | "nbformat": 4, 1403 | "nbformat_minor": 5 1404 | } 1405 | --------------------------------------------------------------------------------