├── HashtagAnalysis
├── .classpath
├── .project
├── .settings
│ └── org.eclipse.jdt.core.prefs
├── HashtagAnalysis.xls
├── bin
│ ├── HMapper.class
│ ├── HReducer.class
│ └── HashtagAnalysis.class
├── build.xml
├── classes
│ ├── HMapper.class
│ ├── HReducer.class
│ └── HashtagAnalysis.class
├── dist
│ └── HashtagAnalysis.jar
├── out
│ └── HashtagAnalysis.txt
└── src
│ ├── HMapper.java
│ ├── HReducer.java
│ └── HashtagAnalysis.java
├── README.md
├── Report.pdf
├── TextAnalysis
├── .classpath
├── .project
├── .settings
│ └── org.eclipse.jdt.core.prefs
├── TextAnalysis.xls
├── bin
│ ├── TMapper.class
│ ├── TReducer.class
│ └── TextAnalysis.class
├── build.xml
├── classes
│ ├── TMapper.class
│ ├── TReducer.class
│ └── TextAnalysis.class
├── dist
│ └── TextAnalysis.jar
├── out
│ ├── TextAnalysis0.txt
│ └── TextAnalysis1.txt
└── src
│ ├── TMapper.java
│ ├── TReducer.java
│ └── TextAnalysis.java
├── TextAnalysisAvg
├── .classpath
├── .project
├── .settings
│ └── org.eclipse.jdt.core.prefs
├── bin
│ ├── TAvgMapper.class
│ ├── TAvgReducer.class
│ ├── TextAnalysisAvg.class
│ └── inintpair
│ │ └── IntIntPair.class
├── build.xml
├── classes
│ ├── TAvgMapper.class
│ ├── TAvgReducer.class
│ ├── TextAnalysisAvg.class
│ └── inintpair
│ │ └── IntIntPair.class
├── dist
│ └── TextAnalysisAvg.jar
├── out
│ └── TextAnalysisAvg.txt
└── src
│ ├── TAvgMapper.java
│ ├── TAvgReducer.java
│ ├── TextAnalysisAvg.java
│ └── inintpair
│ └── IntIntPair.java
└── TimeAnalysis
├── .classpath
├── .project
├── .settings
└── org.eclipse.jdt.core.prefs
├── TimeAnalysis.xls
├── bin
├── TimeAnalysis.class
├── TimeMapper.class
└── TimeReducer.class
├── build.xml
├── classes
├── TimeAnalysis.class
├── TimeMapper.class
└── TimeReducer.class
├── dist
└── TimeAnalysis.jar
├── out
└── TimeAnalysis.txt
└── src
├── TimeAnalysis.java
├── TimeMapper.java
└── TimeReducer.java
/HashtagAnalysis/.classpath:
--------------------------------------------------------------------------------
1 |
2 |
3 |
4 |
5 |
6 |
7 |
8 |
9 |
10 |
11 |
12 |
13 |
14 |
15 |
16 |
17 |
18 |
19 |
20 |
21 |
22 |
23 |
24 |
25 |
26 |
27 |
28 |
29 |
30 |
31 |
32 |
33 |
34 |
35 |
36 |
37 |
38 |
39 |
40 |
41 |
42 |
43 |
44 |
45 |
46 |
47 |
48 |
49 |
50 |
51 |
52 |
53 |
54 |
55 |
56 |
57 |
58 |
59 |
60 |
61 |
62 |
63 |
64 |
65 |
66 |
67 |
68 |
69 |
70 |
71 |
72 |
73 |
74 |
75 |
76 |
77 |
78 |
79 |
80 |
81 |
82 |
83 |
84 |
85 |
86 |
87 |
88 |
89 |
90 |
91 |
92 |
93 |
94 |
95 |
96 |
97 |
98 |
99 |
100 |
101 |
102 |
103 |
104 |
105 |
106 |
107 |
108 |
109 |
110 |
--------------------------------------------------------------------------------
/HashtagAnalysis/.project:
--------------------------------------------------------------------------------
1 |
2 |
3 | HashtagAnalysis
4 |
5 |
6 |
7 |
8 |
9 | org.eclipse.jdt.core.javabuilder
10 |
11 |
12 |
13 |
14 |
15 | org.eclipse.jdt.core.javanature
16 |
17 |
18 |
--------------------------------------------------------------------------------
/HashtagAnalysis/.settings/org.eclipse.jdt.core.prefs:
--------------------------------------------------------------------------------
1 | eclipse.preferences.version=1
2 | org.eclipse.jdt.core.compiler.codegen.inlineJsrBytecode=enabled
3 | org.eclipse.jdt.core.compiler.codegen.targetPlatform=1.7
4 | org.eclipse.jdt.core.compiler.codegen.unusedLocal=preserve
5 | org.eclipse.jdt.core.compiler.compliance=1.7
6 | org.eclipse.jdt.core.compiler.debug.lineNumber=generate
7 | org.eclipse.jdt.core.compiler.debug.localVariable=generate
8 | org.eclipse.jdt.core.compiler.debug.sourceFile=generate
9 | org.eclipse.jdt.core.compiler.problem.assertIdentifier=error
10 | org.eclipse.jdt.core.compiler.problem.enumIdentifier=error
11 | org.eclipse.jdt.core.compiler.source=1.7
12 |
--------------------------------------------------------------------------------
/HashtagAnalysis/HashtagAnalysis.xls:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/Zhanelya/Big-Data-Project/98396ba359a10c2b90b22bcce8d8cf8f014c1f05/HashtagAnalysis/HashtagAnalysis.xls
--------------------------------------------------------------------------------
/HashtagAnalysis/bin/HMapper.class:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/Zhanelya/Big-Data-Project/98396ba359a10c2b90b22bcce8d8cf8f014c1f05/HashtagAnalysis/bin/HMapper.class
--------------------------------------------------------------------------------
/HashtagAnalysis/bin/HReducer.class:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/Zhanelya/Big-Data-Project/98396ba359a10c2b90b22bcce8d8cf8f014c1f05/HashtagAnalysis/bin/HReducer.class
--------------------------------------------------------------------------------
/HashtagAnalysis/bin/HashtagAnalysis.class:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/Zhanelya/Big-Data-Project/98396ba359a10c2b90b22bcce8d8cf8f014c1f05/HashtagAnalysis/bin/HashtagAnalysis.class
--------------------------------------------------------------------------------
/HashtagAnalysis/build.xml:
--------------------------------------------------------------------------------
1 |
2 |
3 | Sample MapReduce project build file
4 |
5 |
6 |
7 |
8 |
9 |
10 |
11 |
12 |
13 |
14 |
15 |
16 |
17 |
18 |
19 |
20 |
21 |
22 |
23 |
24 |
25 |
26 |
27 |
28 |
29 |
30 |
31 |
32 |
33 |
34 |
35 |
36 |
37 |
38 |
39 |
40 |
41 |
42 |
43 |
44 |
45 |
46 |
47 |
48 |
49 |
50 |
--------------------------------------------------------------------------------
/HashtagAnalysis/classes/HMapper.class:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/Zhanelya/Big-Data-Project/98396ba359a10c2b90b22bcce8d8cf8f014c1f05/HashtagAnalysis/classes/HMapper.class
--------------------------------------------------------------------------------
/HashtagAnalysis/classes/HReducer.class:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/Zhanelya/Big-Data-Project/98396ba359a10c2b90b22bcce8d8cf8f014c1f05/HashtagAnalysis/classes/HReducer.class
--------------------------------------------------------------------------------
/HashtagAnalysis/classes/HashtagAnalysis.class:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/Zhanelya/Big-Data-Project/98396ba359a10c2b90b22bcce8d8cf8f014c1f05/HashtagAnalysis/classes/HashtagAnalysis.class
--------------------------------------------------------------------------------
/HashtagAnalysis/dist/HashtagAnalysis.jar:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/Zhanelya/Big-Data-Project/98396ba359a10c2b90b22bcce8d8cf8f014c1f05/HashtagAnalysis/dist/HashtagAnalysis.jar
--------------------------------------------------------------------------------
/HashtagAnalysis/out/HashtagAnalysis.txt:
--------------------------------------------------------------------------------
1 | 224
2 | 22indonesia 204
3 | 4gold 1916
4 | 4goldindia 255
5 | _gb 499
6 | africa 770
7 | al 394
8 | america 572
9 | at 989
10 | aus 920
11 | aussie 2261
12 | aussies 8216
13 | australia 1212
14 | autofollow 403
15 | bahamas 559
16 | bears 485
17 | belgium 505
18 | bg 244
19 | blake 200
20 | bletoffire 5276
21 | blue 662
22 | bolt 2007
23 | boomers 341
24 | boomersgo 255
25 | botswana 227
26 | brasil 749
27 | brazil 1441
28 | brijamada 300
29 | cana 218
30 | canad 216
31 | canada 19218
32 | canadago 9067
33 | caribbean 807
34 | caster 1426
35 | cav 510
36 | china 1177
37 | croatia 431
38 | d 333
39 | daley 671
40 | dblessamerica 451
41 | dsavethequeen 809
42 | ducks 469
43 | egypt 1107
44 | ennis 256
45 | ethiopia 1651
46 | fair2012 675
47 | federer 502
48 | follback 292
49 | followback 9000
50 | forgold 6163
51 | forthegold 865
52 | france 1224
53 | g 367
54 | gabby 1270
55 | gators 483
56 | gav 201
57 | gb 398581
58 | gbboxing 247
59 | gbfootball 224
60 | gbgymnastics 508
61 | gbr 624
62 | germany 532
63 | ghana 426
64 | girl 886
65 | girls 1194
66 | gold 386
67 | greatbritain 288
68 | green 331
69 | grenada 945
70 | haiti 740
71 | holland 206
72 | hungary 827
73 | ina 470
74 | india 1434
75 | indonesia 2442
76 | inforgold 400
77 | ingforgold 3608
78 | ingforthegold 294
79 | iran 570
80 | ireland 17798
81 | israel 1048
82 | italy 1052
83 | ja 1167
84 | jamaica 21033
85 | japan 985
86 | jess 561
87 | jet 223
88 | jo 370
89 | katie 1355
90 | kb24 215
91 | kenya 11152
92 | korea 515
93 | l 252
94 | latvia 582
95 | ld 63486
96 | ldbitches 1111
97 | lden 2393
98 | ldengirl 652
99 | ldengirls 514
100 | ldenhoy 1895
101 | ldformalaysia 233
102 | ldforsure 513
103 | ldgoldgold 258
104 | ldmedal 8328
105 | ldmedalgame 306
106 | ldmedalist 3350
107 | ldmedalmatch 398
108 | ldmedals 731
109 | ldmedalstamp 354
110 | ldmedalstamps 1051
111 | ldmetal 231
112 | ldorbust 1009
113 | ldpostbox 252
114 | ldrush 2005
115 | lds 227
116 | ldwednesday 9431
117 | lebron 1069
118 | lf 624
119 | lfclap 228
120 | libra 233
121 | lochte 1450
122 | ltu 392
123 | malaysia 9077
124 | matty 287
125 | mexico 1355
126 | mo 9936
127 | mogo 260
128 | mongolia 1673
129 | murray 519
130 | naija 403
131 | ne 334
132 | nieto 241
133 | nigeria 5716
134 | nl 2632
135 | nz 695
136 | od 355
137 | odbye 268
138 | odday 222
139 | odjob 326
140 | odluck 1196
141 | odlucktom 206
142 | odnight 407
143 | odolddays 1925
144 | odtimes 726
145 | odyearformgar 13590
146 | ogle 3787
147 | ogledoodle 853
148 | olympicmas 408
149 | on 202
150 | oner 241
151 | onerontour 300
152 | onjj 204
153 | opals 625
154 | opalsgo 221
155 | osebumps 1272
156 | p 969
157 | pakistan 475
158 | paralympicsgb 1128
159 | ph 2716
160 | phelps 2270
161 | philippines 1604
162 | pilipinas 215
163 | pinas 340
164 | poland 575
165 | puertorico 753
166 | pursuit 337
167 | qatar 1077
168 | rgeous 513
169 | rin 21317
170 | roger 255
171 | rsa 247
172 | russia 2093
173 | sa 10801
174 | sally 310
175 | samsung 208
176 | scotland 203
177 | serbia 303
178 | sheikie 247
179 | singapore 785
180 | skank 230
181 | somalia 324
182 | southafrica 717
183 | spain 550
184 | sprint 227
185 | ssip 1072
186 | supermodel 653
187 | sweden 206
188 | tea 3314
189 | tn 764
190 | tom 2335
191 | turkey 391
192 | twin 352
193 | u 488
194 | ud 558
195 | uganda 728
196 | uk 232
197 | us 545
198 | usa 203459
199 | usabasketball 265
200 | ve 302
201 | wiggo 544
202 | wor 274
203 | world 583
204 | yorkshire 729
205 | zimbabwe 286
206 |
--------------------------------------------------------------------------------
/HashtagAnalysis/src/HMapper.java:
--------------------------------------------------------------------------------
1 | import java.io.IOException;
2 |
3 | import org.apache.commons.lang.StringUtils;
4 | import org.apache.hadoop.io.IntWritable;
5 | import org.apache.hadoop.io.Text;
6 | import org.apache.hadoop.mapreduce.Mapper;
7 |
8 | import java.util.regex.Matcher;
9 | import java.util.regex.Pattern;
10 |
11 | public class HMapper extends Mapper