├── spider
    ├── Readme.md
    ├── settings.py
    └── main.py
├── beforeact.py
├── dayscats.pickle
├── tweetit.py
├── README.md
├── update.py
└── postlog.log


/spider/Readme.md:
--------------------------------------------------------------------------------
1 | This is the spider, written with Dragline, that fetches the quotes from a well-known website.


--------------------------------------------------------------------------------
/spider/settings.py:
--------------------------------------------------------------------------------
# Settings module for the spider; main.py passes this module to dragline.runner.main.
# NOTE(review): the meaning of each section is defined by Dragline, not by this
# repository -- confirm the available keys against the Dragline documentation.

# Spider-level settings; no overrides are given here.
SPIDER = {

}

# Request-level settings; no overrides are given here.
REQUEST = {

}

# Crawl-level settings.
CRAWL = {
    # presumably disables resuming a previous crawl -- TODO confirm
    "RESUME": False
}
12 | 


--------------------------------------------------------------------------------
/beforeact.py:
--------------------------------------------------------------------------------
 1 | #Code for setting all initial values in a proper manner to start the bot
 2 | import redis
 3 | import pickle
 4 | from pymongo import MongoClient
 5 | import datetime
 6 | 
 7 | #creating mongoclient where quotes are stored in my db
 8 | mydb = MongoClient('localhost')['goodread'] 
 9 | 
10 | #Create a redis instance
11 | red = redis.Redis()
12 | red.set('per_day',120)
13 | red.set('today_balance',0)
14 | red.set('today_or_yesterday',datetime.datetime.today().timetuple().tm_mday)
15 | 
16 | #Storing category names in redis for future use
17 | for i in mydb.collection_names():
18 | 	if i!='system.indexes':
19 | 		for cur in mydb[i].find():
20 | 			red.sadd(i,str(cur['_id']))
21 | 		red.sadd('cats',i)
22 | 
23 | #Creating a dictionary for mapping category to day in a month
24 | days_cats = {i+1:k for i,k in enumerate(red.smembers('cats'))}
25 | 
26 | #Writing that mapping to a pickle file 
27 | with open('dayscats.pickle','wb') as f:
28 | 	pickle.dump(days_cats,f)
29 | 
30 | 
31 | 


--------------------------------------------------------------------------------
/dayscats.pickle:
--------------------------------------------------------------------------------
 1 | (dp0
 2 | I1
 3 | S'art'
 4 | p1
 5 | sI2
 6 | S'humour'
 7 | p2
 8 | sI3
 9 | S'quotes'
10 | p3
11 | sI4
12 | S'books'
13 | p4
14 | sI5
15 | S'politics'
16 | p5
17 | sI6
18 | S'love'
19 | p6
20 | sI7
21 | S'happiness'
22 | p7
23 | sI8
24 | S'relationships'
25 | p8
26 | sI9
27 | S'funny'
28 | p9
29 | sI10
30 | S'death'
31 | p10
32 | sI11
33 | S'humor'
34 | p11
35 | sI12
36 | S'inspiration'
37 | p12
38 | sI13
39 | S'god'
40 | p13
41 | sI14
42 | S'poetry'
43 | p14
44 | sI15
45 | S'writing'
46 | p15
47 | sI16
48 | S'romance'
49 | p16
50 | sI17
51 | S'religion'
52 | p17
53 | sI18
54 | S'reading'
55 | p18
56 | sI19
57 | S'war'
58 | p19
59 | sI20
60 | S'hope'
61 | p20
62 | sI21
63 | S'life'
64 | p21
65 | sI22
66 | S'inspirational'
67 | p22
68 | sI23
69 | S'inspirational-quotes'
70 | p23
71 | sI24
72 | S'philosophy'
73 | p24
74 | sI25
75 | S'wisdom'
76 | p25
77 | sI26
78 | S'women'
79 | p26
80 | sI27
81 | S'faith'
82 | p27
83 | sI28
84 | S'success'
85 | p28
86 | sI29
87 | S'science'
88 | p29
89 | sI30
90 | S'truth'
91 | p30
92 | sI31
93 | S'friendship'
94 | p31
95 | s.


--------------------------------------------------------------------------------
/tweetit.py:
--------------------------------------------------------------------------------
 1 | 
 2 | import tweepy
 3 | 
 4 | #NPG class deals with all housekeeping for creating instances.
 5 | class Tweet:
 6 | 	def __init__(self):
 7 | 		self.auth = tweepy.OAuthHandler(self.consumer_key,self.consumer_secret)
 8 | 		self.auth.set_access_token(self.access_token, self.access_token_secret)
 9 | 		self.handle = tweepy.API(self.auth)
10 | 
11 | 	def get_handle(self):
12 | 		return self.handle
13 | 
14 | 	def hitme(self,str):
15 | 		self.handle.update_status(str)
16 | 		print 'posted succesfully'
17 | 
18 | 	def hit_with_image(self,fil,status=None):
19 | 		self.handle.update_with_media(fil,status=status)
20 | 		print 'Done successfully'
21 | 
22 | 	def rehit(self,str):
23 | 		self.handle.retweet(str)
24 | 		print 'Done successfully'
25 | 
26 | 
27 | 
class QUOTE(Tweet):
    """Twitter credentials for the quote account, read by Tweet.__init__."""

    # Access token and its secret
    access_token='DDDDDDDDDDDDDDDDDDDDDDDDDDDDDDDDDDDDDDDDDDDDDDD'
    access_token_secret='EEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEE'

    # Consumer key and its secret
    consumer_key='HHHHHHHHHHHHHHHHHHHHHHH'
    consumer_secret='IIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIIII'
42 | 
43 | 


--------------------------------------------------------------------------------
/README.md:
--------------------------------------------------------------------------------
 1 | Quotebot
 2 | ========
 3 | 
 4 | A Twitter bot that posts famous quotes every day on Twitter without the intervention of a human operator.
 5 | The main difference between this bot and others is that the data posted is fetched purely by spiders and stored in
 6 | MongoDB.
 7 | 
 8 | Twitter allows only 140 characters of text, but quotes can be much longer. In order to overcome that limit, the quote is converted into an image, which can be uploaded as a media file and serves the purpose.
 9 | 
10 | So this project uses an API to convert the text into an image, and then uploads it to Twitter.
11 | 
12 | The subject of the quotes depends on the day of the month: for example, Love quotes are posted on the 2nd of every month,
13 | Inspiration quotes on the 3rd, etc. At most 120 quotes are posted per day. Every 5 minutes, the bot checks the
14 | connection automatically when the system is active and posts the quote image.
15 | 
16 | Two APIs, the Twitter API and the Img4Me API, are used to achieve the task.  
17 | 
18 | tweetit.py creates a class for encapsulating user details.
19 | beforeact.py does all the housekeeping tasks and gets everything ready for Quotebot to run.
20 | dayscats.pickle contains the mapping of day of the month -> category.
21 | 
22 | postlog.log stores all logs of posted quotes and also network statistics
23 | 


--------------------------------------------------------------------------------
/spider/main.py:
--------------------------------------------------------------------------------
 1 | #!/usr/bin/env python
 2 | from pymongo import MongoClient
 3 | from dragline.runner import main
 4 | from dragline.htmlparser import HtmlParser
 5 | from dragline.http import Request
 6 | import settings
 7 | 
 8 | 
 9 | class Spider:
10 |     mydb = MongoClient(host ="localhost")["goodread"]
11 |     
12 |     def __init__(self, conf):
13 |         self.name = "brainy"
14 |         self.start = "https://www.goodreads.com/quotes"
15 |         self.allowed_domains = ["www.goodreads.com"]
16 |         self.conf = conf
17 | 
18 |     def parse(self,response):
19 |         parser = HtmlParser(response)
20 |         for url in parser.extract_urls('//a[@class="actionLinkLite serif"]'):
21 |             dbname = url.split('/')[-1]
22 |             yield Request(url,callback="parseCat",meta={'u':dbname})
23 | 
24 | 
25 |     def parseCat(self, response):
26 |         parser = HtmlParser(response)
27 |         dbname= response.meta['u']
28 |         if not  parser.xpath('//a[@class="next_page"]'):
29 |             for i in parser.xpath('//div[@class="quoteText"]'):
30 |                 quote = i.text
31 |                 for j in i.iterfind('a'):
32 |                     author=j.text
33 |                 self.mydb[dbname].insert({'quote':quote,'author':author})
34 |         else:
35 |             for i in parser.xpath('//div[@class="quoteText"]'):
36 |                 quote = i.text
37 |                 for j in i.iterfind('a'):
38 |                     author=j.text
39 |                 self.mydb[dbname].insert({'quote':quote,'author':author})
40 |             
41 |             for url in parser.extract_urls('//a[@class="next_page"]'):
42 |                 yield Request(url,callback="parseCat",meta={'u':dbname})
43 | 
# Script entry point: hand the Spider class and the settings module to Dragline's runner.
if __name__ == '__main__':
    main(Spider, settings)
46 | 


--------------------------------------------------------------------------------
/update.py:
--------------------------------------------------------------------------------
 1 | '''
 2 | The heart of the QuoteBot
 3 | Here goes the actual thing. The tasks are done here in the following order:
 4 | 1)Check the post limit
 5 | 2)Fetch quote from database
 6 | 3)Convert it into image(.png) using API 
 7 | 4)Upload it to twitter
 8 | 
 9 | '''
10 | 
11 | #Imports for tweet and store
12 | 
13 | from tweetit import QUOTE
14 | 
15 | import datetime
16 | 
17 | from beforeact import red,mydb
18 | 
19 | import pickle,sys
20 | 
21 | from bson import ObjectId
22 | 
23 | import logging,requests
24 | 
# Send all log records (including those of the requests library) to postlog.log
logging.basicConfig(filename='postlog.log',level=logging.DEBUG)

# Day-of-month -> category mapping written by beforeact.py.
# The file is written with 'wb', so it is read back in binary mode, and the
# `with` block makes sure the handle is closed again.
with open('dayscats.pickle','rb') as f:
    days_cats = pickle.load(f)

quote = QUOTE()

#credentials to be changed
qhandle = quote.get_handle()
33 | 
def return_date():
    """Return today's day of the month as an int, taken from the local date."""
    return datetime.datetime.today().day
37 | 
def today_category():
    """Look up the category mapped to today's day of the month in days_cats."""
    return days_cats[return_date()]
41 | 
#Render a quote as a PNG image through the img4me web API
def generate_quote_image(qs,qid):
    """Convert the text `qs` into a PNG file named `qid` + '.png'.

    The text is sent to api.img4me.com; the body of that response is used as
    the URL of the rendered image, which is then downloaded and written to
    the current working directory.

    Returns the name of the written file.
    Raises a requests exception on a network error, a timeout or an HTTP
    error status, so that an error page is never saved as an image.
    """
    timeout = 30  # seconds; without a timeout a stalled request blocks forever
    filename = qid+'.png'
    payload = {'text':qs,'font':'arial','color':'000000','size':20,'bcolor':'FFFFFF','type':'png'}
    result1 = requests.get('http://api.img4me.com',params=payload,timeout=timeout)
    result1.raise_for_status()
    result2 = requests.get(result1.text.encode('utf-8'),timeout=timeout)
    result2.raise_for_status()
    with open(filename,'wb') as f:
        f.write(result2.content)
    return filename
50 | 
51 | 
def give_quote():
    """Take one unposted quote of today's category and render it as an image.

    Pops a quote id from the Redis set named after today's category, loads
    the matching document from MongoDB and renders "quote\\n---\\nauthor" as a
    PNG through generate_quote_image().

    Returns a dict with the keys 'quote_id', 'quote', 'author', 'message'
    and 'filename'.
    Exits the process (SystemExit) when no quote is available or the image
    cannot be generated; in the latter case the id is put back into the set
    first so that the quote is not lost.
    """
    # Resolve the category once so every step works on the same set.
    category = today_category()
    quote_id = red.spop(category)
    if quote_id is None:
        # spop returns None when the set is empty or missing.
        logging.error('No unposted quotes left in category %s', category)
        sys.exit()

    record = mydb[category].find_one({'_id':ObjectId(quote_id)})
    if record is None:
        logging.error('Quote %s not found in collection %s', quote_id, category)
        sys.exit()

    quote = record['quote'].strip()
    author = record['author']
    message = quote+'\n---\n'+author
    try:
        filename = generate_quote_image(message,quote_id)
    except Exception:
        # Put the id back so the quote can be retried on a later run.
        red.sadd(category,quote_id)
        logging.exception('Could not generate image for quote %s', quote_id)
        sys.exit()
    return {
        'quote_id': quote_id,
        'quote': quote,
        'author': author,
        'message': message,
        'filename': filename,
    }
63 | 
def do_status():
    """Post one quote image to Twitter and record it in Redis.

    On success the quote id is added to the set 'O' + category and the
    'today_balance' counter is incremented. If the upload fails, the id is
    put back into the category set and the process exits (SystemExit).
    """
    details = give_quote()
    category = today_category()
    try:
        qhandle.update_with_media(details['filename'])
    except Exception:
        # Upload failed: return the id to the pool so it is retried later.
        red.sadd(category,details['quote_id'])
        logging.exception('Could not post quote %s', details['quote_id'])
        sys.exit()
    else:
        # Bookkeeping happens only after a successful upload, so a posted
        # quote is never put back into the pool.
        red.sadd('O'+category,details['quote_id'])
        red.incr('today_balance')
73 | 
#Main program which runs one posting cycle of the bot
def run_it():
    """Post one quote if today's limit allows it.

    - If the day stored in 'today_or_yesterday' differs from today, reset
      'today_balance' to 0 and store today's day; nothing is posted in
      that run.
    - Otherwise, if 'today_balance' is below 'per_day', post one quote and
      log the time.
    - Otherwise the daily limit is reached and the process exits.
    """
    today = return_date()
    # Redis returns stored values as strings, so convert before comparing;
    # a string-to-int comparison is always unequal and would reset the
    # counter whenever the limit is reached.
    if int(red.get('today_or_yesterday')) != today:
        red.set('today_balance',0)
        red.set('today_or_yesterday',today)
    elif int(red.get('today_balance'))<int(red.get('per_day')):
        do_status()
        # datetime.now() keeps the time of day; date.today().ctime() always
        # reports 00:00:00.
        logging.debug('Posted at %s'%(datetime.datetime.now().ctime()))
    else:
        #Stop posting once the daily limit is reached
        sys.exit()
85 | 
# Script entry point: each invocation of this file calls run_it() once.
if __name__ == '__main__':
	run_it()
88 | 
89 | 
90 | 
91 | 
92 | 


--------------------------------------------------------------------------------
/postlog.log:
--------------------------------------------------------------------------------
 1 | INFO:requests.packages.urllib3.connectionpool:Starting new HTTP connection (1): api.img4me.com
 2 | DEBUG:requests.packages.urllib3.connectionpool:"GET /?color=000000&text=%E2%80%9CLore+is+my+favorite+kind+of+story.+Because+it%27s+not+only+historical%2C+it%27s+a+lie+everyone+knows+is+a+lie+but+tells+anyway.+I+love+that.+Of+course+every+story+I+tell+is+true.+Completely+true.+Completely+and+utterly+at+least+five-eighths+of+the+way+to+being+true%2C+which+is+truer+than+any+piece+of+lore+and+truer+than+most+truths+you%27ll+hear.%E2%80%9D%0A---%0AKevin+Sampsell+editor+%22Shanghaied%22+by+Gigi+Little&bcolor=FFFFFF&font=arial&type=png&size=20 HTTP/1.1" 200 None
 3 | INFO:requests.packages.urllib3.connectionpool:Starting new HTTP connection (1): api.img4me.com
 4 | DEBUG:requests.packages.urllib3.connectionpool:"GET /?color=000000&text=%E2%80%9CThere+are+many+things+which+can+not+be+expressed+by+words.%0A---%0AToba+Beta&bcolor=FFFFFF&font=arial&type=png&size=20 HTTP/1.1" 200 None
 5 | INFO:requests.packages.urllib3.connectionpool:Starting new HTTP connection (1): api.img4me.com
 6 | DEBUG:requests.packages.urllib3.connectionpool:"GET /?color=000000&text=%E2%80%9CA+disciple%3A+I+am+worried+about+human+suffering+all+over+the+world.+What+is+the+solution%3FSpiritual+leader%3A+The+solution+to+our+miseries+lie+within+central+atom+of+our+being%2C+%E2%80%98I%E2%80%99.+Once+this+central+atom+transcends+to+%E2%80%98WE%E2%80%99%2C+human+sufferings+can+be+resolved.%E2%80%9D%0A---%0ASantosh+Kalwar&bcolor=FFFFFF&font=arial&type=png&size=20 HTTP/1.1" 200 None
 7 | INFO:requests.packages.urllib3.connectionpool:Starting new HTTP connection (1): api.img4me.com
 8 | DEBUG:requests.packages.urllib3.connectionpool:"GET /?color=000000&text=%E2%80%9CWe%E2%80%99re+fine.%E2%80%99%0A---%0ARick+Riordan&bcolor=FFFFFF&font=arial&type=png&size=20 HTTP/1.1" 200 None
 9 | INFO:requests.packages.urllib3.connectionpool:Starting new HTTP connection (1): img4me.com
10 | DEBUG:requests.packages.urllib3.connectionpool:"GET /HMSUa.png HTTP/1.1" 200 3641
11 | INFO:requests.packages.urllib3.connectionpool:Starting new HTTP connection (1): api.img4me.com
12 | DEBUG:requests.packages.urllib3.connectionpool:"GET /?color=000000&text=%E2%80%9CWorship+your+body%2C+beauty%2C+and+sexual+allure+and+you+will+die+a+million+deaths+before+they+finally+grieve+you.%E2%80%9D%0A---%0ADavid+Foster+Wallace&bcolor=FFFFFF&font=arial&type=png&size=20 HTTP/1.1" 200 None
13 | INFO:requests.packages.urllib3.connectionpool:Starting new HTTP connection (1): img4me.com
14 | DEBUG:requests.packages.urllib3.connectionpool:"GET /2kY.png HTTP/1.1" 200 13833
15 | INFO:requests.packages.urllib3.connectionpool:Starting new HTTP connection (1): api.img4me.com
16 | DEBUG:requests.packages.urllib3.connectionpool:"GET /?color=000000&text=%E2%80%9CWhen+you+are+beloved+and+express+gratitude+like+the+fragrance+of+a+beautiful+flower%2C+you+are+happy.%E2%80%9D%0A---%0ADebasish+Mridha&bcolor=FFFFFF&font=arial&type=png&size=20 HTTP/1.1" 200 None
17 | INFO:requests.packages.urllib3.connectionpool:Starting new HTTP connection (1): img4me.com
18 | DEBUG:requests.packages.urllib3.connectionpool:"GET /nv5XV.png HTTP/1.1" 200 12935
19 | INFO:requests.packages.urllib3.connectionpool:Starting new HTTP connection (1): api.img4me.com
20 | DEBUG:requests.packages.urllib3.connectionpool:"GET /?color=000000&text=%E2%80%9CCressida%3A+My+lord%2C+will+you+be+true%3F%0A---%0AWilliam+Shakespeare&bcolor=FFFFFF&font=arial&type=png&size=20 HTTP/1.1" 200 None
21 | INFO:requests.packages.urllib3.connectionpool:Starting new HTTP connection (1): img4me.com
22 | DEBUG:requests.packages.urllib3.connectionpool:"GET /x3YD.png HTTP/1.1" 200 7741
23 | INFO:requests.packages.urllib3.connectionpool:Starting new HTTP connection (1): api.img4me.com
24 | DEBUG:requests.packages.urllib3.connectionpool:"GET /?color=FFFFE0&text=%E2%80%9CA+PRIME+TRUTH+-+MAN+IS+SELFISH%0A---%0AWilliam+J.+Federer&bcolor=32CD32&font=arial&type=png&size=20 HTTP/1.1" 200 None
25 | INFO:requests.packages.urllib3.connectionpool:Starting new HTTP connection (1): img4me.com
26 | DEBUG:requests.packages.urllib3.connectionpool:"GET /rbUxwwTk.png HTTP/1.1" 200 6165
27 | DEBUG:root:Posted at Sun Nov 30 00:00:00 2014
28 | INFO:requests.packages.urllib3.connectionpool:Starting new HTTP connection (1): api.img4me.com
29 | DEBUG:requests.packages.urllib3.connectionpool:"GET /?color=000000&text=%E2%80%9CExperience+has+taught+us+that+we+have+only+one+enduring+weapon+in+our+struggle+against+mental+illness%3A+the+emotional+discovery+and+emotional+acceptance+of+the+truth+in+the+individual+and+unique+history+of+our+childhood.%E2%80%9D%0A---%0AAlice++Miller&bcolor=FFFFFF&font=arial&type=png&size=20 HTTP/1.1" 200 None
30 | INFO:requests.packages.urllib3.connectionpool:Starting new HTTP connection (1): img4me.com
31 | DEBUG:requests.packages.urllib3.connectionpool:"GET /Qf9pK.png HTTP/1.1" 200 18340
32 | DEBUG:root:Posted at Sun Nov 30 00:00:00 2014
33 | INFO:requests.packages.urllib3.connectionpool:Starting new HTTP connection (1): api.img4me.com
34 | DEBUG:requests.packages.urllib3.connectionpool:"GET /?color=000000&text=%E2%80%9CSometimes+what+we+want+isn%27t+what+we+need.%E2%80%9D%0A---%0AGena+Showalter&bcolor=FFFFFF&font=arial&type=png&size=20 HTTP/1.1" 200 None
35 | INFO:requests.packages.urllib3.connectionpool:Starting new HTTP connection (1): img4me.com
36 | DEBUG:requests.packages.urllib3.connectionpool:"GET /CWqRMmF.png HTTP/1.1" 200 7089
37 | DEBUG:root:Posted at Sun Nov 30 00:00:00 2014
38 | INFO:requests.packages.urllib3.connectionpool:Starting new HTTP connection (1): api.img4me.com
39 | DEBUG:requests.packages.urllib3.connectionpool:"GET /?color=000000&text=%E2%80%9CTo+love+someone+with+all+of+your+heart+requires+reaching+them+where+they+are+with+the+only+words+they+can+understand.%E2%80%9D%0A---%0AShannon+L.+Alder&bcolor=FFFFFF&font=arial&type=png&size=20 HTTP/1.1" 200 None
40 | INFO:requests.packages.urllib3.connectionpool:Starting new HTTP connection (1): img4me.com
41 | DEBUG:requests.packages.urllib3.connectionpool:"GET /CFiVqqkP.png HTTP/1.1" 200 12928
42 | DEBUG:root:Posted at Sun Nov 30 00:00:00 2014
43 | 


--------------------------------------------------------------------------------