find book on worldcat

2019-05-02 23:13:28 +02:00 · 2019-05-02 23:13:28 +02:00 · 48ddeba22c
commit 48ddeba22c
parent 6a60f925a4
1 changed files with 60 additions and 7 deletions
--- a/logbot.py
+++ b/logbot.py
@ -14,7 +14,7 @@ import ssl, os, requests, urllib

 class MUCBot(slixmpp.ClientXMPP):
 	"""
-	A simple Slixmpp bot that will save images 
+	A simple Slixmpp bot that will save images
 	and messages that are marked with @bot to a folder.
 	"""

@ -55,7 +55,7 @@ class MUCBot(slixmpp.ClientXMPP):

 	def muc_message(self, msg):
 		# Some inspection commands
-		# print('Message: {}'.format(msg))
+		print('Message: {}'.format(msg))

 		# Always check that a message is not the bot itself, otherwise you will create an infinite loop responding to your own messages.
 		if msg['mucnick'] != self.nick:
@ -72,13 +72,13 @@ class MUCBot(slixmpp.ClientXMPP):
 				self.send_message(mto=self.room,
 								  mbody="Super, our log is growing. Your image is added!",
 								  mtype='groupchat')
-				
+
 				# Save the image to the output folder
 				url = msg['oob']['url'] # grep the url in the message
 				filename = os.path.basename(url) # grep the filename in the url
 				output_path = os.path.join(self.output, filename)
 				u = urllib.request.urlopen(url) # read the image data
-				f = open(output_path, 'wb') # open the output file 
+				f = open(output_path, 'wb') # open the output file
 				f.write(u.read()) # write image to file
 				f.close() # close the output file

@ -107,6 +107,60 @@ class MUCBot(slixmpp.ClientXMPP):
 				f.write(message+'\n')
 				f.close()

+				if '/book' in msg['body']: # Check if this is a book
+
+					self.send_message(mto=self.room,
+									  mbody="Oh a book, that's cool! Thanks {}!".format(msg['mucnick']),
+									  mtype='groupchat')
+
+
+				from bs4 import BeautifulSoup
+				import requests
+				import re
+
+				book = msg['body'].replace('@bot', '').replace('/book', '')
+				book = re.sub(' +', ' ', book) # remove double spaces
+				book = book.lstrip().rstrip() # remove spaces at the beginning and at the end
+				book = book.replace(' ', '+').lower() # turn space into + and lowercase
+
+				page_link = 'https://www.worldcat.org/search?q={}&qt=results_page'.format(book)
+
+				page_response = requests.get(page_link, timeout=5)
+
+				page_content = BeautifulSoup(page_response.content, "html.parser")
+
+				try:
+					book_title = page_content.findAll("div", {"class": "name"})[0].text
+					book_author = page_content.findAll("div", {"class": "author"})[0].text
+					book_publisher = page_content.findAll("div", {"class": "publisher"})[0].text
+
+					response = '<b>BOOK</b>: ' + book_title + ' ' + book_author + ' ' + book_publisher
+
+					book_found = True
+
+				except IndexError:
+
+					book_found = False
+
+				if book_found:
+
+					# Add message to log
+					message = '<b>BOOK</b>: ' + book_title + ' ' + book_author + ' ' + book_publisher
+					log = 'log.html'
+					log_path = os.path.join(self.output, log)
+					f = open(log_path, 'a+')
+					f.write(message+'\n')
+					f.close()
+
+					self.send_message(mto=self.room, mbody='Hope this was the book you were looking for: ' + book_title + ' ' + book_author + ' ' + book_publisher, mtype='groupchat')
+
+				else:
+
+					self.send_message(mto=self.room, mbody='Sorry, no book found!', mtype='groupchat')
+
+
+
+
 if __name__ == '__main__':
 	# Setup the command line arguments.
 	parser = ArgumentParser()
@ -130,8 +184,8 @@ if __name__ == '__main__':
 						help="MUC nickname")

 	# output folder for images
-	parser.add_argument("-o", "--output", dest="output", 
-						help="output folder, this is where the files are stored", 
+	parser.add_argument("-o", "--output", dest="output",
+						help="output folder, this is where the files are stored",
 						type=str)

 	args = parser.parse_args()
@ -163,4 +217,3 @@ if __name__ == '__main__':
 	# Connect to the XMPP server and start processing XMPP stanzas.
 	xmpp.connect()
 	xmpp.process()
-