def pandoc(src, fro="markdown", to="html5"):
    """Convert *src* from one markup format to another with the pandoc CLI.

    The text is piped to ``pandoc --from <fro> --to <to> --section-divs``
    as UTF-8 and pandoc's standard output is returned as a string.

    Arguments:
        src -- The text to convert.
        fro -- pandoc input format name (default "markdown").
        to  -- pandoc output format name (default "html5").

    Returns:
        The converted document as a str. If pandoc exits with a non-zero
        status a warning (including pandoc's stderr) is logged and
        whatever pandoc wrote to stdout is still returned.
    """
    import logging

    result = subprocess.run(
        ["pandoc", "--from", fro, "--to", to, "--section-divs"],
        input=src.encode("utf-8"),
        stdout=subprocess.PIPE,
        stderr=subprocess.PIPE,
    )
    if result.returncode != 0:
        # Do not fail silently: an unnoticed pandoc error would otherwise
        # just show up later as an empty jargon dictionary.
        logging.getLogger(__name__).warning(
            "pandoc exited with status %s: %s",
            result.returncode,
            result.stderr.decode("utf-8", errors="replace").strip(),
        )
    return result.stdout.decode("utf-8")


def read_jargon_dictionary(url):
    """Download a markdown jargon file and turn it into a lookup dictionary.

    The document at *url* is fetched, decoded as UTF-8, converted to HTML
    with pandoc() and split on its level-1 sections. For each section the
    <h1> text is the term, and the definition is the text of the first
    <p> in the section or, when there is no <p>, of the first <ul>.

    Arguments:
        url -- Address of the markdown source (plain text export).

    Returns:
        A dict mapping the upper-cased term to
        ``{'name': <term as written>, 'text': <definition text>}``.
        Sections without a heading or without a <p>/<ul> are skipped.
    """
    # Import the submodule explicitly: a bare ``import urllib`` does not
    # guarantee that ``urllib.request`` is loaded.
    import urllib.request

    # The context manager closes the HTTP response once it has been read.
    with urllib.request.urlopen(url) as response:
        markdown_source = response.read().decode("utf-8")

    html = pandoc(markdown_source)  # markdown -> html5 with <section> wrappers
    soup = BeautifulSoup(html, features="html5lib")

    defs = {}
    for section in soup.find_all('section', {"class": "level1"}):
        heading = section.find("h1")
        body = section.find("p")
        if body is None:
            body = section.find("ul")
        if heading is None or body is None:
            # A term without any definition text cannot be answered;
            # skip it instead of failing on ``None.text``.
            continue
        word = heading.text
        defs[word.upper()] = {'name': word, 'text': body.text}

    return defs


if __name__ == "__main__":
    # Runs only when this file is executed directly,
    # NOT when it is imported by another module.
    from pprint import pprint

    url = "https://pad.xpub.nl/p/jargon-file.test/export/txt"
    defs = read_jargon_dictionary(url)
    print("OUR JARGON DICTIONARY")
    pprint(defs)
class MUCBot(slixmpp.ClientXMPP):
    """
    A simple Slixmpp bot that joins a multi-user chat room and answers
    every message mentioning a known jargon term with that term's
    definition.
    """

    def __init__(self, jid, password, room, nick, output, defs=None):
        """
        Arguments:
            jid      -- JID the bot logs in with.
            password -- Password for that JID.
            room     -- MUC room to join.
            nick     -- Nickname the bot uses inside the room.
            output   -- Output folder; stored on the instance, not used
                        by any method of this class.
            defs     -- Optional jargon dictionary mapping an upper-case
                        term to {'name': ..., 'text': ...}. When omitted,
                        the module-level ``defs`` is looked up at message
                        time.
        """
        slixmpp.ClientXMPP.__init__(self, jid, password)

        self.room = room
        self.nick = nick
        self.output = output
        self.defs = defs

        # The session_start event will be triggered when
        # the bot establishes its connection with the server
        # and the XML streams are ready for use. We want to
        # listen for this event so that we can initialize
        # our roster.
        self.add_event_handler("session_start", self.start)

        # The groupchat_message event is triggered whenever a message
        # stanza is received from any chat room. If you also
        # register a handler for the 'message' event, MUC messages
        # will be processed by both handlers.
        self.add_event_handler("groupchat_message", self.muc_message)

    def start(self, event):
        """
        Process the session_start event.

        Requests the roster, broadcasts an initial presence stanza
        and joins the configured MUC room under the bot's nickname.
        """
        self.get_roster()
        self.send_presence()

        # https://xmpp.org/extensions/xep-0045.html
        self.plugin['xep_0045'].join_muc(self.room,
                                         self.nick,
                                         # If a room password is needed, use:
                                         # password=the_room_password,
                                         wait=True)

    def muc_message(self, msg):
        """
        Process incoming message stanzas from any chat room.

        For every jargon term that occurs as a whole word in the
        message body (case-insensitive), send "<name>: <definition>"
        back to the room. One reply is sent per matching term.

        IMPORTANT: Messages sent by the bot itself are ignored,
                   otherwise the bot would loop forever answering
                   its own replies.

        Arguments:
            msg -- The received message stanza.
        """
        # Always check that a message is not from the bot itself.
        if msg['mucnick'] == self.nick:
            return

        # Prefer the dictionary handed to the constructor; fall back to
        # the module-level ``defs`` that the script entry point creates.
        definitions = self.defs
        if definitions is None:
            definitions = globals().get('defs', {})

        # Keys are stored upper-case, so upper-case the body once.
        body = msg['body'].upper()

        for key, entry in definitions.items():
            if not key:
                # An empty term would match every single message.
                continue
            # Match the term only as a whole word, so that e.g. "IP"
            # does not fire on "SHIP". Look-arounds are used instead of
            # \b so that terms starting or ending with punctuation work.
            pattern = r'(?<!\w)' + re.escape(key) + r'(?!\w)'
            if not re.search(pattern, body):
                continue

            name = entry['name']
            definition = entry['text']
            print(name, definition)

            self.send_message(mto=msg['from'].bare,
                              mbody="{}: {}".format(name, definition),
                              mtype='groupchat')
if __name__ == '__main__':
    # Build the command line interface.
    parser = ArgumentParser()

    # Verbosity switches: both write to ``loglevel`` and default to INFO.
    for flags, text, level in (
            (("-q", "--quiet"), "set logging to ERROR", logging.ERROR),
            (("-d", "--debug"), "set logging to DEBUG", logging.DEBUG)):
        parser.add_argument(*flags, help=text,
                            action="store_const", dest="loglevel",
                            const=level, default=logging.INFO)

    # Account, room and nickname.
    # NOTE(review): the JID and password defaults are hard-coded here, so
    # the interactive prompts further down can never trigger. Consider
    # moving the credentials out of the source.
    parser.add_argument("-j", "--jid", dest="jid",
                        default="pe@please.undo.undo.it",
                        help="JID to use")
    parser.add_argument("-p", "--password", dest="password",
                        default="xpub",
                        help="password to use")
    parser.add_argument("-r", "--room", dest="room",
                        default="xpub@muc.vvvvvvaria.org",
                        help="MUC room to join")
    parser.add_argument("-n", "--nick", dest="nick",
                        default="jargonbot",
                        help="MUC nickname")

    # Output folder for images.
    parser.add_argument("-o", "--output", dest="output",
                        help="output folder, this is where the files are stored",
                        default="./output/", type=str)

    args = parser.parse_args()

    # Load the jargon dictionary. ``defs`` must stay a module-level name:
    # MUCBot.muc_message reads it as a global.
    url = "https://pad.xpub.nl/p/jargon-file.test/export/txt"
    defs = read_jargon_dictionary(url)

    # Configure logging with the level chosen on the command line.
    logging.basicConfig(level=args.loglevel,
                        format='%(levelname)-8s %(message)s')

    # Ask interactively for any setting that is still missing.
    for field, ask, label in (
            ("jid", input, "User: "),
            ("password", getpass, "Password: "),
            ("room", input, "MUC room: "),
            ("nick", input, "MUC nickname: "),
            ("output", input, "Output folder: ")):
        if getattr(args, field) is None:
            setattr(args, field, ask(label))

    # Create the bot and register its plugins. Plugins may depend on
    # each other, but the registration order does not matter.
    xmpp = MUCBot(args.jid, args.password, args.room, args.nick, args.output)
    for plugin in (
            'xep_0030',   # Service Discovery
            'xep_0045',   # Multi-User Chat
            'xep_0199',   # XMPP Ping
            'xep_0066'):  # Process URI's (files, images)
        xmpp.register_plugin(plugin)

    # Connect to the XMPP server and start processing XMPP stanzas.
    xmpp.connect()
    xmpp.process()