merge jargon branch to merge
#1
Merged
onebigear
merged 1 commits from jargonbot
into master
6 years ago
@ -0,0 +1,65 @@
|
||||
#!/usr/bin/env python3
|
||||
import os, requests, urllib, subprocess
|
||||
from bs4 import BeautifulSoup
|
||||
|
||||
def pandoc(src, fro="markdown", to="html5"):
    """
    Convert a document with the external ``pandoc`` program.

    Arguments:
        src -- The document text (str); it is sent to pandoc's stdin
               encoded as UTF-8.
        fro -- Pandoc input format name (default "markdown").
        to  -- Pandoc output format name (default "html5").

    Returns:
        The converted document (pandoc's stdout decoded as UTF-8).
        ``--section-divs`` is always passed to pandoc.

    Raises:
        RuntimeError -- pandoc exited with a non-zero status; the message
                        carries pandoc's stderr so the failure is visible
                        instead of silently producing an empty result.
    """
    result = subprocess.run(
        ["pandoc", "--from", fro, "--to", to, "--section-divs"],
        input=src.encode("utf-8"),
        stdout=subprocess.PIPE,
        stderr=subprocess.PIPE,
    )
    if result.returncode != 0:
        raise RuntimeError(
            "pandoc exited with status {}: {}".format(
                result.returncode,
                result.stderr.decode("utf-8", errors="replace").strip(),
            )
        )
    return result.stdout.decode("utf-8")
|
||||
|
||||
|
||||
def read_jargon_dictionary(url):
    """
    Download a markdown jargon file and turn it into a lookup dictionary.

    The text found at ``url`` is converted to HTML with pandoc(). Every
    ``<section class="level1">`` of that HTML becomes one entry: the text
    of its <h1> is the term, and the text of its first <p> (or, when
    there is no <p>, its first <ul>) is the definition.

    Arguments:
        url -- Address of the UTF-8 encoded markdown text to download.

    Returns:
        A dict mapping the upper-cased term to
        ``{'name': <term as written>, 'text': <definition text>}``.
        Sections that lack a heading or a definition are skipped.
    """
    # Imported explicitly: a bare ``import urllib`` is not guaranteed to
    # load the ``urllib.request`` submodule.
    from urllib.request import urlopen

    # The context manager closes the HTTP response once it has been read.
    with urlopen(url) as response:
        markdown = response.read().decode("utf-8")

    html = pandoc(markdown)  # convert from markdown to html
    soup = BeautifulSoup(html, features="html5lib")

    defs = {}
    for section in soup.find_all('section', {"class": "level1"}):
        heading = section.find("h1")
        definition = section.find("p")
        if definition is None:
            definition = section.find("ul")

        # Without both a heading and a definition there is nothing to store.
        if heading is None or definition is None:
            continue

        word = heading.text  # e.g. "TCP"
        defs[word.upper()] = {'name': word, 'text': definition.text}

    return defs
|
||||
|
||||
if __name__ == "__main__":
    # Executed only when this file is run as a script,
    # never when it is imported as a module.
    from pprint import pprint

    # Fetch the test pad, build the dictionary, then dump it for inspection.
    url = "https://pad.xpub.nl/p/jargon-file.test/export/txt"
    defs = read_jargon_dictionary(url)

    print("OUR JARGON DICTIONARY")
    pprint(defs)
|
||||
# print(defs["UDP"])
|
||||
|
||||
# cmd = '#TCP'
|
||||
# query = cmd.replace('#','')
|
||||
# for header in soup('h1'):
|
||||
# if query in header.string:
|
||||
# print(header.string)
|
||||
# print('---')
|
||||
|
||||
# cmd = '#UDP'
|
||||
# query = cmd.replace('#','')
|
||||
# for header in soup('h1'):
|
||||
# if query in header.string:
|
||||
# print(header.string)
|
||||
# print('---')
|
@ -0,0 +1,190 @@
|
||||
#!/usr/bin/env python3
|
||||
# -*- coding: utf-8 -*-
|
||||
|
||||
"""
|
||||
Slixmpp: The Slick XMPP Library
|
||||
Copyright (C) 2010 Nathanael C. Fritz
|
||||
This file is part of Slixmpp.
|
||||
|
||||
See the file LICENSE for copying permission.
|
||||
"""
|
||||
|
||||
# Code source: https://git.poez.io/slixmpp/tree/examples/muc.py
|
||||
|
||||
# To run this bot:
|
||||
# $ python3 streambot.py --jid username@yourdomainname.ext --password password --room channel@groups.domainname.ext --nick nickname --output ./output/
|
||||
|
||||
|
||||
import logging
|
||||
from getpass import getpass
|
||||
from argparse import ArgumentParser
|
||||
|
||||
import slixmpp
|
||||
import ssl, os, requests, urllib, re
|
||||
|
||||
from jargon import *
|
||||
|
||||
class MUCBot(slixmpp.ClientXMPP):
    """
    A simple Slixmpp bot that explains jargon in a chat room.

    It joins one multi-user chat (MUC) room and, whenever a message from
    another participant mentions a term found in the module-level
    ``defs`` dictionary, posts that term's definition to the room.
    """

    def __init__(self, jid, password, room, nick, output):
        """
        Store the room settings and register the event handlers.

        Arguments:
            jid      -- JID the bot logs in with.
            password -- Password for that JID.
            room     -- MUC room to join.
            nick     -- Nickname the bot uses in the room.
            output   -- Output folder; it is only stored on the instance,
                        none of the methods of this class read it.
        """
        slixmpp.ClientXMPP.__init__(self, jid, password)

        self.room = room
        self.nick = nick
        self.output = output

        # The session_start event will be triggered when
        # the bot establishes its connection with the server
        # and the XML streams are ready for use. We want to
        # listen for this event so that we can initialize
        # our roster.
        self.add_event_handler("session_start", self.start)

        # The groupchat_message event is triggered whenever a message
        # stanza is received from any chat room. If you also
        # register a handler for the 'message' event, MUC messages
        # will be processed by both handlers.
        self.add_event_handler("groupchat_message", self.muc_message)

    def start(self, event):
        """
        Process the session_start event.

        Requests the roster, broadcasts an initial presence stanza and
        joins the configured MUC room under the configured nickname.

        Arguments:
            event -- The session_start event payload (not used).
        """
        self.get_roster()
        self.send_presence()

        # https://xmpp.org/extensions/xep-0045.html
        self.plugin['xep_0045'].join_muc(self.room,
                                         self.nick,
                                         # If a room password is needed, use:
                                         # password=the_room_password,
                                         wait=True)

    @staticmethod
    def _mentions(text, term):
        """
        Return True when ``term`` occurs in ``text`` as a whole word.

        A plain substring test would also fire inside longer words (a
        short term matching the middle of an unrelated word), so the term
        must not be directly preceded or followed by a word character.
        Empty terms never match.
        """
        if not term:
            return False
        pattern = r'(?<!\w)' + re.escape(term) + r'(?!\w)'
        return re.search(pattern, text) is not None

    def muc_message(self, msg):
        """
        Process incoming message stanzas from any chat room. Be aware
        that if you also have any handlers for the 'message' event,
        message stanzas may be processed by both handlers, so check
        the 'type' attribute when using a 'message' event handler.

        For every term of the module-level ``defs`` dictionary that the
        message body mentions as a whole word (case-insensitively), the
        bot prints the entry and sends "<name>: <definition>" to the room
        the message came from.

        IMPORTANT: Always check that a message is not from yourself,
                   otherwise you will create an infinite loop responding
                   to your own messages.

        Arguments:
            msg -- The received message stanza. See the documentation
                   for stanza objects and the Message stanza to see
                   how it may be used.
        """
        # Ignore the bot's own messages, otherwise it would keep
        # answering the definitions it has just posted.
        if msg['mucnick'] == self.nick:
            return

        # Keys of ``defs`` are upper-cased, so normalise the body once.
        body = msg['body'].upper()

        # ``defs`` is the module-level dictionary that this file assigns
        # in its ``__main__`` section before the bot is started.
        for key, entry in defs.items():
            if not self._mentions(body, key):
                continue

            name = entry['name']
            definition = entry['text']
            print(name, definition)

            self.send_message(mto=msg['from'].bare,
                              mbody="{}: {}".format(name, definition),
                              mtype='groupchat')
|
||||
|
||||
|
||||
|
||||
if __name__ == '__main__':
    # Build the command line interface.
    parser = ArgumentParser()

    # Verbosity: -q and -d both write to "loglevel"; INFO when neither is given.
    parser.add_argument("-q", "--quiet", dest="loglevel",
                        action="store_const", const=logging.ERROR,
                        default=logging.INFO, help="set logging to ERROR")
    parser.add_argument("-d", "--debug", dest="loglevel",
                        action="store_const", const=logging.DEBUG,
                        default=logging.INFO, help="set logging to DEBUG")

    # Account and room options.
    # NOTE(review): the JID and password defaults are hard-coded here, and
    # because every option below has a non-None default the interactive
    # prompts further down are never reached -- confirm this is intended.
    parser.add_argument("-j", "--jid", dest="jid",
                        help="JID to use",
                        default="pe@please.undo.undo.it")
    parser.add_argument("-p", "--password", dest="password",
                        help="password to use",
                        default="xpub")
    parser.add_argument("-r", "--room", dest="room",
                        help="MUC room to join",
                        default="xpub@muc.vvvvvvaria.org")
    parser.add_argument("-n", "--nick", dest="nick",
                        help="MUC nickname",
                        default="jargonbot")

    # Output folder option.
    parser.add_argument("-o", "--output", dest="output", type=str,
                        default="./output/",
                        help="output folder, this is where the files are stored")

    args = parser.parse_args()

    # Load the jargon dictionary. It has to stay a module-level name:
    # MUCBot.muc_message looks up ``defs`` as a global.
    url = "https://pad.xpub.nl/p/jargon-file.test/export/txt"
    defs = read_jargon_dictionary(url)

    # Configure logging with the level chosen on the command line.
    logging.basicConfig(format='%(levelname)-8s %(message)s',
                        level=args.loglevel)

    # Ask interactively for any setting that is still missing; the
    # password is read with getpass so it is not echoed.
    for option, ask, label in (
        ("jid", input, "User: "),
        ("password", getpass, "Password: "),
        ("room", input, "MUC room: "),
        ("nick", input, "MUC nickname: "),
        ("output", input, "Output folder: "),
    ):
        if getattr(args, option) is None:
            setattr(args, option, ask(label))

    # Create the bot and register its plugins. Plugins may depend on each
    # other, but the order in which they are registered does not matter.
    xmpp = MUCBot(args.jid, args.password, args.room, args.nick, args.output)
    for plugin in (
        'xep_0030',  # Service Discovery
        'xep_0045',  # Multi-User Chat
        'xep_0199',  # XMPP Ping
        'xep_0066',  # Process URI's (files, images)
    ):
        xmpp.register_plugin(plugin)

    # Connect to the XMPP server and start processing XMPP stanzas.
    xmpp.connect()
    xmpp.process()
|
||||
|
Loading…
Reference in New Issue