2017-09-20 23:25:57 +02:00
|
|
|
#!/usr/bin/env python3
|
2016-11-21 23:04:28 +01:00
|
|
|
# -*- coding: utf-8 -*-
|
2017-09-20 18:26:31 +02:00
|
|
|
import html
|
2016-12-13 21:20:02 +01:00
|
|
|
import logging
|
2016-11-21 23:04:28 +01:00
|
|
|
import re
|
2017-09-20 23:25:57 +02:00
|
|
|
import sys
|
2016-12-13 21:20:02 +01:00
|
|
|
from configparser import ConfigParser
|
2016-12-13 02:15:52 +01:00
|
|
|
from json import loads
|
2016-12-13 21:20:02 +01:00
|
|
|
from urllib.parse import urlparse
|
2016-11-21 23:04:28 +01:00
|
|
|
|
2016-12-13 21:20:02 +01:00
|
|
|
import feedparser
|
|
|
|
import redis
|
2017-09-20 23:25:57 +02:00
|
|
|
import telegram
|
|
|
|
from telegram.ext import CommandHandler, Updater
|
2016-11-21 23:04:28 +01:00
|
|
|
from telegram.ext.dispatcher import run_async
|
|
|
|
|
2017-09-20 23:25:57 +02:00
|
|
|
import utils
|
2016-11-21 23:04:28 +01:00
|
|
|
|
2017-09-20 23:25:57 +02:00
|
|
|
# Logging: configure the root logger once and expose a module-level logger.
_LOG_FORMAT = "%(asctime)s - %(levelname)s: %(message)s"
_LOG_DATE_FORMAT = "%d.%m.%Y %H:%M:%S"

logging.basicConfig(level=logging.INFO, datefmt=_LOG_DATE_FORMAT, format=_LOG_FORMAT)
logger = logging.getLogger(__name__)
|
|
|
|
|
2017-09-20 23:25:57 +02:00
|
|
|
# Bot configuration: read config.ini from the current working directory.
config = ConfigParser()
try:
    # Use a context manager so the file handle is closed after parsing.
    with open('config.ini') as config_file:
        config.read_file(config_file)
except FileNotFoundError:
    logger.critical('Config.ini nicht gefunden')
    sys.exit(1)

# Bot token: must be present and non-empty in the DEFAULT section.
# ConfigParser always provides the DEFAULT section, so a missing key and an
# empty value can be handled by the same check.
bot_token = config['DEFAULT'].get('token')
if not bot_token:
    logger.error('Kein Bot-Token gesetzt, bitte config.ini prüfen')
    sys.exit(1)
|
|
|
|
|
2016-12-13 02:15:52 +01:00
|
|
|
# Admins: the "id" option of the ADMIN section is parsed as JSON and must be
# a non-empty list of integers.
try:
    admins = loads(config["ADMIN"]["id"])
except KeyError:
    logger.error('Keine Admin-IDs gesetzt, bitte config.ini prüfen.')
    sys.exit(1)
except ValueError:
    # json raises a ValueError subclass for malformed input; report it as a
    # configuration error instead of crashing with a traceback.
    logger.error('Admin-IDs sind kein gültiges JSON, bitte config.ini prüfen.')
    sys.exit(1)

if not admins:
    logger.error('Keine Admin-IDs gesetzt, bitte config.ini prüfen.')
    sys.exit(1)

# A bare value such as `123` parses as valid JSON but is not iterable.
if not isinstance(admins, list):
    logger.error('Admin-IDs müssen Integer sein.')
    sys.exit(1)

for admin in admins:
    if not isinstance(admin, int):
        logger.error('Admin-IDs müssen Integer sein.')
        sys.exit(1)
|
2016-12-13 02:15:52 +01:00
|
|
|
|
2017-09-20 23:25:57 +02:00
|
|
|
# Redis: connect via unix socket when "socket_path" is configured, otherwise
# via TCP using host/port (with local defaults).
# A SectionProxy falls back to DEFAULT for missing options, so when the REDIS
# section is absent the DEFAULT proxy yields the same lookups as an empty
# REDIS section would.
redis_conf = config['REDIS'] if config.has_section('REDIS') else config['DEFAULT']
redis_db = redis_conf.get('db', 0)
redis_host = redis_conf.get('host', '127.0.0.1')
redis_port = redis_conf.get('port', 6379)
redis_socket = redis_conf.get('socket_path')

if redis_socket:
    r = redis.Redis(unix_socket_path=redis_socket, db=int(redis_db), decode_responses=True)
else:
    r = redis.Redis(host=redis_host, port=int(redis_port), db=int(redis_db), decode_responses=True)

# ping() raises instead of returning False when the server is unreachable,
# so both outcomes have to be treated as a connection failure.
try:
    redis_alive = r.ping()
except redis.exceptions.RedisError:
    redis_alive = False

if not redis_alive:
    logging.getLogger("Redis").critical("Redis-Verbindungsfehler, config.ini prüfen")
    sys.exit(1)

# Template for every Redis key used by the bot; {0} is a chat id or
# "<feed url>:subs" / "<feed url>:last_entry".
feed_hash = 'pythonbot:rss:{0}'
|
2016-12-13 21:20:02 +01:00
|
|
|
|
|
|
|
|
2017-09-20 23:25:57 +02:00
|
|
|
@run_async
def start(bot, update):
    """Answer the /start command with a short welcome message.

    Nothing is sent when ``utils.can_use_bot(update)`` is falsy
    (presumably an access check; see utils).
    """
    allowed = utils.can_use_bot(update)
    if allowed:
        welcome = '<b>Willkommen beim RSS-Bot!</b>\nSende /help, um zu starten.'
        update.message.reply_text(text=welcome, parse_mode=telegram.ParseMode.HTML)
|
2016-12-13 21:20:02 +01:00
|
|
|
|
|
|
|
|
2016-11-21 23:04:28 +01:00
|
|
|
@run_async
def help_text(bot, update):
    """Answer the /help command with an overview of the available commands.

    Nothing is sent when ``utils.can_use_bot(update)`` is falsy
    (presumably an access check; see utils).
    """
    if utils.can_use_bot(update):
        overview = (
            '<b>/rss</b> <i>[Chat]</i>: Abonnierte Feeds anzeigen\n'
            '<b>/sub</b> <i>Feed-URL</i> <i>[Chat]</i>: Feed abonnieren\n'
            '<b>/del</b> <i>n</i> <i>[Chat]</i>: Feed löschen'
        )
        update.message.reply_text(text=overview, parse_mode=telegram.ParseMode.HTML)
|
|
|
|
|
2016-11-21 23:04:28 +01:00
|
|
|
|
|
|
|
@run_async
def list_feeds(bot, update, args):
    """Answer /rss [Chat] with the feeds subscribed by a chat.

    Args:
        bot: Bot instance used to resolve an explicitly named chat.
        update: Incoming update; the reply is sent to its message.
        args: Command arguments. ``args[0]``, if present, names the chat
            whose subscriptions are listed; otherwise the chat the command
            was sent in is used.
    """
    if not utils.can_use_bot(update):
        return

    chat = update.message.chat
    if args:
        try:
            chat = bot.getChat(args[0])
        except telegram.error.BadRequest:
            update.message.reply_text('❌ Dieser Kanal existiert nicht.')
            return

    chat_id = str(chat.id)
    # Private chats have no title; fall back to the first name and finally to
    # the id so html.escape() never receives None.
    chat_title = chat.title or chat.first_name or chat_id

    subs = r.smembers(feed_hash.format(chat_id))
    if not subs:
        text = '❌ Keine Feeds abonniert.'
    else:
        lines = ['<b>' + html.escape(chat_title) + '</b> hat abonniert:']
        # Feed URLs may contain "&", "<" or ">", which would break Telegram's
        # HTML parsing if sent unescaped.
        lines.extend(
            '<b>' + str(n) + ')</b> ' + html.escape(feed)
            for n, feed in enumerate(subs, start=1)
        )
        text = '\n'.join(lines) + '\n'

    update.message.reply_text(
        text=text,
        parse_mode=telegram.ParseMode.HTML
    )
|
|
|
|
|
2016-11-21 23:04:28 +01:00
|
|
|
|
2017-09-20 23:25:57 +02:00
|
|
|
@run_async
def subscribe(bot, update, args):
    """Handle /sub Feed-URL [Chat]: subscribe a chat to a feed.

    Args:
        bot: Bot instance used for chat lookups and the typing indicator.
        update: Incoming update; replies are sent to its message.
        args: Command arguments. ``args[0]`` is the feed URL; the optional
            ``args[1]`` names a chat to subscribe instead of the current
            one (the bot must be an administrator there).
    """
    if not utils.can_use_bot(update):
        return

    if not args:
        update.message.reply_text('❌ Keine Feed-URL angegeben.')
        return

    feed_url = args[0]
    if not re.match("^http[s]?://(?:[a-zA-Z]|[0-9]|[$-_@.&+]|[!*(),]|(?:%[0-9a-fA-F][0-9a-fA-F]))+$", feed_url):
        update.message.reply_text('❌ Das ist keine URL.')
        return

    # Get Chat ID from name if given
    if len(args) > 1:
        chat_name = args[1]
        try:
            resp = bot.getChat(chat_name)
        except telegram.error.BadRequest:
            update.message.reply_text('❌ Dieser Kanal existiert nicht.')
            return
        chat_id = str(resp.id)
        resp = bot.getChatMember(chat_id, bot.id)
        if resp.status != 'administrator':
            update.message.reply_text('❌ Bot ist kein Administrator in diesem Kanal.')
            return
    else:
        chat_id = str(update.message.chat.id)

    bot.sendChatAction(update.message.chat.id, action=telegram.ChatAction.TYPING)
    data = feedparser.parse(feed_url)
    if 'link' not in data.feed:
        update.message.reply_text('❌ Kein gültiger Feed.')
        return

    # Store the final URL after redirects; keep the given URL if the parser
    # did not report one.
    feed_url = data.get('href', feed_url)
    if r.sismember(feed_hash.format(chat_id), feed_url):
        update.message.reply_text('✅ Dieser Feed wurde bereits abonniert.')
        return

    # The title ends up inside an HTML message, so the URL fallback has to
    # be escaped just like a real title.
    if 'title' not in data.feed:
        feed_title = html.escape(feed_url)
    else:
        feed_title = html.escape(data.feed['title'])

    # Save the last entry in Redis, if it doesn't exist
    if data.entries:
        last_entry_hash = feed_hash.format(feed_url + ':last_entry')
        if not r.exists(last_entry_hash):
            newest = data.entries[0]
            # Prefer the entry id, fall back to its link; skip entries that
            # have neither instead of raising KeyError.
            last_entry = newest['id'] if 'id' in newest else newest.get('link')
            if last_entry is not None:
                r.set(last_entry_hash, last_entry)

    r.sadd(feed_hash.format(feed_url + ':subs'), chat_id)
    r.sadd(feed_hash.format(chat_id), feed_url)
    update.message.reply_text(
        text='✅ <b>' + feed_title + '</b> hinzugefügt!',
        parse_mode=telegram.ParseMode.HTML
    )
|
|
|
|
|
2016-11-21 23:04:28 +01:00
|
|
|
|
2017-09-20 23:25:57 +02:00
|
|
|
@run_async
def unsubscribe(bot, update, args):
    """Handle /del n [Chat]: remove the n-th subscribed feed of a chat.

    Args:
        bot: Bot instance used to resolve an explicitly named chat.
        update: Incoming update; replies are sent to its message.
        args: Command arguments. ``args[0]`` is the 1-based feed number;
            the optional ``args[1]`` names the chat to modify instead of
            the current one.
    """
    if not utils.can_use_bot(update):
        return

    if not args:
        update.message.reply_text('❌ Keine Nummer angegeben.')
        return

    # Get Chat ID from name if given
    if len(args) > 1:
        chat_name = args[1]
        try:
            resp = bot.getChat(chat_name)
        except telegram.error.BadRequest:
            update.message.reply_text('❌ Dieser Kanal existiert nicht.')
            return
        chat_id = str(resp.id)
    else:
        chat_id = str(update.message.chat.id)

    try:
        n = int(args[0])
    except ValueError:
        update.message.reply_text('❌ Keine Nummer angegeben.')
        return

    chat_hash = feed_hash.format(chat_id)
    subs = r.smembers(chat_hash)
    if n < 1:
        update.message.reply_text('❌ Nummer muss größer als 0 sein!')
        return
    elif n > len(subs):
        update.message.reply_text('❌ Feed-ID zu hoch.')
        return

    feed_url = list(subs)[n - 1]
    sub_hash = feed_hash.format(feed_url + ':subs')
    r.srem(chat_hash, feed_url)
    r.srem(sub_hash, chat_id)
    if not r.smembers(sub_hash):  # no one subscribed, remove it
        r.delete(feed_hash.format(feed_url + ':last_entry'))

    # The URL is embedded in an HTML message; escape "&", "<" and ">" so
    # Telegram does not reject the reply.
    update.message.reply_text(
        text='✅ <b>' + html.escape(feed_url) + '</b> entfernt.',
        parse_mode=telegram.ParseMode.HTML
    )
|
2016-11-21 23:04:28 +01:00
|
|
|
|
2016-12-13 21:20:02 +01:00
|
|
|
|
|
|
|
def _send_entry(bot, chat_id, text):
    """Send one formatted feed entry to a chat as HTML without link preview."""
    bot.sendMessage(
        chat_id=chat_id,
        text=text,
        parse_mode=telegram.ParseMode.HTML,
        disable_web_page_preview=True
    )


@run_async
def check_feed(bot, key):
    """Fetch one feed and forward its new entries to all subscribed chats.

    Args:
        bot: Bot instance used to send the messages.
        key: Redis key of the feed's subscriber set, i.e.
            ``feed_hash.format('<feed url>:subs')``.

    Chats that can no longer be reached are unsubscribed, migrated chats
    are moved to their new id, and the stored "last entry" marker is
    advanced once all new entries have been processed.
    """
    feed_url = re.match('^' + feed_hash.format('(.+):subs$'), key).group(1)
    logger.info(feed_url)
    data = feedparser.parse(feed_url)
    if 'link' not in data.feed:
        # "status" is missing when the request itself failed, so read it
        # defensively instead of via attribute access.
        logger.warning('Kein gültiger Feed, Status-Code ' + str(data.get('status', 'unbekannt')))
        return None

    # The feed title is embedded in an HTML message and must be escaped.
    if 'title' not in data.feed:
        feed_title = html.escape(data.feed['link'])
    else:
        feed_title = html.escape(data.feed['title'])

    last_entry_hash = feed_hash.format(feed_url + ':last_entry')
    last_entry = r.get(last_entry_hash)
    # NOTE(review): new_entries is presumably ordered newest-first, since it
    # is iterated in reverse and element 0 becomes the new marker - confirm
    # against utils.get_new_entries.
    new_entries = utils.get_new_entries(data.entries, last_entry)

    for entry in reversed(new_entries):
        if 'title' not in entry:
            post_title = 'Kein Titel'
        else:
            post_title = html.escape(utils.remove_html_tags(entry['title']).strip())

        if 'link' not in entry:
            # The entry has no link of its own; point to the feed's site.
            post_link = data.feed['link']
            link_name = post_link
        else:
            post_link = entry.link
            feedproxy = re.search(r'^https?://feedproxy\.google\.com/~r/(.+?)/.*', post_link)  # feedproxy.google.com
            if feedproxy:
                link_name = feedproxy.group(1)
            else:
                link_name = urlparse(post_link).netloc
                link_name = re.sub(r'^www\d?\.', '', link_name)  # remove www.

        if 'content' in entry:
            content = utils.get_content(entry.content[0]['value'])
        elif 'summary' in entry:
            content = utils.get_content(entry.summary)
        else:
            content = ''

        text = '<b>{post_title}</b>\n<i>{feed_title}</i>\n{content}'.format(
            post_title=post_title,
            feed_title=feed_title,
            content=content
        )
        # Escape the URL (including quotes) and the link label; both come
        # from the feed and are placed into HTML markup.
        text += '\n<a href="{post_link}">Auf {link_name} weiterlesen</a>\n'.format(
            post_link=html.escape(post_link),
            link_name=html.escape(link_name)
        )

        for member in r.smembers(key):
            try:
                _send_entry(bot, member, text)
            except telegram.error.Unauthorized:
                logger.warning('Chat ' + member + ' existiert nicht mehr, wird gelöscht.')
                r.srem(key, member)
                r.delete(feed_hash.format(member))
            except telegram.error.ChatMigrated as new_chat:
                new_chat_id = new_chat.new_chat_id
                logger.info('Chat migriert: ' + member + ' -> ' + str(new_chat_id))
                r.srem(key, member)
                r.sadd(key, new_chat_id)
                # The chat's own feed set may already have been renamed while
                # another feed was processed; renaming a missing key fails.
                old_chat_hash = feed_hash.format(member)
                if r.exists(old_chat_hash):
                    r.rename(old_chat_hash, feed_hash.format(new_chat_id))
                # Retry with the NEW id; the old one would fail again.
                try:
                    _send_entry(bot, new_chat_id, text)
                except telegram.error.TelegramError as err:
                    logger.warning('Senden an ' + str(new_chat_id) + ' fehlgeschlagen: ' + str(err))
            except telegram.error.TimedOut:
                # Best effort: skip this chat for this entry, but leave a trace.
                logger.warning('Zeitüberschreitung beim Senden an ' + member)

    # All subscribers were removed while sending: drop the feed's marker too.
    if not r.exists(key):
        r.delete(last_entry_hash)
        return

    # Set the new last entry if there are any
    if new_entries:
        newest = new_entries[0]
        new_last_entry = newest['id'] if 'id' in newest else newest.get('link')
        if new_last_entry is not None:
            r.set(last_entry_hash, new_last_entry)
|
2016-11-21 23:04:28 +01:00
|
|
|
|
2016-12-13 21:20:02 +01:00
|
|
|
|
2017-09-20 23:25:57 +02:00
|
|
|
@run_async
def run_job(bot, job=None):
    """Check every subscribed feed for new entries.

    This function is registered both as a repeating job and as the handler
    for the /sync command. When called as a command handler the second
    positional argument is the incoming update rather than a job, so the
    same access check the other command handlers perform is applied here.

    Args:
        bot: Bot instance passed on to ``check_feed``.
        job: The job object when run from the job queue, or the update
            when triggered through /sync.
    """
    if isinstance(job, telegram.Update) and not utils.can_use_bot(job):
        return

    logger.info('================================')
    for key in r.keys(feed_hash.format('*:subs')):
        check_feed(bot, key)
|
2016-11-21 23:04:28 +01:00
|
|
|
|
|
|
|
|
2017-09-20 23:25:57 +02:00
|
|
|
# Main function
def main():
    """Log in, register the command handlers and the feed job, then poll.

    Exits with status 1 when Telegram rejects the bot token.
    """
    # Set up the updater and verify the token by requesting the bot's profile.
    updater = Updater(token=bot_token)
    try:
        me = updater.bot.getMe()
    except telegram.error.Unauthorized:
        logger.error('Anmeldung nicht möglich, Bot-Token falsch?')
        sys.exit(1)

    logger.info('Starte ' + me.first_name + ', AKA @' + me.username + ' (' + str(me.id) + ')')

    # Register the command handlers in a fixed order.
    dispatcher = updater.dispatcher
    dispatcher.add_handler(CommandHandler('start', start))
    dispatcher.add_handler(CommandHandler('help', help_text))
    dispatcher.add_handler(CommandHandler('rss', list_feeds, pass_args=True))
    dispatcher.add_handler(CommandHandler('sub', subscribe, pass_args=True))
    dispatcher.add_handler(CommandHandler('del', unsubscribe, pass_args=True))
    dispatcher.add_handler(CommandHandler('sync', run_job))

    # Check all feeds every 60 seconds, starting 2 seconds after launch.
    updater.job_queue.run_repeating(run_job, interval=60.0, first=2.0)

    # Start polling for messages.
    updater.start_polling(
        clean=True,
        bootstrap_retries=-1,
        allowed_updates=["message"]
    )

    # Run the bot until CTRL+C is pressed or a SIGINT,
    # SIGTERM or SIGABRT is sent.
    updater.idle()


if __name__ == '__main__':
    main()
|