telegram-moderator/bot.py

396 lines
14 KiB
Python
Raw Normal View History

2018-01-28 18:29:58 -05:00
# -*- coding: utf-8 -*-
"""Group Chat Logger

This bot is a modified version of the echo2 bot found here:
https://github.com/python-telegram-bot/python-telegram-bot/blob/master/examples/echobot2.py

This bot logs all messages sent in a Telegram Group to a database.
"""
2018-01-30 18:01:31 -05:00
from __future__ import print_function
import sys
2018-01-28 18:29:58 -05:00
from telegram.ext import Updater, CommandHandler, MessageHandler, Filters
import os
2018-02-09 20:13:09 -05:00
from model import User, Message, MessageHide, UserBan, session
2018-01-30 18:01:31 -05:00
from time import strftime
2018-02-01 16:54:27 -05:00
import re
2018-02-01 18:04:18 -05:00
import unidecode
2018-02-22 18:38:02 -05:00
from mwt import MWT
2020-01-27 21:24:25 -05:00
from googletrans import Translator
2020-01-27 23:26:26 -05:00
from textblob import TextBlob
2018-01-28 18:29:58 -05:00
2018-02-01 21:35:56 -05:00
class TelegramMonitorBot:
2018-02-01 16:54:27 -05:00
2018-02-09 20:24:09 -05:00
2018-02-01 21:35:56 -05:00
def __init__(self):
    """Load the bot configuration from environment variables.

    Variables read:
        DEBUG, ADMIN_EXEMPT: flags; on when set to anything other than
            "false" (case-insensitive).
        NOTIFY_CHAT: optional chat to notify of violations,
            e.g. '@channelname'.
        CHAT_IDS: optional comma-separated integer chat ids to monitor.
        MESSAGE_BAN_PATTERNS, MESSAGE_HIDE_PATTERNS, NAME_BAN_PATTERNS:
            optional regexes, compiled with re.IGNORECASE | re.VERBOSE.
            An unset or empty value disables the corresponding check.
        TELEGRAM_BOT_POSTGRES_URL, TELEGRAM_BOT_TOKEN: only reported as
            set/unset in the debug output of this method.
    """
    def env_flag(name):
        # A flag is on when the variable exists and is not "false"
        value = os.environ.get(name)
        return value is not None and value.lower() != "false"

    def compile_patterns(raw):
        # No pattern means "check disabled", represented as None
        if not raw:
            return None
        return re.compile(raw, re.IGNORECASE | re.VERBOSE)

    def presence(name):
        # Credentials are reported as set/unset so they never reach the logs
        return "<set>" if os.environ.get(name) else "<undefined>"

    self.debug = env_flag('DEBUG')
    # Are admins exempt from having messages checked?
    self.admin_exempt = env_flag('ADMIN_EXEMPT')

    # Channel to notify of violations, e.g. '@channelname'
    self.notify_chat = os.environ.get('NOTIFY_CHAT')

    # List of chat ids that bot should monitor (blank entries are ignored)
    self.chat_ids = [
        int(chat_id)
        for chat_id in os.environ.get('CHAT_IDS', '').split(',')
        if chat_id.strip()]

    # Regex for message patterns that cause user ban
    self.message_ban_patterns = os.environ.get('MESSAGE_BAN_PATTERNS')
    self.message_ban_re = compile_patterns(self.message_ban_patterns)

    # Regex for message patterns that cause message to be hidden
    self.message_hide_patterns = os.environ.get('MESSAGE_HIDE_PATTERNS')
    self.message_hide_re = compile_patterns(self.message_hide_patterns)

    # Regex for name patterns that cause user to be banned
    self.name_ban_patterns = os.environ.get('NAME_BAN_PATTERNS')
    self.name_ban_re = compile_patterns(self.name_ban_patterns)

    if self.debug:
        print("🔵 debug:", self.debug)
        print("🔵 admin_exempt:", self.admin_exempt)
        print("🔵 TELEGRAM_BOT_POSTGRES_URL:", presence("TELEGRAM_BOT_POSTGRES_URL"))
        print("🔵 TELEGRAM_BOT_TOKEN:", presence("TELEGRAM_BOT_TOKEN"))
        print("🔵 NOTIFY_CHAT:", self.notify_chat if self.notify_chat is not None else "<undefined>")
        print("🔵 MESSAGE_BAN_PATTERNS:\n", self.message_ban_patterns)
        print("🔵 MESSAGE_HIDE_PATTERNS:\n", self.message_hide_patterns)
        print("🔵 NAME_BAN_PATTERNS:\n", self.name_ban_patterns)
2018-02-01 23:02:19 -05:00
2018-02-22 18:38:02 -05:00
@MWT(timeout=60*60)
def get_admin_ids(self, bot, chat_id):
    """ Collect the user ids of the administrators of ``chat_id``.

    The list is built from ``bot.get_chat_administrators(chat_id)``. The
    ``MWT`` decorator (timeout of 60*60) is expected to cache the result
    for one hour.
    """
    admin_ids = []
    for member in bot.get_chat_administrators(chat_id):
        admin_ids.append(member.user.id)
    return admin_ids
2018-02-01 23:02:19 -05:00
def ban_user(self, update):
    """ Ban the sender of ``update.message`` from the chat it was posted in.

    Returns:
        Whatever ``chat.kick_member`` returns for the sender's id, so that
        callers can tell whether the kick succeeded.
    """
    message = update.message
    return message.chat.kick_member(message.from_user.id)
2018-02-01 23:02:19 -05:00
2018-02-01 23:29:58 -05:00
2018-02-01 22:11:15 -05:00
def security_check_username(self, bot, update):
    """ Test the sender's full name and username for security violations.

    The full name is checked first, then the username. On the first match
    the user is banned, the ban is recorded in the database and, when a
    notify chat is configured, reported there. Nothing happens when no
    name pattern is configured.
    """
    if not self.name_ban_re:
        return
    user = update.message.from_user
    # Leave out missing name parts so an absent last name is not
    # checked (and logged) as the literal text "None"
    full_name = " ".join(
        part for part in (user.first_name, user.last_name) if part)
    candidates = (
        ("FULL NAME", full_name),
        ("USERNAME", user.username or ''),
    )
    for label, value in candidates:
        if not self.name_ban_re.search(value):
            continue
        # Logging
        log_message = "❌ 🙅‍♂️ BAN MATCH {}: {}".format(label, value)
        if self.debug:
            update.message.reply_text(log_message)
        print(log_message)
        # Ban the user
        self.ban_user(update)
        # Log in database; a database failure must not prevent the notification
        try:
            s = session()
            try:
                s.add(UserBan(user_id=user.id, reason=log_message))
                s.commit()
            finally:
                s.close()
        except Exception as e:
            print("Error: {}".format(e))
        # Notify channel (only when one is configured)
        if self.notify_chat:
            bot.sendMessage(chat_id=self.notify_chat, text=log_message)
        # The user is banned; a second match would only duplicate the ban
        return
2018-02-01 18:04:18 -05:00
2018-02-09 20:13:09 -05:00
2018-02-01 21:35:56 -05:00
def security_check_message(self, bot, update):
    """ Test message for security violations.

    Messages without text are ignored. Otherwise:
      * a forwarded message is deleted and recorded as hidden;
      * text matching the ban patterns gets the message deleted, the sender
        banned and the ban recorded;
      * otherwise, text matching the hide patterns gets the message deleted
        and recorded as hidden.
    Each action is printed, recorded in the database and, when a notify
    chat is configured, reported there.
    """
    message = update.message
    if not message.text:
        return

    def announce(text, reply):
        # Debug mode echoes the decision into the chat itself
        if self.debug and reply:
            message.reply_text(text)
        print(text)

    def record(make_row):
        # Database logging is best effort: a failure is printed and must
        # not stop the moderation action or the notification
        try:
            s = session()
            try:
                s.add(make_row())
                s.commit()
            finally:
                s.close()
        except Exception as e:
            print("Error: {}".format(e))

    def notify(text):
        # The notify chat is optional
        if self.notify_chat:
            bot.sendMessage(chat_id=self.notify_chat, text=text)

    # Remove accents from letters (é->e, ñ->n, etc...)
    normalized = unidecode.unidecode(message.text)
    # TODO: Replace lookalike unicode characters:
    # https://github.com/wanderingstan/Confusables

    # Tracks whether the message is already deleted, so it is deleted only once
    hidden = False

    # Hide forwarded messages
    if message.forward_date is not None:
        log_message = "❌ HIDE FORWARDED: {}".format(message.text)
        announce(log_message, reply=True)
        message.delete()
        hidden = True
        record(lambda: MessageHide(
            user_id=message.from_user.id, message=message.text))
        notify(log_message)

    if self.message_ban_re and self.message_ban_re.search(normalized):
        log_message = "❌ 🙅‍♂️ BAN MATCH: {}".format(message.text)
        announce(log_message, reply=not hidden)
        # Any message that causes a ban gets deleted (unless already gone)
        if not hidden:
            message.delete()
        # Ban the user
        self.ban_user(update)
        record(lambda: UserBan(
            user_id=message.from_user.id, reason=message.text))
        notify(log_message)
    elif (not hidden and self.message_hide_re and
            self.message_hide_re.search(normalized)):
        log_message = "❌ 🙈 HIDE MATCH: {}".format(message.text)
        announce(log_message, reply=True)
        # Delete the message
        message.delete()
        record(lambda: MessageHide(
            user_id=message.from_user.id, message=message.text))
        notify(log_message)
2018-01-28 18:29:58 -05:00
2018-10-18 20:30:28 -04:00
def attachment_check(self, bot, update):
    """ Hide messages with attachments (except photo or video).

    A message carrying audio, a document, a game or a voice note is
    deleted, recorded as hidden in the database and, when a notify chat is
    configured, reported there. Other messages are left untouched.
    """
    message = update.message
    if not (message.audio or message.document or
            message.game or message.voice):
        return
    # Logging
    if message.document:
        log_message = "❌ HIDE DOCUMENT: {}".format(message.document.__dict__)
    else:
        log_message = "❌ HIDE NON-DOCUMENT ATTACHMENT"
    if self.debug:
        message.reply_text(log_message)
    print(log_message)
    # Delete the message
    message.delete()
    # Log in database; a database failure must not prevent the notification
    try:
        s = session()
        try:
            s.add(MessageHide(
                user_id=message.from_user.id, message=message.text))
            s.commit()
        finally:
            s.close()
    except Exception as e:
        print("Error: {}".format(e))
    # Notify channel (only when one is configured)
    if self.notify_chat:
        bot.sendMessage(chat_id=self.notify_chat, text=log_message)
2018-02-01 21:35:56 -05:00
def logger(self, bot, update):
    """ Primary Logger. Handles incoming bot messages and saves them to DB.

    For a message from a monitored chat: the sender is added to the
    database if unknown, the message is stored, a line is printed, and the
    attachment, username and message security checks are run (skipped for
    admins when admin exemption is on). Exceptions are printed, never
    raised.
    """
    try:
        message = update.message
        if message is None or message.from_user is None:
            # Nothing to log or check without a message and its sender
            return
        user = message.from_user
        # Limit bot to monitoring certain chats
        if message.chat_id not in self.chat_ids:
            print("Message from user {} is from chat_id not being monitored: {}".format(
                user.id,
                message.chat_id)
            )
            return

        if self.id_exists(user.id):
            self.log_message(user.id, message.text, message.chat_id)
        elif self.add_user(
                user.id, user.first_name, user.last_name, user.username):
            self.log_message(user.id, message.text, message.chat_id)
            print("User added: {}".format(user.id))
        else:
            print("Something went wrong adding the user {}".format(user.id), file=sys.stderr)

        # Prefer the username, then whatever name parts exist
        full_name = " ".join(
            part for part in (user.first_name, user.last_name) if part)
        user_name = user.username or full_name or "<none>"
        timestamp = strftime("%Y-%m-%dT%H:%M:%S")
        if message.text:
            print("{} {} ({}) : {}".format(
                timestamp, user.id, user_name, message.text))
        else:
            print("{} {} ({}) : non-message".format(
                timestamp, user.id, user_name))

        # Don't check admin activity (admin list only fetched when relevant)
        if self.admin_exempt and user.id in self.get_admin_ids(bot, message.chat_id):
            print("👮‍♂️ Skipping checks. User is admin: {}".format(user.id))
        else:
            # Security checks
            if self.debug:
                print(update)
            self.attachment_check(bot, update)
            self.security_check_username(bot, update)
            self.security_check_message(bot, update)

    except Exception as e:
        print("Error: {}".format(e))
        print('Error on line {}'.format(sys.exc_info()[-1].tb_lineno), type(e).__name__, e)
2018-02-01 21:35:56 -05:00
# DB queries
def id_exists(self, id_value):
    """ Return True when a ``User`` row with id ``id_value`` exists.

    The session opened for the lookup is always closed, even when the
    query raises.
    """
    s = session()
    try:
        matches = s.query(User.id).filter_by(id=id_value)
        return any(row for row in matches)
    finally:
        s.close()
2018-01-28 18:29:58 -05:00
2020-01-24 20:51:34 -05:00
def log_message(self, user_id, user_message, chat_id):
    """ Store a message together with its English translation and sentiment.

    Translation and sentiment analysis are best effort: when they fail, or
    when there is no text, the message is stored with an empty language
    code and translation and 0.0 polarity and subjectivity. Errors are
    printed, never raised.
    """
    language_code = english_message = ""
    polarity = subjectivity = 0.0
    if user_message:
        try:
            # translate to English & log the original language
            translated = Translator().translate(user_message)
            language_code = translated.src
            english_message = translated.text
            # run basic sentiment analysis on the translated English string
            analysis = TextBlob(english_message)
            polarity = analysis.sentiment.polarity
            subjectivity = analysis.sentiment.subjectivity
        except Exception as e:
            # Print the exception itself: exceptions have no `.message`
            # attribute on Python 3
            print("Error: {}".format(e))
    try:
        s = session()
        try:
            s.add(Message(
                user_id=user_id, message=user_message, chat_id=chat_id,
                language_code=language_code, english_message=english_message,
                polarity=polarity, subjectivity=subjectivity))
            s.commit()
        finally:
            s.close()
    except Exception as e:
        print("Error: {}".format(e))
2018-02-01 21:35:56 -05:00
def add_user(self, user_id, first_name, last_name, username):
    """ Insert a new ``User`` row.

    Returns:
        The result of ``self.id_exists(user_id)`` after the insert, or
        False when anything goes wrong (the error is printed).
    """
    try:
        s = session()
        try:
            s.add(User(
                id=user_id,
                first_name=first_name,
                last_name=last_name,
                username=username))
            s.commit()
        finally:
            # Release the session whether or not the commit succeeded
            s.close()
        return self.id_exists(user_id)
    except Exception as e:
        print("Error: {}".format(e))
        return False
2018-02-01 21:35:56 -05:00
def error(self, bot, update, error):
    """ Report on stderr an error raised while handling ``update``. """
    report = "Update '{}' caused error '{}'".format(update, error)
    print(report, file=sys.stderr)
2018-01-28 18:29:58 -05:00
2018-02-01 21:35:56 -05:00
def start(self):
    """ Start the bot: register the handlers, poll, and block until stopped. """
    def on_message(bot, update):
        # Every incoming message goes through the logger
        return self.logger(bot, update)

    def on_error(bot, update, error):
        # Errors raised while handling updates are reported by self.error
        return self.error(bot, update, error)

    # The updater is created from the bot token found in the environment
    bot_token = os.environ["TELEGRAM_BOT_TOKEN"]
    updater = Updater(bot_token)

    # Handlers are registered on the updater's dispatcher
    dispatcher = updater.dispatcher
    message_handler = MessageHandler(Filters.all, on_message)
    dispatcher.add_handler(message_handler)
    # dp.add_handler(MessageHandler(Filters.status_update, status))
    dispatcher.add_error_handler(on_error)

    # start_polling() is non-blocking ...
    updater.start_polling()

    print("Bot started. Montitoring chats: {}".format(self.chat_ids))

    # ... so idle() keeps the bot running until Ctrl-C or until the process
    # receives SIGINT, SIGTERM or SIGABRT, then stops it gracefully.
    updater.idle()
2018-01-28 18:29:58 -05:00
if __name__ == '__main__':
    # Build the bot from the environment and run it until it is stopped
    monitor_bot = TelegramMonitorBot()
    monitor_bot.start()