spamcheck/spamcheck.py

465 líneas
12 KiB
Python
Original Vista normal Històric

from datetime import date, datetime, timedelta
2022-08-15 16:55:31 +02:00
#from mastodon import Mastodon
2021-07-21 14:46:27 +02:00
import time
import os
import json
import sys
import os.path
import operator
import psycopg2
2022-08-15 16:55:31 +02:00
from psycopg2 import sql
from psycopg2.extensions import ISOLATION_LEVEL_AUTOCOMMIT
2021-07-21 14:46:27 +02:00
2022-08-15 16:55:31 +02:00
class Spamcheck:
    """Record recently approved Mastodon sign-ups and their daily totals.

    Connection settings are read from ``config/config.txt``.  When that
    file does not exist an interactive setup asks for them, writes the file
    and, if the spamcheck database cannot be reached, creates it together
    with its tables.

    All database errors are printed and swallowed: every public method is
    best-effort and returns whatever it managed to collect.
    """

    name = "Spamcheck for Mastodon social servers"

    def __init__(self, mastodon_hostname=None, mastodon_db=None,
                 mastodon_db_user=None, spamcheck_db=None,
                 spamcheck_db_user=None):
        """Load the configuration, running the first-time setup if needed.

        The keyword arguments are accepted for backward compatibility but
        are not read: the values always come from the config file or from
        the interactive prompts.
        """
        self.config_file = 'config/config.txt'

        if self.__check_setup():
            self.mastodon_hostname = self.__get_parameter("mastodon_hostname", self.config_file)
            self.mastodon_db = self.__get_parameter("mastodon_db", self.config_file)
            self.mastodon_db_user = self.__get_parameter("mastodon_db_user", self.config_file)
            self.spamcheck_db = self.__get_parameter("spamcheck_db", self.config_file)
            self.spamcheck_db_user = self.__get_parameter("spamcheck_db_user", self.config_file)
        else:
            (self.mastodon_hostname, self.mastodon_db, self.mastodon_db_user,
             self.spamcheck_db, self.spamcheck_db_user) = self.__setup()

            # NOTE(review): the nesting here was reconstructed from a
            # flattened listing -- confirm the database check belongs to the
            # first-run branch only.
            if not self.__check_dbsetup():
                self.__createdb()

    @staticmethod
    def __connect(database, user):
        """Open a connection to *database* as *user* via the local socket."""
        return psycopg2.connect(database=database, user=user, password="",
                                host="/var/run/postgresql", port="5432")

    def new_registers(self, created_at_lst=None, id_lst=None, email_lst=None, ip_lst=None):
        """Fetch the approved users created during the last seven days.

        Each optional list, when given, is appended to in place; otherwise a
        fresh list is created for this call (the defaults are ``None``
        rather than ``[]`` so results never leak between calls).

        Returns:
            A tuple ``(created_at_lst, id_lst, email_lst, ip_lst)`` of
            parallel lists.  On a database error the error is printed and
            the lists are returned as filled so far.
        """
        created_at_lst = [] if created_at_lst is None else created_at_lst
        id_lst = [] if id_lst is None else id_lst
        email_lst = [] if email_lst is None else email_lst
        ip_lst = [] if ip_lst is None else ip_lst

        conn = None
        try:
            conn = self.__connect(self.mastodon_db, self.mastodon_db_user)
            cur = conn.cursor()
            cur.execute("select users.created_at, users.id, users.email, users.sign_up_ip from users where users.approved and users.created_at > now() - interval '7 days'")
            for created_at, user_id, email, ip in cur.fetchall():
                created_at_lst.append(created_at)
                id_lst.append(user_id)
                email_lst.append(email)
                ip_lst.append(ip)
            cur.close()
        except (Exception, psycopg2.DatabaseError) as error:
            print(error)
        finally:
            if conn is not None:
                conn.close()

        return (created_at_lst, id_lst, email_lst, ip_lst)

    def save_registers(self, created_at_lst, id_lst, email_lst, ip_lst):
        """Insert the given sign-ups into the ``spamcheck`` table.

        The four lists are parallel.  Rows already present are skipped by
        ``ON CONFLICT DO NOTHING``.  Each row is written in its own
        connection so that one failing row does not prevent the others from
        being stored; every row is printed after its attempt.
        """
        insert_sql = 'INSERT INTO spamcheck(created_at, id, email, ip, tor_exit_node) VALUES(%s,%s,%s,%s,%s) ON CONFLICT DO NOTHING'

        for created_at, user_id, email, ip in zip(created_at_lst, id_lst, email_lst, ip_lst):
            tor_exit_node = self.__check_ip(ip)

            conn = None
            try:
                conn = self.__connect(self.spamcheck_db, self.spamcheck_db_user)
                cur = conn.cursor()
                cur.execute(insert_sql, (created_at, user_id, email, ip, tor_exit_node))
                conn.commit()
                cur.close()
            except (Exception, psycopg2.DatabaseError) as error:
                print(error)
            finally:
                if conn is not None:
                    conn.close()

            print(created_at, user_id, email, ip, tor_exit_node)

    def get_totals(self):
        """Return the number of stored sign-ups per day.

        Returns:
            A tuple ``(dates, counts)`` of parallel lists ordered by date.
            Both lists are empty when nothing is stored or the query fails.
        """
        spamcheck_datetime_lst = []
        spamcheck_registers_lst = []
        select_sql = 'select date(created_at), count(ip) as registers from spamcheck group by date(created_at) order by date(created_at)'

        conn = None
        try:
            conn = self.__connect(self.spamcheck_db, self.spamcheck_db_user)
            cur = conn.cursor()
            cur.execute(select_sql)
            for day, registers in cur.fetchall():
                spamcheck_datetime_lst.append(day)
                spamcheck_registers_lst.append(registers)
            cur.close()
        except (Exception, psycopg2.DatabaseError) as error:
            print(error)
        finally:
            if conn is not None:
                conn.close()

        return (spamcheck_datetime_lst, spamcheck_registers_lst)

    def write_totals(self, spamcheck_datetime_lst, spamcheck_registers_lst):
        """Upsert one ``totals`` row per day between the first and last date.

        Days inside the range that have no sign-ups are written with a
        count of 0.  When the last date is yesterday, a 0 row for today is
        written as well.  Nothing is done for empty input.

        The day range is walked independently of the database calls, so a
        failing connection can no longer keep the loop from terminating.
        """
        if not spamcheck_datetime_lst:
            return

        counts = dict(zip(spamcheck_datetime_lst, spamcheck_registers_lst))
        first_date = min(spamcheck_datetime_lst)
        last_date = max(spamcheck_datetime_lst)

        rows = []
        day = first_date
        while day <= last_date:
            rows.append((day, counts.get(day, 0)))
            day += timedelta(days=1)

        today = date.today()
        if today == last_date + timedelta(days=1):
            rows.append((today, 0))

        upsert_sql = 'INSERT INTO totals(datetime, registers) VALUES(%s,%s) ON CONFLICT (datetime) DO UPDATE SET (datetime, registers) = (EXCLUDED.datetime, EXCLUDED.registers)'

        conn = None
        try:
            conn = self.__connect(self.spamcheck_db, self.spamcheck_db_user)
            cur = conn.cursor()
            for row in rows:
                cur.execute(upsert_sql, row)
            conn.commit()
            cur.close()
        except (Exception, psycopg2.DatabaseError) as error:
            print(error)
        finally:
            if conn is not None:
                conn.close()

    def check_approval(self, user_id):
        """Return the ``approved`` value of the Mastodon user *user_id*.

        Returns ``False`` when the user does not exist or the lookup fails
        (the error is printed).
        """
        approved = False

        conn = None
        try:
            conn = self.__connect(self.mastodon_db, self.mastodon_db_user)
            cur = conn.cursor()
            cur.execute("select approved from users where id = (%s)", (user_id,))
            row = cur.fetchone()
            if row is not None:
                approved = row[0]
            cur.close()
        except (Exception, psycopg2.DatabaseError) as error:
            print(error)
        finally:
            if conn is not None:
                conn.close()

        return approved

    def __check_ip(self, ip):
        """Return ``'t'`` if *ip* is listed in ``torexit_ips``, else ``'f'``.

        A missing IP (``None``) and a failed lookup both yield ``'f'``.
        """
        is_tor_exit_node = 'f'

        if ip is None:
            return is_tor_exit_node

        conn = None
        try:
            conn = self.__connect(self.spamcheck_db, self.spamcheck_db_user)
            cur = conn.cursor()
            cur.execute('select ip from torexit_ips where ip=(%s)', (ip,))
            if cur.fetchone() is not None:
                is_tor_exit_node = 't'
            cur.close()
        except (Exception, psycopg2.DatabaseError) as error:
            print(error)
        finally:
            if conn is not None:
                conn.close()

        return is_tor_exit_node

    def __check_setup(self):
        """Return True if the config file exists; announce setup otherwise."""
        if os.path.isfile(self.config_file):
            return True

        print(f"File {self.config_file} not found, running setup.\n")
        return False

    def __setup(self):
        """Ask for the settings interactively and append them to the config file.

        Returns:
            ``(mastodon_hostname, mastodon_db, mastodon_db_user,
            spamcheck_db, spamcheck_db_user)`` as entered.
        """
        if not os.path.exists('config'):
            os.makedirs('config')

        self.mastodon_hostname = input("Mastodon hostname, in ex. 'mastodon.social': ")
        self.mastodon_db = input("Mastodon's database name: ")
        self.mastodon_db_user = input("Mastodon's database user: ")
        self.spamcheck_db = input("Spamcheck's database name: ")
        self.spamcheck_db_user = input("Spamcheck's database user: ")

        if not os.path.exists(self.config_file):
            with open(self.config_file, 'w'):
                pass
            print(f"\n{self.config_file} created!\n")

        with open(self.config_file, 'a') as the_file:
            print(f"Writing Mastodon hostname parameter to {self.config_file}")
            the_file.write(f'mastodon_hostname: {self.mastodon_hostname}\n')
            the_file.write(f'mastodon_db: {self.mastodon_db}\n')
            the_file.write(f'mastodon_db_user: {self.mastodon_db_user}\n')
            the_file.write(f'spamcheck_db: {self.spamcheck_db}\n')
            the_file.write(f'spamcheck_db_user: {self.spamcheck_db_user}\n')

        return (self.mastodon_hostname, self.mastodon_db, self.mastodon_db_user, self.spamcheck_db, self.spamcheck_db_user)

    def __check_dbsetup(self):
        """Return True if a connection to the spamcheck database succeeds."""
        dbsetup = False

        conn = None
        try:
            conn = self.__connect(self.spamcheck_db, self.spamcheck_db_user)
            dbsetup = True
        except (Exception, psycopg2.DatabaseError) as error:
            print(error)
        finally:
            # The connection is only a probe; do not leave it open.
            if conn is not None:
                conn.close()

        return dbsetup

    def __createdb(self):
        """Create the spamcheck database and then its tables."""
        conn = None
        try:
            conn = psycopg2.connect(dbname='postgres',
                                    user=self.spamcheck_db_user, host='',
                                    password='')
            # CREATE DATABASE cannot run inside a transaction block.
            conn.set_isolation_level(ISOLATION_LEVEL_AUTOCOMMIT)

            cur = conn.cursor()
            print(f"Creating database {self.spamcheck_db}. Please wait...")
            cur.execute(sql.SQL("CREATE DATABASE {}").format(
                sql.Identifier(self.spamcheck_db))
            )
            print(f"Database {self.spamcheck_db} created!\n")

            self.__dbtables_schemes()
        except (Exception, psycopg2.DatabaseError) as error:
            print(error)
        finally:
            if conn is not None:
                conn.close()

    def __dbtables_schemes(self):
        """Create the ``spamcheck``, ``torexit_ips`` and ``totals`` tables."""
        schemes = (
            ("spamcheck", "(created_at timestamptz, id bigint PRIMARY KEY, email varchar(200), ip inet, tor_exit_node boolean)"),
            ("torexit_ips", "(created_at timestamptz, ip inet PRIMARY KEY)"),
            ("totals", "(datetime timestamptz PRIMARY KEY, registers int)"),
        )
        for table, columns in schemes:
            self.__create_table(table, "create table " + table + " " + columns)

    def __create_table(self, table, create_sql):
        """Run *create_sql* in the spamcheck database to create *table*."""
        conn = None
        try:
            conn = self.__connect(self.spamcheck_db, self.spamcheck_db_user)
            cur = conn.cursor()

            print(f"Creating table {table}")
            cur.execute(create_sql)

            conn.commit()
            print(f"Table {table} created!\n")
        except (Exception, psycopg2.DatabaseError) as error:
            print(error)
        finally:
            if conn is not None:
                conn.close()

    @staticmethod
    def __get_parameter(parameter, file_path):
        """Return the value stored as ``parameter: value`` in *file_path*.

        The key is matched together with its colon, so a parameter whose
        name is a prefix of another (``mastodon_db`` / ``mastodon_db_user``)
        is never confused with it, whatever the order of the lines.

        Prints a message and exits the process (status 0, as before) when
        the parameter is not present.
        """
        prefix = parameter + ":"

        with open(file_path) as f:
            for line in f:
                if line.startswith(prefix):
                    return line[len(prefix):].strip()

        print(f'{file_path} Missing parameter {parameter}')
        sys.exit(0)
2022-01-16 14:33:44 +01:00
2022-08-15 16:55:31 +02:00
###############################################################################
# main
if __name__ == '__main__':
    spamcheck = Spamcheck()

    # Copy the recently approved sign-ups from Mastodon into the spamcheck table.
    registers = spamcheck.new_registers()
    spamcheck.save_registers(*registers)

    # Recompute the per-day totals from the stored sign-ups and persist them.
    totals = spamcheck.get_totals()
    spamcheck.write_totals(*totals)