#description: telegram bot for monitoring the system
#dependencies: telebot
#usage: python3 lainmonitor.py | or run it as a service
#authors: hornet

import subprocess
import threading
from time import sleep

import telebot

#define the variables ('unknown' is the sentinel for "not collected yet")
status, hostname, uptime, zerotier, prosody, postgres, tailscale, disk, ping = ('unknown',) * 9
nodes, hostnames, reach, threads = [], [], [], []

#change this to your hostname
host = 'lainlounge'

#load the token (context manager so the file handle is closed right away)
with open('.env', 'r') as env_file:
    token = env_file.read().strip()

#bot init
bot = telebot.TeleBot(token)


#run a command without a shell and capture what it prints
def _run(argv):
    """Run ``argv`` (a list, no shell) and return its stripped stdout.

    The exit status is deliberately ignored: ``systemctl status`` and ``ping``
    exit non-zero for stopped units / unreachable hosts while still printing
    the text this module parses. Returns '' when the program cannot be
    started at all (e.g. the binary is missing).
    """
    try:
        #subprocess.run waits for the child and closes the pipe, so no
        #unreaped processes or open descriptors are left behind
        completed = subprocess.run(argv, stdout=subprocess.PIPE, check=False)
    except OSError:
        return ''
    return completed.stdout.decode(errors='replace').strip()


#systemd-only: extract the 'Active' line(s) of a unit's status
def _service_state(unit):
    """Return the lines of ``sudo systemctl status <unit>`` that contain 'Active'.

    Falls back to 'unknown' when there is no such line (nothing printed on
    stdout, or no 'Active' line in the output).
    """
    output = _run(['sudo', 'systemctl', 'status', unit])
    active_lines = [line for line in output.splitlines() if 'Active' in line]
    return '\n'.join(active_lines).strip() or 'unknown'


#get system info
def getinfo():
    """Refresh the module-level system information and return it.

    Updates the globals ``status``, ``hostname``, ``uptime``, ``zerotier``,
    ``prosody``, ``postgres``, ``tailscale`` and ``disk``. A value that cannot
    be collected is left as 'unknown' instead of raising, and ``status`` is
    'offline' exactly when the hostname could not be determined.

    Returns:
        tuple: (hostname, uptime, zerotier, prosody, postgres, tailscale, disk)
    """
    global status, hostname, uptime, zerotier, prosody, postgres, tailscale, disk
    hostname = _run(['hostname']) or 'unknown'
    uptime = _run(['uptime', '-p']) or 'unknown'
    #systemd-only services
    zerotier = _service_state('zerotier-one')
    prosody = _service_state('prosody')
    postgres = _service_state('postgresql')
    tailscale = _service_state('tailscaled')
    disk = _run(['df', '-h']) or 'unknown'
    status = 'offline' if hostname == 'unknown' else 'online'
    return hostname, uptime, zerotier, prosody, postgres, tailscale, disk


#function to ping tailscale nodes
def ping_node(node, hostname):
    """Send one ping to ``node`` and append the verdict to the global ``reach``.

    Args:
        node: address passed to ``ping``.
        hostname: label used next to the address in the result line.

    The node counts as reachable when ping's '1 packets ...' summary line
    contains '1 received'.
    """
    #argv list instead of a shell string: node is never interpreted by a shell
    output = _run(['ping', '-c', '1', node])
    summary = [line for line in output.splitlines() if '1 packets' in line]
    verdict = 'reachable' if any('1 received' in line for line in summary) else 'unreachable'
    reach.append(f'{node}/{hostname} is {verdict}')
#run a command without a shell and capture what it prints
def _capture(argv):
    """Run ``argv`` (a list, no shell) and return its stripped stdout.

    The exit status is ignored because ``systemctl status`` exits non-zero
    for stopped units while still printing the text parsed here. Returns ''
    when the program cannot be started at all.
    """
    try:
        #subprocess.run waits for the child and closes the pipe
        completed = subprocess.run(argv, stdout=subprocess.PIPE, check=False)
    except OSError:
        return ''
    return completed.stdout.decode(errors='replace').strip()


#ping tailscale nodes
def check_tailscale():
    """Ping every peer listed by ``tailscale status`` in parallel.

    Only lines containing '100' are considered (presumably the peers'
    100.x tailnet addresses); the first two whitespace-separated fields of
    each such line are used as address and hostname. Lines with fewer than
    two fields are skipped instead of raising IndexError.

    Rebinds the globals ``nodes``, ``hostnames`` and ``threads``. Each worker
    runs ``ping_node``, which records its result in the global ``reach``.

    Returns:
        list: the global ``reach`` list.
    """
    global nodes, hostnames, threads
    status_lines = _capture(['tailscale', 'status']).splitlines()
    rows = (line.split() for line in status_lines if '100' in line)
    peers = [fields for fields in rows if len(fields) >= 2]
    nodes = [fields[0] for fields in peers]
    hostnames = [fields[1] for fields in peers]
    #start from an empty list on every call so finished threads from earlier
    #calls do not accumulate
    threads = []
    for node, hostname in zip(nodes, hostnames):
        thread = threading.Thread(target=ping_node, args=(node, hostname))
        threads.append(thread)
        thread.start()
    for thread in threads:
        thread.join()
    return reach


#restart services
def restart_service(service):
    """Restart a systemd unit and report its state afterwards.

    Args:
        service: unit name passed to ``sudo systemctl restart``.

    Returns:
        str: '<service> restarted! status: <Active line(s) of systemctl status>'
    """
    #argv lists: the service name is never interpreted by a shell
    _capture(['sudo', 'systemctl', 'restart', service])
    #give the unit a moment to settle before asking for its state
    sleep(3)
    status_output = _capture(['sudo', 'systemctl', 'status', service])
    service_status = '\n'.join(
        line for line in status_output.splitlines() if 'Active' in line
    ).strip()
    message = f'{service} restarted! status: {service_status}'
    return message


#restart services menu
def restart_menu():
    """Build the reply keyboard offering the restartable services.

    Returns:
        telebot.types.ReplyKeyboardMarkup: one button per service name.
    """
    keyboard = telebot.types.ReplyKeyboardMarkup(resize_keyboard=True)
    #KeyboardButton has no callback_data parameter (that belongs to inline
    #buttons); a reply-keyboard button just sends its label as a text message
    #NOTE(review): no handler for these labels is visible in this file, so
    #pressing a button restarts nothing until one is added
    service_names = ('zerotier-one', 'prosody', 'postgresql', 'tailscaled')
    keyboard.add(*(telebot.types.KeyboardButton(name) for name in service_names))
    return keyboard


def reboot():
    """Reboot the machine via ``sudo reboot``."""
    _capture(['sudo', 'reboot'])


#debug handler
def check():
    """Refresh the system information, print it to stdout and return it.

    Returns:
        tuple: (status, hostname, uptime, zerotier, prosody, postgres,
        tailscale, disk) as set by ``getinfo``.
    """
    getinfo()
    #the globals are only read here, so no ``global`` statement is needed
    print('system status:', status)
    print('hostname:', hostname)
    print('uptime:', uptime)
    print('zerotier:', zerotier)
    print('prosody:', prosody)
    print('postgres:', postgres)
    print('tailscale:', tailscale)
    print('disk:', disk)
    return status, hostname, uptime, zerotier, prosody, postgres, tailscale, disk

#message handling
@bot.message_handler(commands=['start', 'help', 'status', 'restart', 'reboot', 'ping'])
def handle(message):
    """Dispatch the bot commands.

    /start and /help reply with static text, /status reports the values
    collected by ``check``, /ping reports tailscale peer reachability.
    ``/restart <host>`` and ``/reboot <hostname>`` only act when the argument
    names this machine; otherwise they are ignored without a reply.

    Args:
        message: the incoming telebot message; ``message.text`` holds the
            command line.
    """
    #split into command and arguments; drop an optional '@botname' suffix so
    #'/status@somebot' is treated like '/status'
    parts = message.text.split()
    command = parts[0].split('@')[0]
    args = parts[1:]

    if command == '/start':
        bot.reply_to(message, 'lainmonitor v1.0 --- standing by...')
    elif command == '/help':
        bot.reply_to(message, 'commands: /start, /help, /status, /restart <host>, /reboot <host>, /ping')
    elif command == '/status':
        check()
        status_message = f'hostname: {hostname}\nsystem status: {status}\nuptime: {uptime}\nzerotier: {zerotier}\nprosody: {prosody}\npostgres: {postgres}\ntailscale: {tailscale}'
        bot.reply_to(message, status_message)
        bot.reply_to(message, f'filesystem info for {hostname}: \n\n{disk}')
    elif command in ('/restart', '/reboot'):
        #hostname is still the 'unknown' placeholder until the system info has
        #been collected once; refresh it so the comparison below uses the
        #real hostname rather than the placeholder
        if hostname == 'unknown':
            getinfo()
        if command == '/restart':
            if args == [host] and host == hostname:
                bot.send_message(message.chat.id, 'select a service to restart:', reply_markup=restart_menu())
            #otherwise stay silent: the command does not target this machine
        elif args == [hostname] and hostname != 'unknown':
            #never act on the placeholder: '/reboot unknown' must not reboot
            bot.reply_to(message, f'rebooting {host}...')
            reboot()
    elif command == '/ping':
        try:
            check_tailscale()
            ping_status = '\n'.join(reach)
            bot.reply_to(message, f'ping status:\n\n{ping_status}')
        finally:
            #always empty the shared result list, even if sending the reply
            #failed, so stale entries do not leak into the next /ping
            reach.clear()


#polling
bot.polling()