Skip to content
Home

Collection of `python` script for automating tasks

Part 1 video

Get Youtube subscribers count

pip install requests bs4
import re
import requests
from bs4 import BeautifulSoup
url = "https://www.youtube.com/@SanthoshBalajiRamesh"
# Headers with Accept-Language set to en-US
headers = {
"Accept-Language": "en-US,en;q=0.9"
}
soup = BeautifulSoup(requests.get(url, headers=headers).content, "html.parser")
# print(soup.prettify())
# Use regex to find the number
match = re.search(r'"content":\s*"\b([\d.]+[MK]?)\b\s*subscribers"', soup.prettify())
if match:
subscriber_count = match.group(1)
print("Subscriber Count:", subscriber_count)
else:
print("Subscriber count not found!")

Extract all images from the website

pip install requests bs4
import shutil
import requests
from pathlib import Path
from bs4 import BeautifulSoup
from urllib.parse import urljoin
# Function to get the safe URL from an img tag's src
def get_safe_url(src, base_url):
if src.startswith("/"):
return urljoin(base_url, src)
elif not src.startswith(("http://", "https://")):
return f"https://{src}"
return src
# Fetch the webpage content
base_url = "https://santhosh2r2.github.io"
url = base_url +"/youtube/blog/vagrant-migration"
#base_url = "https://google.de"
#url = base_url +"/"
# Destination folder
destination_folder = Path("img")
if destination_folder.exists():
shutil.rmtree(destination_folder)
destination_folder.mkdir(parents=True, exist_ok=True)
response = requests.get(url)
soup = BeautifulSoup(response.content, "html.parser")
# Iterate over all img tags and download images
for i, img in enumerate(soup.find_all("img")):
img_src = img.get("src")
# Ignoring "src" which starts with "data",
# incase of svg or base64 encoded string
if not img_src.startswith("data"):
safe_url = get_safe_url(img_src, base_url)
img_data = requests.get(safe_url).content
filename = Path(img_src).name
with open(destination_folder / filename, 'wb') as file:
file.write(img_data)
print(img_src)
print("Images downloaded successfully.")

Convert Images to PDF

pip install Pillow
from PIL import Image
import os
def images_to_pdf(image_folder, output_pdf):
image_list = []
for file_name in os.listdir(image_folder):
if file_name.endswith((".png", ".jpg", ".jpeg", "gif", "webp")):
print(file_name)
image_path = os.path.join(image_folder, file_name)
image = Image.open(image_path).convert('RGB')
image_list.append(image)
if image_list:
image_list[0].save(output_pdf, save_all=True, append_images=image_list[1:])
print(f"PDF created: {output_pdf}")
else:
print("No images found.")
images_to_pdf("img", "output.pdf")

Part 2 video

Clipboard logger

# pip install pyperclip
import pyperclip
import time
def log_clipboard():
previous = ""
while True:
current = pyperclip.paste()
if current != previous:
with open("output\clipboard_log.txt", "a") as log:
log.write(f"{current}\n")
previous = current
time.sleep(1)
log_clipboard()

Break Reminder

# pip install plyer
import time
from plyer import notification
def break_notifier():
while True:
notification.notify(
title="Self-Reminder: BREAK TIME",
message="Stand up, strech and save your back.",
timeout=2
)
time.sleep(5)
break_notifier()

Unseen E-Mails

import imaplib
import os
from dotenv import load_dotenv
load_dotenv()
gmail_user = os.getenv("GMAIL_USER")
gmail_password = os.getenv("GMAIL_PASSWORD")
def unseen_emails():
mail = imaplib.IMAP4_SSL("imap.gmail.com")
mail.login(gmail_user, gmail_password)
mail.select("inbox")
result, data = mail.search(None, 'UNSEEN')
emails = data[0].split()
print(f"You have {len(emails)} unread emails.")
unseen_emails()

Find space

import shutil
def check_disk_usage(folder):
total, used, free = shutil.disk_usage(folder)
print(f"Folder: {folder}, Free Space: {free // (2**30)} GB")
check_disk_usage("C:")

Screenshot generator

# pip install pillow pyautogui
import pyautogui
import time
def take_screenshots():
while True:
screenshot = pyautogui.screenshot()
screenshot.save(f'output\\screenshots\\primary_monitor_{time.time()}.png')
print("Screenshot saved.")
time.sleep(5) # Every 5 seconds
take_screenshots()

Part 3 video

Send WhatsApp message

# Importing the Required Library
import pywhatkit
# Defining the Phone Number and Message
phone_number = "" # Enter the phone number
message = "Hi, this is a test message!"
# Sending the message via whatsapp message
pywhatkit.sendwhatmsg(
phone_number,
message,
time_hour=datetime.datetime.now().hour,
time_min=datetime.datetime.now().minute + 1,
wait_time=10,
tab_close=False
)
# Sending the image via whatsapp message
pywhatkit.sendwhats_image(phone_number,"image.png", message,
wait_time=10, tab_close=True)
# Displaying a Success Message
print("WhatsApp message sent!")

DNS Lookup

import dns.resolver # pip install dnspython
from termcolor import colored # pip install termcolor
def check_dns_records(domain):
record_types = ['A', 'AAAA', 'MX', 'CNAME', 'TXT', 'NS', 'SOA']
resolver = dns.resolver.Resolver()
results = {}
for record_type in record_types:
try:
answer = resolver.resolve(domain, record_type)
results[record_type] = [str(rdata) for rdata in answer]
except (dns.resolver.NoAnswer, dns.resolver.NXDOMAIN, dns.resolver.NoNameservers):
results[record_type] = []
except Exception as e:
results[record_type] = str(e)
return results
def display_results(domain, results):
print("\n" + colored(f"DNS Records for {domain}", "cyan", attrs=["bold"]))
print("=" * (len(f"DNS Records for {domain}") + 2))
if 'error' in results:
print(colored(f"Error: {results['error']}", "red"))
return
record_titles = {
"A": "IPv4 Addresses",
"AAAA": "IPv6 Addresses",
"MX": "Mail Exchanger",
"CNAME": "Canonical Name",
"TXT": "Text Records",
"NS": "Name Servers",
"SOA": "Start of Authority"
}
for record_type, record_data in results.items():
print(f"\n{colored(record_titles.get(record_type, record_type), 'yellow', attrs=['bold'])}:")
if record_data:
for record in record_data:
print(f" - {colored(record, 'green')}")
else:
print(colored(" Not found", "red"))
print("\n" + "=" * 40)
if __name__ == "__main__":
domain = input("Enter domain to check DNS records: ").strip()
results = check_dns_records(domain)
display_results(domain, results)

Task Reminder

import tkinter as tk
from tkinter import ttk
import csv
import time
import threading
from datetime import datetime, timedelta
from win10toast import ToastNotifier
reminders = [] # List to store all reminders
def check_reminders():
while True:
current_time = datetime.now()
for reminder in reminders[:]:
if current_time >= reminder["remind_time"]:
show_custom_notification(reminder["task_name"], reminder["description"])
reminders.remove(reminder)
time.sleep(10)
threading.Thread(target=check_reminders, daemon=True).start()
def show_custom_notification(task_name, description):
toaster = ToastNotifier()
toaster.show_toast(
title=f"Reminder: {task_name}",
msg=f"Description: {description}",
icon_path="icon.ico",
duration=10,
threaded=True
)
def set_reminder():
task_name = task_name_entry.get()
description = description_entry.get("1.0", tk.END).strip()
time_minutes = float(time_entry.get())
remind_time = datetime.now() + timedelta(minutes=time_minutes)
print(f'''
Task Name: {task_name}\n
Task Description: {description} \n
Remind Time: {remind_time}\n''')
print('Task added! I will remind you when the time comes.')
reminders.append({
"task_name": task_name,
"description": description,
"remind_time": remind_time
})
with open('reminders.csv', 'a', newline='') as file:
writer = csv.writer(file)
writer.writerow([task_name, description, remind_time])
clear_form_fields()
def clear_form_fields():
task_name_entry.delete(0, tk.END)
description_entry.delete("1.0", tk.END)
time_entry.delete(0, tk.END)
def create_gui():
global task_name_entry, description_entry, time_entry
root = tk.Tk()
root.title("Task Reminder")
root.geometry("500x400")
root.configure(bg="#ebebeb")
title_frame = tk.Frame(root, bg="#1f6abf", pady=10)
title_frame.pack(fill="x")
title_label = tk.Label(title_frame, text="Task Reminder", font=("Arial", 16, "bold"), fg="white", bg="#1f6abf")
title_label.pack()
form_frame = ttk.Frame(root, padding="20 20 20 10")
form_frame.pack(fill="both", expand=True, padx=20, pady=20)
ttk.Label(form_frame, text="Task Name:", font=("Arial", 10)).grid(row=0, column=0, sticky=tk.W, pady=5)
task_name_entry = ttk.Entry(form_frame, width=40, font=("Arial", 10))
task_name_entry.grid(row=0, column=1, padx=5, pady=5)
ttk.Label(form_frame, text="Description:", font=("Arial", 10)).grid(row=1, column=0, sticky=tk.W, pady=5)
description_entry = tk.Text(form_frame, width=40, height=4, font=("Arial", 10))
description_entry.grid(row=1, column=1, padx=5, pady=5)
ttk.Label(form_frame, text="Time to Remind (minutes):", font=("Arial", 10)).grid(row=2, column=0, sticky=tk.W, pady=5)
time_entry = ttk.Entry(form_frame, width=40, font=("Arial", 10))
time_entry.grid(row=2, column=1, padx=5, pady=5)
button_frame = tk.Frame(root, bg="#ebebeb")
button_frame.pack(pady=10)
set_button = tk.Button(button_frame, text="Set Reminder", command=set_reminder, font=("Arial", 10, "bold"), bg="#1f6abf", fg="white", width=15)
set_button.pack(side="left", padx=10)
add_button = tk.Button(button_frame, text="Clear", command=clear_form_fields, font=("Arial", 10, "bold"), bg="#dadada", fg="black", width=15)
add_button.pack(side="left", padx=10)
root.mainloop()
if __name__ == "__main__":
create_gui()

Part 4 video

Archive older files

def archive_older_files(folder, days=30):
import os
import shutil
from datetime import datetime, timedelta
def clean_downloads(folder_path, days):
# Create Archive folder if it doesn't exist
archive_folder = os.path.join(folder_path, "Archive")
if not os.path.exists(archive_folder):
os.makedirs(archive_folder)
# Calculate the threshold date
now = datetime.now()
threshold = now - timedelta(days=days)
# Iterate over files in the folder
for filename in os.listdir(folder_path):
file_path = os.path.join(folder_path, filename)
# Check if it's a file and not a directory
if os.path.isfile(file_path):
# Get the last modified time of the file
file_mtime = datetime.fromtimestamp(os.path.getmtime(file_path))
# Move the file to Archive if it's older than the threshold
if file_mtime < threshold:
shutil.move(file_path, os.path.join(archive_folder, filename))
clean_downloads(folder, days)
archive_older_files(r"path\to\folder", 30)

Organize folder

def organize_folder(folder):
import os
import shutil
def organize_files(folder_path):
# Iterate over files in the folder
for filename in os.listdir(folder_path):
# Get the file extension
ext = filename.split('.')[-1]
# Create a folder for the extension if it doesn't exist
ext_folder = os.path.join(folder_path, ext.upper())
os.makedirs(ext_folder, exist_ok=True)
# Move the file to the extension folder
shutil.move(os.path.join(folder_path, filename), os.path.join(ext_folder, filename))
organize_files(folder)
organize_folder(r"path\to\folder")

Merge PDF files

def merge_pdf_files(folder_path):
# pip install PyPDF2
from PyPDF2 import PdfMerger
import os
def get_pdf_files(folder):
return [os.path.join(folder_path, f) for f in os.listdir(folder) if f.endswith('.pdf')]
def merge_pdfs(pdf_list, output):
merger = PdfMerger()
for pdf in pdf_list:
merger.append(pdf)
merger.write(output)
merger.close()
#folder_path = r"C:\Users\Santhosh Balaji R\Downloads\PDF"
pdf_files = get_pdf_files(folder_path)
print(pdf_files)
merge_pdfs(pdf_files, r'output\merged.pdf')
merge_pdf_files(r"path\to\folder")

Convert CSV files to Excel files

def batch_convert_csv_to_excel(folder):
# pip install pandas openpyxl
import os
import pandas as pd
def csv_to_excel_folder(folder_path):
for filename in os.listdir(folder_path):
if filename.endswith('.csv'):
csv_file = os.path.join(folder_path, filename)
excel_file = os.path.join(folder_path, filename.replace('.csv', '.xlsx'))
try:
df = pd.read_csv(csv_file)
df.to_excel(excel_file, index=False)
print(f"Converted: {csv_file} -> {excel_file}")
except Exception as e:
print(f"Failed to convert {csv_file}: {e}")
csv_to_excel_folder(folder)
batch_convert_csv_to_excel(r"path\to\folder")

Rename multiple files at once

def batch_rename_files(folder, name):
import os
def rename_files(folder_path, prefix):
for count, filename in enumerate(os.listdir(folder_path)):
ext = filename.split('.')[-1]
new_name = f"{prefix}_{count}.{ext}"
os.rename(os.path.join(folder_path, filename), os.path.join(folder_path, new_name))
rename_files(folder, name)
batch_rename_files(r"path\to\folder", "Document")

Part 5 video

Email inbox cleaner

def email_inbox_cleaner():
import imaplib
# Connect to the email server
mail = imaplib.IMAP4_SSL('imap.gmail.com')
mail.login('username', 'password')
# Select the inbox
mail.select('inbox')
# Search for emails with "unsubscribe" in the subject
status, messages = mail.search(None, 'SUBJECT "outlook"')
# Mark emails for deletion
for num in messages[0].split():
mail.store(num, '+FLAGS', '\\Deleted')
print(num)
print(mail)
# Permanently delete marked emails
mail.expunge()
mail.logout()
email_inbox_cleaner()

Summarize expenses

def summarize_expenses():
import pandas as pd
# Load the bank statement
# Ensure your bank statement CSV has 'Description' and 'Amount' columns
data = pd.read_csv(r'bank_statement.csv', sep=",")
# Categorize expenses based on keywords in the description
def categorize(description):
if 'restaurant' in description.lower():
return 'Food'
elif 'uber' in description.lower() or 'taxi' in description.lower():
return 'Transport'
elif 'amazon' in description.lower():
return 'Shopping'
else:
return 'Other'
data['Category'] = data['Description'].apply(categorize)
# Summarize expenses by category
summary = data.groupby('Category')['Amount'].sum()
print(summary)
summarize_expenses()

Password generator

def generate_password(length=15):
import random
import string
# Define reusable character pools
LETTERS = string.ascii_letters # a-z, A-Z
DIGITS = string.digits # 0-9
SPECIAL_CHARACTERS = "!@#$%^&*()-_=+[]{}|;:',.<>?/`~"
# Combine pools to create the character set
characters = LETTERS + DIGITS + SPECIAL_CHARACTERS
# Randomly choose characters to form the password
return ''.join(random.choice(characters) for _ in range(length))
print(generate_password())