Building a Python Voice-Controlled Personal Assistant

Anshu Singh

Published Nov 18, 2023

Introduction

In this article, I'll walk you through the creation of a simple yet powerful Python-based voice-controlled personal assistant. The assistant comes equipped with various functionalities, including notepad opening, web browsing, sending emails and messages, geolocation mapping, and more. It demonstrates how Python can be used to integrate with different APIs and services to create a versatile and interactive application.

import os
import webbrowser
import smtplib
import pyttsx3
import geocoder
import tweepy
from bs4 import BeautifulSoup
import requests
import pywhatkit as kit
import time
import pyautogui
import speech_recognition as sr
import wikipediaapi
from email.mime.multipart import MIMEMultipart
from email.mime.text import MIMEText
from twilio.rest import Client
from playsound import playsound
import pygame
import tweepy
from geopy.geocoders import Nominatim
import folium

def notepad():
    """Launch the Notepad application through the system shell."""
    command = "notepad.exe"
    os.system(command)

def open_chrome():
    """Open the Google homepage in a new browser tab.

    The page is opened with the ``webbrowser`` module; ``new=2`` requests
    a new tab where the browser supports it.
    """
    homepage = "http://www.google.com"
    webbrowser.open(homepage, new=2)


def send_email():
    """Prompt for a recipient, subject and body, then send a plain-text email.

    The message is sent through Gmail's SMTP server over STARTTLS using the
    sender credentials configured below. Any failure is reported on stdout
    instead of being raised, so the caller's menu loop keeps running.
    """
    recipient = input("Recipient email:")
    subject = input("Subject:")
    body = input("Body:")

    smtp_server = 'smtp.gmail.com'
    smtp_port = 587
    # Placeholder credentials: replace with a real account before use.
    sender_email = 'sendermail@gmail.com'
    sender_password = 'password_here'

    try:
        msg = MIMEMultipart()
        msg['From'] = sender_email
        msg['To'] = recipient
        msg['Subject'] = subject
        msg.attach(MIMEText(body, 'plain'))

        # The context manager issues QUIT and closes the socket even when
        # starttls/login/sendmail raises, so the connection is never leaked.
        with smtplib.SMTP(smtp_server, smtp_port) as server:
            server.starttls()
            server.login(sender_email, sender_password)
            server.sendmail(sender_email, recipient, msg.as_string())
        print("Mail sent!")

    except Exception as e:
        # Deliberately broad: this is a best-effort, user-facing action.
        print(f"Error sending message: {str(e)}")
    

def send_message(opt):
    """Send a text message over WhatsApp or SMS.

    Args:
        opt: ``"whats"`` to send through WhatsApp (pywhatkit) or ``"sms"``
            to send through Twilio. Any other value is rejected with a
            printed notice before the user is prompted for anything.

    The recipient and message are read from stdin. Failures while sending
    are printed rather than raised.
    """
    # Validate the channel first so the user is not asked for input that
    # would then be silently discarded.
    if opt not in ("whats", "sms"):
        print(f"Unsupported message type: {opt!r}")
        return

    recipient = input("Recipient (with country code): ")
    message = input("Message:")

    if opt == "whats":
        try:
            kit.sendwhatmsg_instantly(recipient, message)
            # Presumably gives WhatsApp Web time to load before the
            # simulated Enter key submits the message -- TODO confirm.
            time.sleep(20)
            pyautogui.press("enter")
            print("Message Sent!")
        except Exception as e:
            print(f"Error sending message: {str(e)}")
        return

    # opt == "sms"
    # Placeholder Twilio credentials: replace before use.
    account_sid = 'account_sid'
    auth_token = 'account_token'
    twilio_phone_number = 'twilio_phone_number'

    try:
        client = Client(account_sid, auth_token)
        # The API response is not needed; do not rebind ``message`` to it.
        client.messages.create(
            from_=twilio_phone_number,
            body=message,
            to=recipient
        )
        print("Message sent!")
    except Exception as e:
        print(f"Error sending message: {str(e)}")


def chat_with_gpt():
    """Open the ChatGPT web page with the ``webbrowser`` module."""
    webbrowser.open("https://chat.openai.com/")

def get_geolocation():
    """Print the current location and save a map of it as HTML.

    The position is resolved with ``geocoder.ip('me')`` (an IP-based
    lookup, not GPS). On success the coordinates are printed and a folium
    map with a single marker is written to ``current_location_map.html``.
    """
    here = geocoder.ip('me')

    # Guard clause: nothing to draw when the lookup produced no result.
    if not here:
        print("Unable to determine current location.")
        return

    latitude, longitude = here.latlng
    # Fall back to the raw coordinates when no address is available.
    location_name = here.address or f"{latitude}, {longitude}"
    print(f"Current Location: {location_name}, Latitude: {latitude}, Longitude: {longitude}")

    # Map centred on the resolved coordinates, with one marker on them.
    map_location = folium.Map(location=[latitude, longitude], zoom_start=10)
    marker = folium.Marker([latitude, longitude], tooltip=location_name)
    marker.add_to(map_location)

    # The map is written to disk; it is not opened automatically.
    map_location.save("current_location_map.html")
    
    

def get_twitter_trending(woe_id=1):
    """Print the topics currently trending on Twitter for a location.

    Args:
        woe_id: Where-On-Earth ID of the location to query. The default
            of 1 is the worldwide feed.

    API errors reported by Tweepy are printed rather than raised.
    """
    # Placeholder credentials: replace with real API keys before use.
    consumer_key = 'CONSUMER_KEY'
    consumer_secret = 'CONSUMER_SECRET'
    access_token = 'ACCESS_TOKEN'
    access_token_secret = 'ACCESS_TOKEN_SECRET'

    # Tweepy 4 replaced TweepError with TweepyException and renamed
    # API.trends_place to API.get_place_trends. Resolve whichever name the
    # installed version provides so the function works on both.
    tweepy_error = getattr(tweepy, "TweepyException", None) or tweepy.TweepError

    auth = tweepy.OAuthHandler(consumer_key, consumer_secret)
    auth.set_access_token(access_token, access_token_secret)

    api = tweepy.API(auth, wait_on_rate_limit=True)
    fetch_trends = getattr(api, "get_place_trends", None) or api.trends_place
    try:
        trends = fetch_trends(woe_id)
        trending_topics = trends[0]['trends']

        print("Current trending topics:")
        for index, topic in enumerate(trending_topics, start=1):
            print(f"{index}. {topic['name']}")

    except tweepy_error as e:
        print(f"Error: {e}")

def get_hashtag_posts(count=10):
    """Prompt for a hashtag and print English tweets that mention it.

    Args:
        count: Maximum number of tweets to fetch and print.

    API errors reported by Tweepy are printed rather than raised.
    """
    # Placeholder credentials: replace with real API keys before use.
    consumer_key = 'YOUR_CONSUMER_KEY'
    consumer_secret = 'YOUR_CONSUMER_SECRET'
    access_token = 'YOUR_ACCESS_TOKEN'
    access_token_secret = 'YOUR_ACCESS_TOKEN_SECRET'

    # Tweepy 4 replaced TweepError with TweepyException and renamed
    # API.search to API.search_tweets. Resolve whichever name the installed
    # version provides so the function works on both.
    tweepy_error = getattr(tweepy, "TweepyException", None) or tweepy.TweepError

    auth = tweepy.OAuthHandler(consumer_key, consumer_secret)
    auth.set_access_token(access_token, access_token_secret)

    api = tweepy.API(auth, wait_on_rate_limit=True)
    search = getattr(api, "search_tweets", None) or api.search

    # Accept both "python" and "#python"; the '#' is added back below.
    hashtag = input("Hashtag to search: ").strip().lstrip("#")
    try:
        # The cursor is lazy: requests are made while iterating, so the
        # loop must stay inside the try block.
        tweets = tweepy.Cursor(search, q=f"#{hashtag}", lang="en").items(count)

        print(f"Top {count} posts for #{hashtag}:\n")
        for index, tweet in enumerate(tweets, start=1):
            print(f"{index}. {tweet.text}\n")

    except tweepy_error as e:
        print(f"Error: {e}")

def get_wikipedia_data(lang='en'):
    """Prompt for a topic and print the matching Wikipedia article.

    Args:
        lang: Language code of the Wikipedia edition to query
            (default ``'en'``).

    Prints the page title and full text, or a notice when the page does
    not exist.
    """
    # Honour the ``lang`` argument; it was previously ignored in favour of
    # a hard-coded 'en'.
    # NOTE(review): newer Wikipedia-API releases appear to expect a
    # user-agent argument as well -- confirm against the installed version.
    wiki_wiki = wikipediaapi.Wikipedia(lang)
    topic = input("Topic to search: ")

    page = wiki_wiki.page(topic)
    if page.exists():
        print("Title:", page.title)
        print("Content:")
        print(page.text)
    else:
        print(f"The page '{topic}' does not exist on Wikipedia.")

def play_audio():
    """Play the configured audio file, printing any playback error."""
    # Placeholder path: point this at a real audio file before use.
    audio_file = "path/to/your/audio/file.mp3"
    try:
        playsound(audio_file)
    except Exception as err:
        print(f"Error: {err}")

def play_video():
    """Play the configured video file full-screen using pygame.

    Playback runs until the video finishes or a QUIT event arrives. Any
    error is printed rather than raised, and pygame is always shut down
    before returning.
    """
    # Placeholder path: point this at a real video file before use.
    file_path = "path/to/your/video/file.mp4"

    # Initialise pygame once (the original initialised it twice).
    pygame.init()

    try:
        # Size the full-screen window to the current display resolution.
        display_info = pygame.display.Info()
        screen = pygame.display.set_mode(
            (display_info.current_w, display_info.current_h),
            pygame.FULLSCREEN,
        )

        # Presumably the mixer is shut down so the movie can use the audio
        # device itself -- TODO confirm against the pygame.movie docs.
        pygame.mixer.quit()
        pygame.display.set_caption("Video Player")
        pygame.mouse.set_visible(False)

        # NOTE(review): pygame.movie does not appear to be available in
        # pygame 2.x; if it is missing, the AttributeError is caught below
        # and reported -- confirm the installed pygame version.
        video = pygame.movie.Movie(file_path)
        video_screen = pygame.Surface(video.get_size()).convert()

        # The movie renders into an off-screen surface that is blitted to
        # the window on every frame.
        video.set_display(video_screen)
        video.play()

        clock = pygame.time.Clock()

        playing = True
        while playing:
            for event in pygame.event.get():
                if event.type == pygame.QUIT:
                    playing = False

            screen.blit(video_screen, (0, 0))
            pygame.display.flip()
            clock.tick(60)

            # Stop once the movie has finished playing.
            if not video.get_busy():
                playing = False

    except Exception as e:
        print(f"Error: {e}")
    finally:
        # Always release the display, even on KeyboardInterrupt.
        pygame.quit()

def speak_text():
    """Prompt for a line of text and speak it aloud with pyttsx3."""
    phrase = input("Enter the text to speak: ")
    tts = pyttsx3.init()
    tts.say(phrase)
    # Blocks until the queued phrase has been spoken.
    tts.runAndWait()

def speech_to_text():
    """Record speech from the microphone and print its transcription.

    The audio is transcribed with ``recognize_google``. Unintelligible
    audio and request failures are reported on stdout.
    """
    listener = sr.Recognizer()

    with sr.Microphone() as mic:
        print("Say something:")
        captured = listener.listen(mic)

    try:
        transcript = listener.recognize_google(captured)
    except sr.UnknownValueError:
        print("Could not understand audio")
    except sr.RequestError as err:
        print("Error with the request to Google API; {0}".format(err))
    else:
        print("You said:", transcript)
        
def adjust_volume(text):
    """Raise or lower the system volume based on a spoken command.

    Args:
        text: Transcribed speech. If it contains "increase volume" or
            "decrease volume" (in any letter case), the matching media
            key is pressed once; otherwise nothing happens.
    """
    # Transcripts may be capitalised (e.g. "Increase volume"), so match
    # case-insensitively.
    command = text.lower()

    if "increase volume" in command:
        pyautogui.press("volumeup")
        print("Volume increased")
    elif "decrease volume" in command:
        pyautogui.press("volumedown")
        print("Volume decreased")

def control_volume():
    """Listen for a spoken volume command and apply it.

    Waits up to 5 seconds for speech to start, transcribes it with
    ``recognize_google`` and passes the transcript to ``adjust_volume``.
    A timeout, unintelligible audio, or a request failure is printed
    rather than raised.
    """
    recognizer = sr.Recognizer()

    with sr.Microphone() as source:
        print("Say something...")
        recognizer.adjust_for_ambient_noise(source)
        try:
            audio = recognizer.listen(source, timeout=5)
        except sr.WaitTimeoutError:
            # listen() raises when no speech starts within the timeout;
            # unhandled, this would crash the caller's menu loop.
            print("No speech detected within 5 seconds")
            return

    # Recognition is a network call; run it after the microphone has been
    # released.
    try:
        text = recognizer.recognize_google(audio)
    except sr.UnknownValueError:
        print("Speech Recognition could not understand audio")
    except sr.RequestError as e:
        print(f"Could not request results from Google Speech Recognition service; {e}")
    else:
        print("You said:", text)
        adjust_volume(text)


# Menu text, printed verbatim at the start of every iteration.
_MENU_LINES = (
    "\n**** Menu ****",
    "1. Notepad",
    "2. Chrome",
    "3. WhatsApp",
    "4. Email",
    "5. SMS",
    "6. ChatGPT",
    "7. Geolocation",
    "8. Twitter Trending",
    "9. Hashtag Posts",
    "10. Wikipedia Search",
    "11. Audio Player",
    "12. Video Player",
    "13. Text-to-Speech",
    "14. Speech-to-Text",
    "15. Control volume",
    "0. Exit",
)

# Maps each menu choice to the zero-argument action it triggers.
_MENU_ACTIONS = {
    '1': notepad,
    '2': open_chrome,
    '3': lambda: send_message("whats"),
    '4': send_email,
    '5': lambda: send_message("sms"),
    '6': chat_with_gpt,
    '7': get_geolocation,
    '8': get_twitter_trending,
    '9': get_hashtag_posts,
    '10': get_wikipedia_data,
    '11': play_audio,
    '12': play_video,
    '13': speak_text,
    '14': speech_to_text,
    '15': control_volume,
}

# Interactive loop: show the menu, run the chosen action, repeat until
# the user enters 0.
while True:
    for _line in _MENU_LINES:
        print(_line)

    choice = input("Enter your choice: ")

    if choice == '0':
        break

    _action = _MENU_ACTIONS.get(choice)
    if _action is None:
        print("Invalid choice. Please try again.")
    else:
        _action()

notepad(): Opens the Notepad application using the os.system("notepad.exe") command.
open_chrome(): Opens the Google homepage in a new tab of the system's default web browser (Chrome, if it is the default) using the webbrowser.open("http://www.google.com", new=2) command.
send_email(): Sends an email using the SMTP protocol. The user is prompted to enter the recipient's email address, subject, and body of the email. It uses the smtplib library to interact with the SMTP server.
send_message(opt): Sends a message either through WhatsApp (opt == 'whats') or SMS (opt == 'sms'). The user is prompted to enter the recipient's phone number and the message. It uses the pywhatkit library for WhatsApp and the Twilio API for SMS.
chat_with_gpt(): Opens a web browser and navigates to the OpenAI ChatGPT platform for interactive conversations.
get_geolocation(): Retrieves the current geolocation based on the user's IP address using the geocoder library. It also generates a map using folium centered around the current coordinates and saves it as current_location_map.html.
get_twitter_trending(woe_id=1): Fetches and prints the current trending topics on Twitter for a specified location (default World: woe_id=1). It uses the tweepy library to interact with the Twitter API.
get_hashtag_posts(count=10): Retrieves and prints up to count posts for a specified hashtag on Twitter. The user is prompted to enter the hashtag, and it uses the tweepy library.
get_wikipedia_data(lang='en'): Fetches and prints content from Wikipedia on a specified topic. The user is prompted to enter the topic, and it uses the wikipediaapi library.
play_audio():

Plays an audio file specified by the file path using the playsound library.

play_video():

Plays a video file specified by the file path using the pygame library.

speak_text():

Converts text entered by the user into speech using the pyttsx3 library.

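speech_to_text():

Records speech from the microphone and converts it to text with Google's speech recognition service, using the speech_recognition library.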

Building a Python Voice-Controlled Personal Assistant

Anshu Singh

Introduction

Recommended by LinkedIn

Conclusion

More articles by Anshu Singh

Others also viewed

Self Build Voice Assistant !

Can the new ChatGPT competitor "Claude" - help you with coding questions?

Python Web Scraping Tips for Dynamic Element Extraction in Two Ways!

Introduction to the OpenAI API with Python

Easy multilingual Speech to Text in Python, using Google APIs

Will AI Replace Junior Developers? I Asked Experts at Pycon US

ChatGPT and Python to the Rescue: The Lazy Person's Guide to Summarizing Lengthy Texts

ChatBot in Python

Python fundamentals (Part 1): Learn by talking to AI

From Chaos to Code: How I Built Two Python Scripts with ChatGPT (and What is in the bag ?)

How to Create Engaging Chatgpt Prompts

How to Navigate ChatGPT's Output Variability

ChatGPT Prompt Strategies for Copywriting

Chatgpt's Competition With Google

ChatGPT Problem-Solving Strategies

Explore content categories

Introduction

Recommended by LinkedIn

Conclusion

More articles by Anshu Singh

AWS DMS in Practice: How I Migrate Databases with Minimal Downtime

Mastering Linux Process Management: CLI & GUI Insights for Professionals

How to Set Up a GUI on a RHEL 9 AWS EC2 Instance

Comprehensive Guide to Launching an EC2 Instance on AWS

The Undeniable Importance of Linux in the Digital World

Building an Online Code Editor: Empowering Developers Everywhere

Capturing Linux RAM with LiME: A Deep Dive into Memory Forensics

Introducing AppExpo: Your All-in-One Web App

Building a Chatbot with GPT-3: Enhancing User Interaction

Empower Your Web Experience: Introducing the Media Capture Web App

Others also viewed

Self Build Voice Assistant !

Can the new ChatGPT competitor "Claude" - help you with coding questions?

Python Web Scraping Tips for Dynamic Element Extraction in Two Ways!

Introduction to the OpenAI API with Python

Easy multilingual Speech to Text in Python, using Google APIs

Will AI Replace Junior Developers? I Asked Experts at Pycon US

ChatGPT and Python to the Rescue: The Lazy Person's Guide to Summarizing Lengthy Texts

ChatBot in Python

Python fundamentals (Part 1): Learn by talking to AI

From Chaos to Code: How I Built Two Python Scripts with ChatGPT (and What is in the bag ?)

Similar topics

How to Create Engaging Chatgpt Prompts

How to Navigate ChatGPT's Output Variability

ChatGPT Prompt Strategies for Copywriting

Chatgpt's Competition With Google

ChatGPT Problem-Solving Strategies

Explore content categories