From 5098bf7bff37ef6650b8353900020309ad868846 Mon Sep 17 00:00:00 2001
From: arjundontflex <90552791+arjundontflex@users.noreply.github.com>
Date: Fri, 12 Jul 2024 09:07:57 +0530
Subject: [PATCH] Enhance Error Handling and Dynamic Dialog Generation

---
 The Prototype/app.py | 281 +++++++++++++++++--------------------------
 1 file changed, 112 insertions(+), 169 deletions(-)

diff --git a/The Prototype/app.py b/The Prototype/app.py
index 1b4ec2d..57598e8 100644
--- a/The Prototype/app.py	
+++ b/The Prototype/app.py	
@@ -8,11 +8,14 @@
 import pyttsx3
 import threading
 import traceback
+import logging
+
+# Initialize logging
+logging.basicConfig(level=logging.DEBUG, filename='game.log', filemode='w', format='%(name)s - %(levelname)s - %(message)s')
 
 # Initialize Pygame
 pygame.init()
 
-
 # Gemini LLM
 with open('config_keys.json') as f:
     config = json.load(f)
@@ -20,18 +23,17 @@
 genai.configure(api_key=api_key)
 model = genai.GenerativeModel('gemini-pro')
 
-
 screen_width = 1300
 screen_height = 600
 screen = pygame.display.set_mode((screen_width, screen_height))
 bg_img = pygame.image.load("background.jpg")
-bg_img = pygame.transform.scale(bg_img,(int(bg_img.get_width()*(screen_height/bg_img.get_height())),screen_height))
-rep = math.ceil(screen_width/bg_img.get_width())
-print(rep)
+bg_img = pygame.transform.scale(bg_img, (int(bg_img.get_width() * (screen_height / bg_img.get_height())), screen_height))
+rep = math.ceil(screen_width / bg_img.get_width())
+logging.info(f'Background repetition count: {rep}')
 
 pygame.display.set_caption("SuperSpeechSaga")
 
-player_image = [pygame.image.load("character/sprite_0.png"),pygame.image.load("character/sprite_1.png")]
+player_image = [pygame.image.load("character/sprite_0.png"), pygame.image.load("character/sprite_1.png")]
 player_rect = player_image[0].get_rect()
 player_rect.x = 50
 player_rect.y = 350
@@ -40,19 +42,19 @@
 JUMP_FORCE = -10
 font = pygame.font.Font(None, 24)
 
-villager_image = [pygame.image.load("side_character1/sprite_0.png"),pygame.image.load("character/sprite_1.png")]
+villager_image = [pygame.image.load("side_character1/sprite_0.png"), pygame.image.load("character/sprite_1.png")]
 villager_rect = player_image[0].get_rect()
 villager_rect.x = 500
 villager_rect.y = 350
 villager_text = "Villager 1 says: Hi"
-villager_text_surface = font.render(villager_text, True, (255, 255, 255))
+villager_text_surface = font.render(villager_text, True, WHITE)
 
 villager2_image = [pygame.image.load("side_character1/sprite_1.png")]
 villager2_rect = player_image[0].get_rect()
 villager2_rect.x = 750
 villager2_rect.y = 295
 villager2_text = "Villager 2 says: Hi"
-villager2_text_surface = font.render(villager2_text, True, (255, 255, 255))
+villager2_text_surface = font.render(villager2_text, True, WHITE)
 
 font2 = pygame.font.Font(None, 16)
 villager3_image = [pygame.image.load("side_character1/sprite_2.png")]
@@ -60,10 +62,9 @@
 villager3_rect.x = 150
 villager3_rect.y = 295
 villager3_text = "About the game"
-villager3_text_surface = font2.render(villager3_text, True, (255, 255, 255))
-
+villager3_text_surface = font2.render(villager3_text, True, WHITE)
 
-info_image = [pygame.image.load("assets/info.png"),pygame.image.load("assets/info_complete.png")]
+info_image = [pygame.image.load("assets/info.png"), pygame.image.load("assets/info_complete.png")]
 info_image_rect = info_image[0].get_rect()
 
 check_point = pygame.image.load("assets/check_point.png")
@@ -71,27 +72,22 @@
 check_point_rect.x = 1100
 check_point_rect.y = 350
 
-
+engine = pyttsx3.init()
 
 def perform_speech(prompt, villager):
+    global villager_text, villager2_text, villager3_text, e_not_yet_pressed, e_not_yet_pressed2
 
-    global villager_text
-    global villager2_text
-    global villager3_text
-    global e_not_yet_pressed
-    global e_not_yet_pressed2
-
-    if villager==0:
-        villager_text=f"..."
-    elif villager==1:
-        villager2_text=f"..."
-    elif villager==2:
-        villager3_text=f"..."
+    if villager == 0:
+        villager_text = f"..."
+    elif villager == 1:
+        villager2_text = f"..."
+    elif villager == 2:
+        villager3_text = f"..."
 
     try:
         # Gemini
         response = model.generate_content(prompt)
-        print(response.text)
+        logging.info(f'Response: {response.text}')
 
         res_text = response.text
 
@@ -101,32 +97,30 @@ def perform_speech(prompt, villager):
 
         dialog = json.loads(res_text)["dialog"]
 
-        print(dialog)
+        logging.info(f'Dialog: {dialog}')
 
-        if villager==0:
-            villager_text=f"Villager 1 says: {dialog}"
-        elif villager==1:
-            villager2_text=f"Villager 2 says: {dialog}"
-        elif villager==2:
-            villager3_text=f"Villager 3 says: {dialog}"
+        if villager == 0:
+            villager_text = f"Villager 1 says: {dialog}"
+        elif villager == 1:
+            villager2_text = f"Villager 2 says: {dialog}"
+        elif villager == 2:
+            villager3_text = f"Villager 3 says: {dialog}"
 
         # Pyttsx3
-        engine = pyttsx3.init()
         voices = engine.getProperty('voices')
-        engine.setProperty('voice', voices[villager%2].id)
-        print(dialog)
+        engine.setProperty('voice', voices[villager % 2].id)
+        logging.info(dialog)
         engine.say(dialog)
         engine.runAndWait()
     except Exception as e:
-        traceback.print_exc() 
-        if villager==0:
+        logging.error(traceback.format_exc())
+        if villager == 0:
             e_not_yet_pressed = True
         else:
             e_not_yet_pressed = True
-    
 
 def fall(player_rect):
-    if player_rect.y<350:
+    if player_rect.y < 350:
         player_rect.y += GRAVITY
 
 def divide_text(string):
@@ -142,6 +136,51 @@ def divide_text(string):
     
     return part1, part2, part3
 
+def handle_villager_interaction(villager_num, prompt, e_not_yet_pressed_flag, keys, villager_text, villager_text_surface, villager_text_rect):
+    if e_not_yet_pressed_flag and keys[pygame.K_e]:
+        overlay = pygame.Surface((screen_width, screen_height))
+        overlay.set_alpha(128)
+        overlay.fill((0, 0, 0))
+        screen.blit(overlay, (0, 0))
+        pygame.display.flip()
+
+        recognizer = sr.Recognizer()
+        with sr.Microphone() as source:
+            logging.info("Listening...")
+            audio = recognizer.listen(source)
+            try:
+                text = recognizer.recognize_google(audio)
+                logging.info(f'User said: {text}')
+
+                prompt = prompt.format(text=text)
+                logging.info(f'Prompt: {prompt}')
+
+                dialog_thread = threading.Thread(target=perform_speech, args=(prompt, villager_num))
+                dialog_thread.start()
+
+                return False
+            except Exception as e:
+                logging.error(e)
+                logging.error("No audio received")
+                return True
+    else:
+        x1, x2, x3 = divide_text(villager_text)
+        
+        villager_text_surface = font.render(x1, True, WHITE)
+        villager_text_rect = villager_text_surface.get_rect(center=(screen_width // 2, 530))
+
+        villager_text_surface_1 = font.render(x2, True, WHITE)
+        villager_text_rect_1 = villager_text_surface_1.get_rect(center=(screen_width // 2, 550))
+
+        villager_text_surface_2 = font.render(x3, True, WHITE)
+        villager_text_rect_2 = villager_text_surface_2.get_rect(center=(screen_width // 2, 570))
+
+        screen.blit(villager_text_surface, villager_text_rect)
+        screen.blit(villager_text_surface_1, villager_text_rect_1)
+        screen.blit(villager_text_surface_2, villager_text_rect_2)
+        
+    return e_not_yet_pressed_flag
+
 running = True
 walk_count = 0
 e_not_yet_pressed = True
@@ -151,7 +190,7 @@ def divide_text(string):
     
     fall(player_rect)
     for i in range(0, rep):
-        screen.blit(bg_img,(i*bg_img.get_width(),0))
+        screen.blit(bg_img, (i * bg_img.get_width(), 0))
     for event in pygame.event.get():
         if event.type == pygame.QUIT:
             running = False
@@ -175,148 +214,56 @@ def divide_text(string):
     screen.blit(check_point, check_point_rect)
 
     if isWalking:
-        screen.blit(player_image[walk_count%2], player_rect)
-        walk_count+=1
+        screen.blit(player_image[walk_count % 2], player_rect)
+        walk_count += 1
     else:
         screen.blit(player_image[0], player_rect)
 
     ######## Villager 1 ########
-    if player_rect.x<550 and player_rect.x>450:
+    if player_rect.x < 550 and player_rect.x > 450:
         info_image_rect.x = 510
         info_image_rect.y = 280
         if e_not_yet_pressed:
-            screen.blit(info_image[0],info_image_rect)
-        else:
-            screen.blit(info_image[1],info_image_rect)
-
-        if not e_not_yet_pressed:
-            x1,x2,x3 = divide_text(villager_text)
-            
-            villager_text_surface = font.render(x1, True, (255, 255, 255))
-            villager_text_rect = villager_text_surface.get_rect(center=(screen_width // 2, 530))
-
-            villager_text_surface_1 = font.render(x2, True, (255, 255, 255))
-            villager_text_rect_1 = villager_text_surface_1.get_rect(center=(screen_width // 2, 550))
-
-            villager_text_surface_2 = font.render(x3, True, (255, 255, 255))
-            villager_text_rect_2 = villager_text_surface_2.get_rect(center=(screen_width // 2, 570))
-
-            screen.blit(villager_text_surface, villager_text_rect)
-            screen.blit(villager_text_surface_1, villager_text_rect_1)
-            screen.blit(villager_text_surface_2, villager_text_rect_2)
+            screen.blit(info_image[0], info_image_rect)
         else:
-            villager_text_surface = font.render(villager_text, True, (255, 255, 255))
-            villager_text_rect = villager_text_surface.get_rect(center=(screen_width // 2, screen_height // 1.1))
-            screen.blit(villager_text_surface, villager_text_rect)
-        
-        if e_not_yet_pressed and keys[pygame.K_e]:
-            overlay = pygame.Surface((screen_width, screen_height))
-            overlay.set_alpha(128)
-            overlay.fill((0,0,0))
-            screen.blit(overlay, (0, 0))
-            pygame.display.flip()
-            
-            recognizer = sr.Recognizer()
-            with sr.Microphone() as source:
-                print("Listening...")
-                audio = recognizer.listen(source)
-                try:
-                    text = recognizer.recognize_google(audio)
-                    print(text)
+            screen.blit(info_image[1], info_image_rect)
 
-                    prompt = f'''Generate a dialog for game character that speaks in Shakespearean. This character knows location of checkpoint which is on right side of map. Only if a traveller asks about whereabouts of check point then mention character gives direction. Else character will talk about nice weather. If traveller says that he doesn't understand what he is saying then tell him to ask next villager
-                    Return the dialog in form of json {{dialog:<Character dialog>}}
-                    Traveller says: {text}
-                    '''
-                    print(prompt)
+        villager1_prompt = '''Generate a dialog for game character that speaks in Shakespearean. This character knows location of checkpoint which is on right side of map. Only if a traveller asks about whereabouts of check point then mention character gives direction. Else character will talk about nice weather. If traveller says that he doesn't understand what he is saying then tell him to ask next villager
+            Return the dialog in form of json {{dialog:<Character dialog>}}
+            Traveller says: {text}
+            '''
+        e_not_yet_pressed = handle_villager_interaction(0, villager1_prompt, e_not_yet_pressed, keys, villager_text, villager_text_surface, info_image_rect)
 
-                    dialog_thread = threading.Thread(target=perform_speech, args=(prompt,0))
-                    dialog_thread.start()
-
-                    e_not_yet_pressed = False
-                except Exception as e:
-                    print(e)
-                    print("No audio received")
-                    e_not_yet_pressed = True
-            
-    
     ######## Villager 2 ########
-    if player_rect.x<800 and player_rect.x>700:
+    if player_rect.x < 800 and player_rect.x > 700:
         info_image_rect.x = 750
         info_image_rect.y = 220
         if e_not_yet_pressed2:
-            screen.blit(info_image[0],info_image_rect)
+            screen.blit(info_image[0], info_image_rect)
         else:
-            screen.blit(info_image[1],info_image_rect)
-
-        if not e_not_yet_pressed2:
-            x1,x2,x3 = divide_text(villager2_text)
-            
-            villager2_text_surface = font.render(x1, True, (255, 255, 255))
-            villager2_text_rect = villager2_text_surface.get_rect(center=(screen_width // 2, 530))
+            screen.blit(info_image[1], info_image_rect)
 
-            villager2_text_surface_1 = font.render(x2, True, (255, 255, 255))
-            villager2_text_rect_1 = villager2_text_surface_1.get_rect(center=(screen_width // 2, 550))
-
-            villager2_text_surface_2 = font.render(x3, True, (255, 255, 255))
-            villager2_text_rect_2 = villager2_text_surface_2.get_rect(center=(screen_width // 2, 570))
-
-            screen.blit(villager2_text_surface, villager2_text_rect)
-            screen.blit(villager2_text_surface_1, villager2_text_rect_1)
-            screen.blit(villager2_text_surface_2, villager2_text_rect_2)
-        else:
-            villager2_text_surface = font.render(villager2_text, True, (255, 255, 255))
-            villager2_text_rect = villager2_text_surface.get_rect(center=(screen_width // 2, screen_height // 1.1))
-            
-            screen.blit(villager2_text_surface, villager2_text_rect)
-        
-        if e_not_yet_pressed2 and keys[pygame.K_e]:
-            overlay = pygame.Surface((screen_width, screen_height))
-            overlay.set_alpha(128)
-            overlay.fill((0,0,0))
-            screen.blit(overlay, (0, 0))
-            pygame.display.flip()
-            
-            recognizer = sr.Recognizer()
-            with sr.Microphone() as source:
-                print("Listening...")
-                audio = recognizer.listen(source)
-                try:
-                    text = recognizer.recognize_google(audio)
-                    print(text)
-
-                    prompt = f'''Generate a dialog for game character that speaks in GenZ lingo. This character knows location of checkpoint which is on right side of map. Only if a traveller asks about whereabouts of check point then mention character gives direction. Else character will talk about new tech she just discovered. Return the dialog in form of json {{dialog:<Character dialog>}}
-                    Traveller says: {text}
-                    '''
-                    print(prompt)
-
-                    dialog_thread = threading.Thread(target=perform_speech, args=(prompt,1))
-                    dialog_thread.start()
-
-                    e_not_yet_pressed2 = False
-                except Exception as e:
-                    print(e)
-                    print("No audio received")
-                    e_not_yet_pressed2 = True
-
-    
+        villager2_prompt = '''Generate a dialog for game character that speaks in GenZ lingo. This character knows location of checkpoint which is on right side of map. Only if a traveller asks about whereabouts of check point then mention character gives direction. Else character will talk about new tech she just discovered. Return the dialog in form of json {{dialog:<Character dialog>}}
+            Traveller says: {text}
+            '''
+        e_not_yet_pressed2 = handle_villager_interaction(1, villager2_prompt, e_not_yet_pressed2, keys, villager2_text, villager2_text_surface, info_image_rect)
 
     ######## Villager 3 ########
-    if player_rect.x<200 and player_rect.x>100:
+    if player_rect.x < 200 and player_rect.x > 100:
         info_image_rect.x = 150
         info_image_rect.y = 220
 
-        screen.blit(info_image[0],info_image_rect)
+        screen.blit(info_image[0], info_image_rect)
 
-        x1,x2,x3 = divide_text(villager3_text)
+        x1, x2, x3 = divide_text(villager3_text)
         
-        villager3_text_surface = font2.render(x1, True, (255, 255, 255))
+        villager3_text_surface = font2.render(x1, True, WHITE)
         villager3_text_rect = villager3_text_surface.get_rect(center=(screen_width // 2, 530))
 
-        villager3_text_surface_1 = font2.render(x2, True, (255, 255, 255))
+        villager3_text_surface_1 = font2.render(x2, True, WHITE)
         villager3_text_rect_1 = villager3_text_surface_1.get_rect(center=(screen_width // 2, 550))
         
-        villager3_text_surface_2 = font2.render(x3, True, (255, 255, 255))
+        villager3_text_surface_2 = font2.render(x3, True, WHITE)
         villager3_text_rect_2 = villager3_text_surface_2.get_rect(center=(screen_width // 2, 570))
 
         screen.blit(villager3_text_surface, villager3_text_rect)
@@ -326,35 +273,31 @@ def divide_text(string):
         if keys[pygame.K_e]:
             overlay = pygame.Surface((screen_width, screen_height))
             overlay.set_alpha(128)
-            overlay.fill((0,0,0))
+            overlay.fill((0, 0, 0))
             screen.blit(overlay, (0, 0))
             pygame.display.flip()
-            
+
             recognizer = sr.Recognizer()
             with sr.Microphone() as source:
-                print("Listening...")
+                logging.info("Listening...")
                 audio = recognizer.listen(source)
                 try:
                     text = recognizer.recognize_google(audio)
-                    print(text)
+                    logging.info(f'User said: {text}')
 
-                    prompt = f'''Generate a dialog for game character. This character tells us information about the game. Currently this is a prototype. The game is platform game in which we play using audio input using mic and move character using keys. The input is taken from the user and output is text and audio. Feels like talking with game character in real life. It tells us that this game generates dialog in realtime using LLM technology. Please keep explaination short and crisp. Return the dialog in form of json {{"dialog":<Character dialog>}}
+                    prompt = '''Generate a dialog for game character. This character tells us information about the game. Currently this is a prototype. The game is platform game in which we play using audio input using mic and move character using keys. The input is taken from the user and output is text and audio. Feels like talking with game character in real life. It tells us that this game generates dialog in realtime using LLM technology. Please keep explanation short and crisp. Return the dialog in form of json {{"dialog":<Character dialog>}}
                     Traveller says: {text}
                     '''
-                    print(prompt)
+                    logging.info(f'Prompt: {prompt}')
 
-                    dialog_thread = threading.Thread(target=perform_speech, args=(prompt,2))
+                    dialog_thread = threading.Thread(target=perform_speech, args=(prompt, 2))
                     dialog_thread.start()
                 except Exception as e:
-                    print(e)
-                    print("No audio received")
-
-    
+                    logging.error(e)
+                    logging.error("No audio received")
 
     pygame.display.flip()
-
     pygame.time.Clock().tick(60)
 
-
 pygame.quit()
 sys.exit()