First commit from local working tree
This commit is contained in:
parent
86775d02f6
commit
32f0d1de88
12 changed files with 832 additions and 2 deletions
354
main.pyw
Normal file
354
main.pyw
Normal file
|
@ -0,0 +1,354 @@
|
|||
import array
|
||||
import config
|
||||
import os
|
||||
import pyaudio
|
||||
import random
|
||||
import typing
|
||||
import tkinter
|
||||
from tkinter import filedialog
|
||||
|
||||
|
||||
os.environ["PYGAME_HIDE_SUPPORT_PROMPT"] = "1"
|
||||
import pygame
|
||||
from pygame.locals import *
|
||||
|
||||
|
||||
__author__ = "Trysdyn Black"
|
||||
__license__ = "ACSL v1.4"
|
||||
__version__ = "1.0.0"
|
||||
__copyright__ = "Copyright 2022, Trysdyn Black"
|
||||
|
||||
|
||||
class Audio:
    """Audio subsystem that monitors a microphone and determines avatar state.

    Methods
    -------
    get_state() -> bool
        Evaluate buffered audio data and return true if the peak amplitude is over the configured threshold.
        Indicates the mic is hot. Also drains the audio buffer.
    """

    def __init__(self, channels: int, rate: int, frames: int, threshold: int = 5000, smoothing: int = 0) -> None:
        """
        Parameters
        ----------
        channels : int
            Number of audio channels in the input device, usually 1 or 2 for mono/stereo
        rate : int
            Sample rate of the audio device, typically 44100 or 48000 as configured in Windows
        frames : int
            Number of samples read from the buffer per check. The buffer is fully drained each check
        threshold : int
            Audio amplitude at which we consider the mic hot
        smoothing : int
            Number of frames we continue to consider the mic hot after it stops being hot
        """
        p = pyaudio.PyAudio()
        self.frames = frames
        self.stream = p.open(
            format=pyaudio.paInt16,
            channels=channels,
            rate=rate,
            input=True,
            frames_per_buffer=frames,
        )

        self.threshold = threshold
        self.smoothing = smoothing
        # Countdown of smoothing frames remaining since the mic was last hot
        self.this_smooth = 0

    def get_state(self) -> bool:
        """Check audio buffer and indicate if the avatar's mouth should be open this frame.

        Returns
        -------
        bool
            Returns true if the avatar's mouth should be considered open this frame
        """
        # Grab a window of mic data into 16-bit signed integer representations
        data = self.stream.read(self.frames, exception_on_overflow=False)
        a_data = array.array("h", data)

        # Return true if the peak sample is over threshold, or it's been fewer
        # than `smoothing` checks since the last time we were over threshold.
        # default=0 guards against an empty read (no samples available).
        if max(a_data, default=0) > self.threshold:
            self.this_smooth = self.smoothing
            return True
        elif self.this_smooth:
            self.this_smooth -= 1
            return True

        return False
|
||||
|
||||
|
||||
class Tube:
    """Encapsulates avatar and windowing logic, handles drawing.

    Methods
    -------
    should_blink() -> bool
        Evaluate all available settings and data and return true if the avatar should be blinking this frame.
    update()
        Perform one frame of checks, logic, and prep and draw the avatar.
    """

    def __init__(
        self,
        image_closed: str,
        image_open: typing.Optional[str] = None,
        image_blink_closed: typing.Optional[str] = None,
        image_blink_open: typing.Optional[str] = None,
        blink_chance: float = 0,
        blink_frames: int = 0,
        shake_intensity: int = 0,
        shake_delay: int = 0,
        win_size: typing.Optional[tuple] = None,
        bg_color: tuple = (0, 255, 0),
    ) -> None:
        """
        Parameters
        ----------
        image_closed : string
            Filename for the image to load for a opened eyes/closed mouth avatar state.
            Mandatory.
        image_open : string or None
            Filename for the image to load for a opened eyes/opened mouth avatar state.
            Defaults to None.
        image_blink_closed : string or None
            Filename for the image to load for a closed eyes/closed mouth avatar state.
            Defaults to None.
        image_blink_open : string or None
            Filename for the image to load for a closed eyes/opened mouth avatar state.
            Defaults to None.
        blink_chance : float
            A chance, out of 1.0, to activate blinking each frame of rendering.
            Defaults to 0 to disable blinking.
        blink_frames : int
            How many frames to hold the eyes-closed state after activating a blink.
            Defaults to 0 to disable blinking.
        shake_intensity : int
            How far in pixels to limit movement on each axis when shaking.
            Defaults to 0 to disable shaking.
        shake_delay : int
            How many frames to prevent shaking after completing a prior shake.
            Defaults to 0.
        win_size : tuple(int, int) or None
            Window size as a tuple of ints (width, height).
            Defaults to None, which uses the image size of image_closed instead.
        bg_color : tuple(int, int, int)
            Background color as a tuple of ints (red, green, blue).
            Defaults to (0, 255, 0) for greenscreen green.
        """
        self.open_frames = 0
        self.blinked_frames = 0

        # These display settings are temporary. We can't load images without it
        self.display = pygame.display.set_mode((400, 300))
        pygame.display.set_caption("pyngtube")

        # Closed mouth image is mandatory
        self.image_closed = pygame.image.load(image_closed).convert_alpha()

        # Open mouth image is optional
        if image_open:
            self.image_open = pygame.image.load(image_open).convert_alpha()
        else:
            self.image_open = None

        # Blinking images are optional
        if image_blink_closed:
            self.image_blink_closed = pygame.image.load(image_blink_closed).convert_alpha()
        else:
            self.image_blink_closed = None

        if image_blink_open:
            self.image_blink_open = pygame.image.load(image_blink_open).convert_alpha()
        else:
            self.image_blink_open = None

        # Establish our blink settings
        self.blink_chance = blink_chance
        self.blink_frames = blink_frames

        # If we only have a closed-mouth image (why?) use it for open-mouth too
        using_image_open = self.image_open if self.image_open else self.image_closed

        # State map for which image to use. (Mouth Opened?, Blinked?)
        # If we don't have blinked images, we use the non-blinked images for those slots
        self.state_map = {
            (False, False): self.image_closed,
            (True, False): using_image_open,
            (False, True): self.image_blink_closed if self.image_blink_closed else self.image_closed,
            (True, True): self.image_blink_open if self.image_blink_open else using_image_open,
        }

        # If we specified a window size, use it. If not use closed image size.
        # Then pad by shake_intensity on each side to leave room for shaking.
        if not win_size:
            win_size = self.image_closed.get_size()

        self.win_size = (
            win_size[0] + (shake_intensity * 2),
            win_size[1] + (shake_intensity * 2),
        )

        # Background color to blank with, likely a greenscreen color
        self.bg_color = bg_color

        # Shaking intensity in pixels, and number of frames to wait between shakes
        self.shake_intensity = shake_intensity
        self.shake_delay = shake_delay

        # Create our drawing buffer and initialize true display size
        self.buf = pygame.surface.Surface(self.image_closed.get_size())
        self.display = pygame.display.set_mode(self.win_size, pygame.RESIZABLE)

    def should_blink(self) -> bool:
        """Check if we're currently blinking and check blink_chance to indicate if we should be blinking this frame.

        Returns
        -------
        bool
            Returns true if the avatar's eyes should be considered closed this frame.
        """
        # If we're blinking and haven't reached the configured blink duration yet
        # extend blinking by a frame to keep the eyes shut.
        # Otherwise roll blink chance and set blink if the roll wins.
        if self.blinked_frames and self.blinked_frames < self.blink_frames:
            self.blinked_frames += 1
            return True
        else:
            if random.random() < self.blink_chance:
                self.blinked_frames += 1
                return True

            self.blinked_frames = 0
            return False

    def update(self, opened: bool, blinked: bool) -> None:
        """Perform updates and drawing for one frame. This should be called once a frame and fed avatar state info on
        open mouth and blinking. This handles all the other placement, style, and drawing functions from there.

        Parameters
        ----------
        opened : bool
            true if the avatar's mouth should be open this frame.
        blinked : bool
            true if the avatar's eyes should be closed this frame.
        """
        # Blank with bg_color
        self.display.fill(self.bg_color)
        self.buf.fill(self.bg_color)

        # Jitter tracks our offset from origin for shaking
        # It's applied as a transformation to image location each frame
        jitter = (0, 0)
        i = self.shake_intensity

        # Figure out which image we're drawing this frame using our state map
        this_frame_image = self.state_map[(opened, blinked)]

        # If the mic state is opened and an open mouth image exists, blit it
        # to the drawing buffer. Otherwise use the closed mouth image.
        if opened and self.image_open:
            self.open_frames += 1

            # Randomize our jitter if we're currently shaking.
            # NOTE: shaking only triggers when shake_delay > 0, even if
            # shake_intensity is set.
            if self.shake_delay and not self.open_frames % self.shake_delay:
                jitter = (random.randint(-i, i), random.randint(-i, i))
        else:
            self.open_frames = 0
            jitter = (0, 0)

        # Draw our chosen image to a drawing buffer
        self.buf.blit(this_frame_image, (0, 0))

        # Resize the drawing buffer to the window size if necessary
        # Scale on the vertical axis to maximum window size.
        # If we're configured to shake the sprite on open mic, randomly
        # jitter the sprite around the frame a bit while mic is open.
        display_size = self.display.get_size()
        shrunk_size = (display_size[0] - (i * 2), display_size[1] - (i * 2))
        if self.buf.get_size() != shrunk_size:
            new_buf = pygame.transform.scale(self.buf, shrunk_size)
            self.display.blit(new_buf, (i + jitter[0], i + jitter[1]))
        else:
            self.display.blit(self.buf, (i + jitter[0], i + jitter[1]))

        pygame.display.flip()
|
||||
|
||||
|
||||
if __name__ == "__main__":
    # I use some not-great extreme shorthand in the main loop here:
    # c = config object
    # a = audio subsystem object
    # t = pngtube object, the window and avatar object
    done = False    # renamed from `quit` to avoid shadowing the builtin
    rehash = True   # forces a (re)load of the avatar profile on first pass
    root = tkinter.Tk()
    root.withdraw()  # hide tkinter's root window; we only use its file dialogs
    pygame.init()

    # Load config
    c = config.Config()

    # Initialize audio system
    a = Audio(
        channels=2 if c.mic_stereo else 1,
        rate=c.mic_rate,
        frames=int(c.mic_rate / c.audio_checks),
        threshold=c.threshold,
        smoothing=c.smoothing,
    )

    while not done:
        # Reload our avatar if we've been instructed to rehash settings
        if rehash:
            t = Tube(
                image_closed=c.image_closed,
                image_open=c.image_open,
                image_blink_closed=c.image_blink_closed,
                image_blink_open=c.image_blink_open,
                blink_chance=c.blink_chance,
                blink_frames=c.blink_frames,
                bg_color=c.bg_color,
                shake_delay=c.shake_delay,
                shake_intensity=c.shake_intensity,
            )
            rehash = False
        for event in pygame.event.get():
            # Clean shutdown if user clicks the [X]
            if event.type == QUIT:
                pygame.quit()
                a.stream.close()
                done = True
                break
            # If the window gets resized, handle redrawing the window in the new size
            elif event.type == pygame.VIDEORESIZE:
                # Scale only on vertical axis. Force horizontal axis to match
                # the drawing buffer's aspect ratio.
                win_size = (event.w, event.h)
                buf_ratio = t.buf.get_width() / t.buf.get_height()
                # int() cast: the ratio math yields a float, but
                # pygame.display.set_mode requires integer dimensions.
                t.win_size = (int(win_size[1] * buf_ratio), win_size[1])
                t.display = pygame.display.set_mode(t.win_size, pygame.RESIZABLE)
            # Mouse wheel up and down changes mic threshold.
            # TODO: Provide some kind of user feedback
            # But I don't want it visible in the capture region
            elif event.type == pygame.MOUSEWHEEL:
                a.threshold += event.y * 100
                print(a.threshold)
            # RMB to open load file dialog for profile
            elif event.type == pygame.MOUSEBUTTONDOWN:
                if event.button == 3:
                    file_types = [("yaml files", "profile.yaml")]
                    file_path = filedialog.askopenfilename(title="Select a profile", filetypes=file_types)
                    if file_path:
                        c.profile = os.path.dirname(file_path)
                        rehash = True

        # Check mic, update image
        if not done:
            t.update(a.get_state(), t.should_blink())
|
Loading…
Add table
Add a link
Reference in a new issue