lukmay · phoenixray2000 · May 18, 2026 · May 18, 2026 · May 18, 2026 · May 18, 2026
diff --git a/README.md b/README.md
@@ -17,14 +17,18 @@ It sits quietly in your system tray and is always ready with a single click or g
     -   🎤 **Microphone:** Record your voice.
     -   🔊 **System Audio:** Record what you hear (Loopback).
     -   🎙️+🔊 **Both:** Record both tracks simultaneously (mixed).
+-   **Output Profiles:**
+    -   **Format:** Save recordings as WAV, FLAC, or MP3.
+    -   **Quality:** Choose Balanced for compact 16 kHz output or High Quality for 48 kHz output.
+    -   **Stereo:** Keep stereo channels when needed, or leave it off for mono recordings.
 -   **Post-Processing:**
-    -   **Auto-Normalize:** Automatically adjusts volume to optimal levels after recording.
+    -   **Auto-Normalize:** Lifts the main voice/body of each source before mixing and limits sharp peaks so brief spikes do not bury the recording.
     -   **Clipboard Integration:** Automatically copies the file (or file path) to your clipboard.
     -   **Clean Workflow:** Option to move the file to a temp folder and copy it, keeping your desktop clean.
 -   **Control:**
     -   **Global Hotkeys:** Start/Stop recording from anywhere (e.g., `Ctrl+Alt+R`).
-    -   **Tray Icon:** Left-click to toggle recording immediately.
-    -   **Visual Feedback:** Tray icon changes color when recording.
+    -   **Tray Icon:** Left-click to toggle recording immediately; right-click to open the recordings folder, settings, or exit.
+    -   **Visual Feedback:** Tray icon changes color when recording, and an optional always-on-top floating timer shows recording status with the same right-click menu.
 
 ## Installation
 
@@ -35,10 +39,11 @@ It sits quietly in your system tray and is always ready with a single click or g
 ## Usage
 
 1.  **Right-click** the tray icon to open **Settings**.
-2.  Select your **Microphone** and **Output Folder**.
+2.  Select your **Microphone**, **Output Folder**, **Format**, **Quality**, and **Stereo** preference.
 3.  Set your **Hotkeys** (optional).
+    - Disable **Show floating recording timer** if you do not want the compact always-on-top recording indicator.
 4.  **Left-click** the tray icon or use a hotkey to start recording.
-5.  Click again to stop. The file is saved and ready to use!
+5.  Click the tray icon again, use a stop hotkey, or click the floating timer to stop. The floating timer changes state immediately, then hides after 5 seconds; click it again before it hides to open the recordings folder.
 
 ## Development
 

diff --git a/audio_recorder.py b/audio_recorder.py
@@ -6,24 +6,109 @@
 import lameenc
 import numpy as np
 import tempfile
-import shutil
+
+FORMAT_CONFIG = {
+    "wav": {
+        "label": "WAV",
+        "extension": ".wav",
+        "encoder": "soundfile",
+        "format": "WAV",
+    },
+    "flac": {
+        "label": "FLAC",
+        "extension": ".flac",
+        "encoder": "soundfile",
+        "format": "FLAC",
+    },
+    "mp3": {
+        "label": "MP3",
+        "extension": ".mp3",
+        "encoder": "lameenc",
+    },
+}
+
+QUALITY_CONFIG = {
+    "balanced": {
+        "label": "Balanced",
+        "sample_rate": 16000,
+        "subtype": "PCM_16",
+        "mp3_bitrate_kbps": 64,
+    },
+    "high": {
+        "label": "High Quality",
+        "sample_rate": 48000,
+        "subtype": "PCM_24",
+        "mp3_bitrate_kbps": 128,
+    },
+}
+
+NORMALIZE_ACTIVE_FLOOR = 0.001
+NORMALIZE_TARGET_LEVEL = 0.12
+NORMALIZE_MAX_GAIN = 8.0
+NORMALIZE_REFERENCE_PERCENTILE = 95
+NORMALIZE_LIMIT = 0.98
+
+
+def build_output_profile(fmt, quality, stereo):
+    fmt_key = str(fmt or "").strip().lower()
+    quality_key = str(quality or "").strip().lower()
+
+    if fmt_key not in FORMAT_CONFIG:
+        raise ValueError(f"Unsupported output format: {fmt}")
+    if quality_key not in QUALITY_CONFIG:
+        raise ValueError(f"Unsupported output quality: {quality}")
+
+    format_config = FORMAT_CONFIG[fmt_key]
+    quality_config = QUALITY_CONFIG[quality_key]
+    channels = 2 if stereo else 1
+    return {
+        **quality_config,
+        **format_config,
+        "label": format_config["label"],
+        "format_label": format_config["label"],
+        "quality_label": quality_config["label"],
+        "format_key": fmt_key,
+        "quality_key": quality_key,
+        "channels": channels,
+    }
+
+
+def describe_output_profile(fmt, quality, stereo):
+    profile = build_output_profile(fmt, quality, stereo)
+    rate_khz = profile["sample_rate"] // 1000
+    channels = "stereo" if profile["channels"] == 2 else "mono"
+    encoding = (
+        f"{profile['mp3_bitrate_kbps']} kbps"
+        if profile["encoder"] == "lameenc"
+        else profile["subtype"]
+    )
+    return f"{profile['format_label']} / {rate_khz} kHz / {channels} / {encoding}"
+
 
 class RawRecorder(threading.Thread):
     """
     Helper thread to record a single device to a WAV file.
     """
-    def __init__(self, device, filepath, samplerate=44100, channels=2):
+    def __init__(self, device, filepath, samplerate=44100, channels=2, subtype="PCM_16"):
         super().__init__()
         self.device = device
         self.filepath = filepath
         self.samplerate = samplerate
         self.channels = channels
+        self.subtype = subtype
         self.stop_event = threading.Event()
         self.error = None
 
     def run(self):
         try:
-            with sf.SoundFile(self.filepath, mode='w', samplerate=self.samplerate, channels=self.channels) as f_wav:
+            with sf.SoundFile(
+                self.filepath,
+                mode="w",
+                samplerate=self.samplerate,
+                channels=self.channels,
+                format="WAV",
+                subtype=self.subtype,
+            ) as f_wav:
                 with self.device.recorder(samplerate=self.samplerate, channels=self.channels) as mic:
                     while not self.stop_event.is_set():
                         data = mic.record(numframes=2048)
@@ -39,13 +124,25 @@ class AudioRecorder(threading.Thread):
     """
     Orchestrates recording from Microphone, Loopback, or Both.
     """
-    def __init__(self, mic_id, source_mode, output_folder, output_format="mp3", 
-                 normalize=False, on_finish_callback=None):
+    def __init__(
+        self,
+        mic_id,
+        source_mode,
+        output_folder,
+        output_format="flac",
+        quality="balanced",
+        stereo=False,
+        normalize=False,
+        on_finish_callback=None,
+    ):
         super().__init__()
         self.mic_id = mic_id
         self.source_mode = source_mode # "mic", "loopback", "both"
         self.output_folder = output_folder
-        self.output_format = output_format.lower()
+        self.output_format = str(output_format or "flac").strip().lower()
+        self.quality = str(quality or "balanced").strip().lower()
+        self.stereo = bool(stereo)
+        self.profile = build_output_profile(self.output_format, self.quality, self.stereo)
         self.normalize = normalize
         self.callback = on_finish_callback
 
@@ -82,6 +179,10 @@ def run(self):
         self.recorders = []
 
         try:
+            samplerate = self.profile["sample_rate"]
+            channels = self.profile["channels"]
+            subtype = self.profile["subtype"]
+
             # 1. Setup Recorders
             if self.source_mode == "both":
                 # Need two recorders
@@ -92,20 +193,20 @@ def run(self):
                 t2 = tempfile.NamedTemporaryFile(suffix=".wav", delete=False).name
                 self.temp_files = [t1, t2]
 
-                self.recorders.append(RawRecorder(dev_mic, t1))
-                self.recorders.append(RawRecorder(dev_loop, t2))
+                self.recorders.append(RawRecorder(dev_mic, t1, samplerate=samplerate, channels=channels, subtype=subtype))
+                self.recorders.append(RawRecorder(dev_loop, t2, samplerate=samplerate, channels=channels, subtype=subtype))
 
             elif self.source_mode == "loopback":
                 dev = self._get_device(is_loopback=True)
                 t1 = tempfile.NamedTemporaryFile(suffix=".wav", delete=False).name
                 self.temp_files = [t1]
-                self.recorders.append(RawRecorder(dev, t1))
+                self.recorders.append(RawRecorder(dev, t1, samplerate=samplerate, channels=channels, subtype=subtype))
 
             else: # mic
                 dev = self._get_device(is_loopback=False)
                 t1 = tempfile.NamedTemporaryFile(suffix=".wav", delete=False).name
                 self.temp_files = [t1]
-                self.recorders.append(RawRecorder(dev, t1))
+                self.recorders.append(RawRecorder(dev, t1, samplerate=samplerate, channels=channels, subtype=subtype))
 
             print(f"Starting recording mode: {self.source_mode}")
 
@@ -123,31 +224,16 @@ def run(self):
                     raise Exception(f"Recorder error: {r.error}")
 
             # 4. Mix/Process
-            if len(self.temp_files) == 2:
-                mixed_wav = tempfile.NamedTemporaryFile(suffix=".wav", delete=False).name
-                self._mix_audio(self.temp_files[0], self.temp_files[1], mixed_wav)
-                # Use mixed file as source for next steps
-                source_wav = mixed_wav
-                self.temp_files.append(mixed_wav) # Mark for cleanup
-            else:
-                source_wav = self.temp_files[0]
-
-            # 5. Normalization
-            if self.normalize:
-                self._normalize_audio(source_wav)
+            source_wav = self._prepare_source_wav(subtype)
 
             # 6. Finalize
             if not os.path.exists(self.output_folder):
                 os.makedirs(self.output_folder)
 
             timestamp = time.strftime("%Y%m%d_%H%M%S")
-            filename = f"Recording_{timestamp}.{self.output_format}"
+            filename = f"Recording_{timestamp}{self.profile['extension']}"
             self.final_filepath = os.path.join(self.output_folder, filename)
-
-            if self.output_format == "mp3":
-                self._convert_to_mp3(source_wav, self.final_filepath)
-            else:
-                shutil.copy2(source_wav, self.final_filepath)
+            self._write_final_output(source_wav, self.final_filepath)
 
         except Exception as e:
             self.error_message = str(e)
@@ -167,9 +253,40 @@ def run(self):
     def stop(self):
         self.stop_event.set()
 
-    def _mix_audio(self, file1, file2, out_file):
-        d1, sr1 = sf.read(file1)
-        d2, sr2 = sf.read(file2)
+    def _prepare_source_wav(self, subtype):
+        if len(self.temp_files) == 2:
+            if self.normalize:
+                self._normalize_audio(self.temp_files[0])
+                self._normalize_audio(self.temp_files[1])
+
+            mixed_wav = tempfile.NamedTemporaryFile(suffix=".wav", delete=False).name
+            self._mix_audio(
+                self.temp_files[0],
+                self.temp_files[1],
+                mixed_wav,
+                subtype,
+                limit_output=self.normalize,
+            )
+            self.temp_files.append(mixed_wav) # Mark for cleanup
+
+            if self.normalize:
+                self._limit_audio(mixed_wav)
+
+            return mixed_wav
+
+        source_wav = self.temp_files[0]
+        if self.normalize:
+            self._normalize_audio(source_wav)
+        return source_wav
+
+    def _mix_audio(self, file1, file2, out_file, subtype, limit_output=False):
+        d1, sr1 = sf.read(file1, always_2d=True)
+        d2, sr2 = sf.read(file2, always_2d=True)
+
+        if sr1 != sr2:
+            raise ValueError("Cannot mix audio with different sample rates.")
+        if d1.shape[1] != d2.shape[1]:
+            raise ValueError("Cannot mix audio with different channel counts.")
 
         # Ensure same length
         max_len = max(len(d1), len(d2))
@@ -178,42 +295,83 @@ def _mix_audio(self, file1, file2, out_file):
         if len(d1) < max_len:
             pad_width = max_len - len(d1)
             # handle mono/stereo padding
-            shape = (pad_width, d1.shape[1]) if d1.ndim > 1 else (pad_width,)
+            shape = (pad_width, d1.shape[1])
             d1 = np.concatenate((d1, np.zeros(shape, dtype=d1.dtype)))
 
         # Pad d2
         if len(d2) < max_len:
             pad_width = max_len - len(d2)
-            shape = (pad_width, d2.shape[1]) if d2.ndim > 1 else (pad_width,)
+            shape = (pad_width, d2.shape[1])
             d2 = np.concatenate((d2, np.zeros(shape, dtype=d2.dtype)))
 
-        # Mix (Sum)
         mixed = d1 + d2
-        # Clip
-        mixed = np.clip(mixed, -1.0, 1.0)
+        if limit_output:
+            mixed = self._apply_limiter(mixed)
+        else:
+            mixed = np.clip(mixed, -1.0, 1.0)
 
-        sf.write(out_file, mixed, sr1) # Assume sr1 == sr2 = 44100
+        sf.write(out_file, mixed, sr1, format="WAV", subtype=subtype)
 
     def _normalize_audio(self, filepath):
         try:
-            data, sr = sf.read(filepath)
-            max_val = np.max(np.abs(data))
-            if max_val > 0:
-                target_peak = 0.99 
-                factor = target_peak / max_val
-                data = data * factor
-                sf.write(filepath, data, sr)
+            info = sf.info(filepath)
+            data, sr = sf.read(filepath, always_2d=True)
+            data = self._normalize_audio_data(data)
+            sf.write(filepath, data, sr, format=info.format, subtype=info.subtype)
         except Exception as e:
             print(f"Normalization failed: {e}")
 
-    def _convert_to_mp3(self, src_wav, dst_mp3):
-        data, sr = sf.read(src_wav)
-        channels = data.shape[1] if data.ndim > 1 else 1
+    def _normalize_audio_data(self, data):
+        active = np.abs(data)
+        active = active[active >= NORMALIZE_ACTIVE_FLOOR]
+        if active.size == 0:
+            return self._apply_limiter(data)
+
+        rms = float(np.sqrt(np.mean(active ** 2)))
+        percentile = float(np.percentile(active, NORMALIZE_REFERENCE_PERCENTILE))
+        reference_level = max(rms, percentile)
+        if not np.isfinite(reference_level) or reference_level <= 0:
+            return self._apply_limiter(data)
+
+        gain = min(NORMALIZE_TARGET_LEVEL / reference_level, NORMALIZE_MAX_GAIN)
+        return self._apply_limiter(data * gain)
+
+    def _limit_audio(self, filepath):
+        info = sf.info(filepath)
+        data, sr = sf.read(filepath, always_2d=True)
+        data = self._apply_limiter(data)
+        sf.write(filepath, data, sr, format=info.format, subtype=info.subtype)
+
+    def _apply_limiter(self, data):
+        return np.clip(data, -NORMALIZE_LIMIT, NORMALIZE_LIMIT)
+
+    def _write_final_output(self, source_wav, final_filepath):
+        if self.profile["encoder"] == "lameenc":
+            self._convert_to_mp3(source_wav, final_filepath, self.profile["mp3_bitrate_kbps"])
+            return
+
+        data, sr = sf.read(source_wav, always_2d=True)
+        if self.profile["channels"] == 1 and data.shape[1] > 1:
+            data = np.mean(data, axis=1, keepdims=True)
+
+        sf.write(
+            final_filepath,
+            data,
+            sr,
+            format=self.profile["format"],
+            subtype=self.profile["subtype"],
+        )
+
+    def _convert_to_mp3(self, src_wav, dst_mp3, bitrate_kbps):
+        data, sr = sf.read(src_wav, always_2d=True)
+        if self.profile["channels"] == 1 and data.shape[1] > 1:
+            data = np.mean(data, axis=1, keepdims=True)
+        channels = data.shape[1]
 
         pcm_data = (data * 32767).clip(-32768, 32767).astype(np.int16)
 
         encoder = lameenc.Encoder()
-        encoder.set_bit_rate(192)
+        encoder.set_bit_rate(bitrate_kbps)
         encoder.set_in_sample_rate(sr)
         encoder.set_channels(channels)
         encoder.set_quality(2)