<?xml version="1.0" encoding="utf-8" standalone="yes"?>
<rss version="2.0" xmlns:atom="http://www.w3.org/2005/Atom">
  <channel>
    <!-- Channel metadata for the "Audio" tag listing: human-readable title and
         description, the HTML page the feed mirrors, the generator name, the
         content language, and the time the feed was last built. -->
    <title>Audio on FOSS Engineer</title>
    <link>https://fossengineer.com/tags/audio/</link>
    <description>Recent content in Audio on FOSS Engineer</description>
    <generator>Hugo</generator>
    <language>en-US</language>
    <lastBuildDate>Sat, 06 Jun 2026 15:14:11 +0200</lastBuildDate>
    <!-- Atom self link: the URL of this feed document itself (rel="self"). -->
    <atom:link href="https://fossengineer.com/tags/audio/index.xml" rel="self" type="application/rss+xml" />
    <!-- Feed entry for the Voicebox article. The guid repeats the link URL.
         The description carries entity-escaped HTML (a <strong> element), so
         it must stay on one line with its escaping intact. -->
    <item>
      <title>Voicebox - Local AI Voice Studio for Speech, Dictation, and Agents</title>
      <link>https://fossengineer.com/voicebox-local-ai-voice-studio/</link>
      <pubDate>Sat, 06 Jun 2026 10:50:00 +0200</pubDate>
      <guid>https://fossengineer.com/voicebox-local-ai-voice-studio/</guid>
      <description>&lt;strong&gt;Voicebox&lt;/strong&gt; is a local AI voice studio for cloning voices, generating speech, dictating into apps, transcribing captures, adding effects, composing stories, and giving AI agents voices through REST and MCP. It ships a Tauri desktop app, FastAPI backend, web UI, Docker setup, and multiple local TTS/STT engines.</description>
    </item>
    <!-- Feed entry for the Voicebox page under /apps/. The guid repeats the
         link URL. The pubDate is midnight with a +0000 (UTC) offset. The
         description is an entity-escaped HTML paragraph. -->
    <item>
      <title>Voicebox</title>
      <link>https://fossengineer.com/apps/voicebox/</link>
      <pubDate>Sat, 06 Jun 2026 00:00:00 +0000</pubDate>
      <guid>https://fossengineer.com/apps/voicebox/</guid>
      <description>&lt;p&gt;Voicebox is a local AI voice studio with Docker support, REST endpoints, and MCP tools for giving agents a voice.&lt;/p&gt;</description>
    </item>
    <!-- Feed entry for the Chatterbox article. The guid repeats the link URL.
         The description carries entity-escaped HTML. The "&amp;rsquo;"
         sequence is intentional: after XML decoding it yields the HTML entity
         for a right single quote, which the consumer's HTML renderer resolves. -->
    <item>
      <title>Chatterbox - Local Open-Source Text-to-Speech by Resemble AI</title>
      <link>https://fossengineer.com/chatterbox-local-open-source-tts/</link>
      <pubDate>Fri, 05 Jun 2026 11:45:00 +0200</pubDate>
      <guid>https://fossengineer.com/chatterbox-local-open-source-tts/</guid>
      <description>&lt;strong&gt;Chatterbox&lt;/strong&gt; is Resemble AI&amp;rsquo;s MIT-licensed open-source text-to-speech toolkit. It ships Python APIs, Gradio demos, English and multilingual models, voice conversion, Turbo inference, paralinguistic tags, and built-in Perth watermarking. It is not a Docker-first self-hosted app; it is a local ML package where GPU access matters.</description>
    </item>
  </channel>
</rss>
