speaches-ai · fedirz · Mar 6, 2025 · Mar 3, 2025 · Mar 3, 2025 · Mar 6, 2025
diff --git a/contributing.md b/contributing.md
@@ -0,0 +1,3 @@
+    uv venv
+    source .venv/bin/activate
+    uv sync --all-extras
diff --git a/docs/usage/text-to-speech.md b/docs/usage/text-to-speech.md
@@ -1,7 +1,3 @@
-!!! warning
-
-    `rhasspy/piper-voices` is only supported on x86_64. I was unable to build [piper-phonemize](https://github.com/rhasspy/piper-phonemize) for ARM. If you have experience building Python packages with third-party C++ dependencies, please consider contributing. See [#234](https://github.com/speaches-ai/speaches/issues/234) for more information.
-
 !!! note
 
     Before proceeding, you should be familiar with the [OpenAI Text-to-Speech](https://platform.openai.com/docs/guides/text-to-speech) and the relevant [OpenAI API reference](https://platform.openai.com/docs/api-reference/audio/createSpeech)

diff --git a/pyproject.toml b/pyproject.toml
@@ -8,10 +8,10 @@ dependencies = [
     "fastapi>=0.115.6",
     "faster-whisper>=1.1.1",
     "huggingface-hub[hf-transfer]>=0.25.1",
-    "kokoro-onnx[gpu]>=0.4.2,<0.5.0",
+    "kokoro-onnx[gpu]>=0.4.5,<0.5.0",
     "numpy>=2.1.1",
-    "piper-phonemize ; platform_machine == 'x86_64'",
-    "piper-tts>=1.2.0 ; platform_machine == 'x86_64'",
+    "piper-phonemize ; sys_platform == 'linux'",
+    "piper-tts>=1.2.0 ; sys_platform == 'linux'",
     "pydantic-settings>=2.5.2",
     "pydantic>=2.10.0",
     "python-multipart>=0.0.10",
@@ -148,11 +148,12 @@ markers = [
 
 [tool.uv]
 constraint-dependencies = ["llvmlite>=0.40.0"]
-# TODO: create an issue on https://github.com/thewh1teagle/kokoro-onnx regarding this
-override-dependencies = ["onnxruntime-gpu>=1.20.1 ; platform_machine == 'x86_64'"]
 
 [tool.uv.sources]
-piper-phonemize = { url = "https://github.com/fedirz/piper-phonemize/raw/refs/heads/master/dist/piper_phonemize-1.2.0-cp312-cp312-manylinux_2_28_x86_64.whl" }
+piper-phonemize = [
+  { url = "https://github.com/fedirz/piper-phonemize/raw/refs/heads/master/dist/piper_phonemize-1.2.0-cp312-cp312-manylinux_2_28_aarch64.whl", marker = "platform_machine == 'aarch64' and sys_platform == 'linux'" },
+  { url = "https://github.com/fedirz/piper-phonemize/raw/refs/heads/master/dist/piper_phonemize-1.2.0-cp312-cp312-manylinux_2_28_x86_64.whl", marker = "platform_machine == 'x86_64' and sys_platform == 'linux'" },
+]
 
 [[tool.uv.dependency-metadata]]
 name = "piper-tts"

diff --git a/src/speaches/main.py b/src/speaches/main.py
@@ -1,7 +1,6 @@
 from __future__ import annotations
 
 import logging
-import platform
 
 from fastapi import (
     FastAPI,
@@ -59,9 +58,6 @@ def create_app() -> FastAPI:
 
     logger.debug(f"Config: {config}")
 
-    if platform.machine() != "x86_64":
-        logger.warning("`POST /v1/audio/speech` with `model=rhasspy/piper-voices` is only supported on x86_64 machines")
-
     dependencies = []
     if config.api_key is not None:
         dependencies.append(ApiKeyDependency)

diff --git a/tests/speech_test.py b/tests/speech_test.py
@@ -1,15 +1,10 @@
 import io
-import platform
 
 from openai import AsyncOpenAI, UnprocessableEntityError
 import pytest
 import soundfile as sf
 
-platform_machine = platform.machine()
-if platform_machine != "x86_64":
-    pytest.skip("Only supported on x86_64", allow_module_level=True)
-
-from speaches.routers.speech import (  # noqa: E402
+from speaches.routers.speech import (
     DEFAULT_MODEL_ID,
     DEFAULT_RESPONSE_FORMAT,
     DEFAULT_VOICE_ID,