{ "$schema": "https://huggingface.co/FatalErrorVXD/ltx-desktop-assets/raw/main/manifest.schema.json", "manifest_version": "0.1.0", "ltx_desktop_min_version": "0.14.5", "updated_at": "2026-06-06", "license_envelope": "non-commercial", "consent_screen": { "intro": "LTX Desktop bundles several open-source AI models with different license terms. Please review and accept each before installation continues. LTX Desktop is a non-commercial application; if you plan to use it for revenue-generating work, do not accept these terms — contact each model's vendor for a commercial license.", "licenses": [ { "id": "fish-audio-research", "display_name": "Fish Audio S2-Pro — Fish Audio Research License", "summary": "Text-to-speech model. Research and non-commercial use only. Attribution required.", "full_text_path": "fish-audio/LICENSE.md", "applies_to": ["fish-audio"] }, { "id": "qwen-image-edit-cc-by-nc-sa", "display_name": "Qwen-Image-Edit-2511 (4-bit) — CC-BY-NC-SA-4.0", "summary": "Image editing model (4-bit quantization). Non-commercial use only. Attribution + share-alike required.", "full_text_path": "qwen-edit/LICENSE", "applies_to": ["qwen-edit"] }, { "id": "cocktail-fork-mit", "display_name": "Cocktail-Fork MRX — MIT License", "summary": "Audio source separation (speech / music / SFX). Permissive MIT license — commercial use permitted with attribution. Copyright (c) 2023 Mitsubishi Electric Research Laboratories (MERL).", "full_text_path": null, "applies_to": ["cocktail-fork-mrx"] }, { "id": "stable-audio-community", "display_name": "Stable Audio 3 Small-SFX — Stability AI Community License", "summary": "Sound-effects / foley generation model. Free for research and non-commercial use; commercial use only under Stability AI's Community License revenue threshold. Attribution required. 
LTX Desktop installs this model from an ungated mirror, so no Hugging Face login is needed; the license is published at huggingface.co/stabilityai/stable-audio-3-small-sfx.", "full_text_path": null, "applies_to": ["stable-audio-sfx"] }, { "id": "gemma-terms", "display_name": "T5Gemma (Stable Audio text encoder) — Google Gemma Terms of Use", "summary": "Stable Audio Small-SFX bundles Google's T5Gemma (t5gemma-b-b-ul2) for text conditioning, redistributed under the Gemma Terms of Use (Section 3.2 use restrictions apply). Installed from LTX Desktop's ungated mirror with no Hugging Face login; the terms are linked from huggingface.co/google/t5gemma-b-b-ul2.", "full_text_path": null, "applies_to": ["stable-audio-sfx"] }, { "id": "mmaudio-noncommercial", "display_name": "MMAudio V2A — MIT code, non-commercial weights", "summary": "Video-to-audio foley model (Sony AI / UIUC, CVPR 2025). Code is MIT. Pretrained weights were trained on AudioSet / VGGSound / Freesound / AudioCaps / WavCaps — the authors do NOT guarantee commercial-use suitability; use at your own risk. Source: github.com/SonyResearch/MMAudio", "full_text_path": null, "applies_to": ["mmaudio-foley"] }, { "id": "bundled-git-gpl2", "display_name": "MinGit (Git for Windows) — GPL-2.0", "summary": "Portable Git binary bundled with LTX Desktop so component setup scripts (e.g. cocktail-fork, ace-step) can clone source repositories without the user installing Git for Windows separately. Distributed unmodified under GPL-2.0. Source: https://github.com/git-for-windows/git", "full_text_path": null, "applies_to": [] }, { "id": "bundled-git-lfs-mit", "display_name": "Git LFS — MIT License", "summary": "Git Large File Storage extension bundled alongside MinGit for components that ship pretrained checkpoints via LFS (e.g. cocktail-fork MRX checkpoints). Distributed unmodified under MIT. 
Source: https://github.com/git-lfs/git-lfs", "full_text_path": null, "applies_to": [] }, { "id": "ltx-desktop-eula", "display_name": "LTX Desktop End-User License", "summary": "The LTX Desktop application itself.", "full_text_path": null, "applies_to": [] } ] }, "components": [ { "id": "fish-audio-s2-pro", "display_name": "Fish Audio S2-Pro (TTS)", "required": false, "default_install": true, "license_refs": ["fish-audio-research"], "source": { "type": "hf-mirror", "repo": "FatalErrorVXD/ltx-desktop-assets", "subpath": "fish-audio/s2-pro/" }, "approx_bytes": 11000000000, "install_dir_env": "FISH_MODEL_DIR", "setup_script": "fish_audio_setup.py", "uploaded_at": "2026-05-23" }, { "id": "qwen-image-edit-2511-4bit", "display_name": "Qwen-Image-Edit-2511 4-bit (image editing)", "required": false, "default_install": true, "license_refs": ["qwen-image-edit-cc-by-nc-sa"], "source": { "type": "hf-mirror", "repo": "FatalErrorVXD/ltx-desktop-assets", "subpath": "qwen-edit/model/" }, "approx_bytes": 15000000000, "install_dir_env": "QWEN_MODEL_DIR", "setup_script": "qwen_edit_setup.py", "uploaded_at": "2026-05-23" }, { "id": "ace-step", "display_name": "ACE-Step (music generation)", "required": false, "default_install": true, "license_refs": [], "source": { "type": "upstream-hf", "repo": "ACE-Step/Ace-Step1.5", "revision": "TODO-pin-sha" }, "approx_bytes": 23000000000, "install_dir_env": "ACE_MODEL_DIR", "setup_script": "ace_step_setup.py", "_status": "upstream-pin-pending" }, { "id": "whisper-cpp-large-v3", "display_name": "Whisper.cpp large-v3 (transcription)", "required": false, "default_install": true, "license_refs": [], "source": { "type": "upstream-hf", "repo": "ggerganov/whisper.cpp", "file": "ggml-large-v3.bin" }, "approx_bytes": 3094623552, "install_dir_env": "WHISPER_MODEL_DIR", "setup_script": "whisper_setup.py" }, { "id": "cocktail-fork-mrx", "display_name": "Cocktail-Fork MRX (audio demixer)", "required": false, "default_install": true, "license_refs": 
["cocktail-fork-mit"], "source": { "type": "upstream-git", "repo": "https://github.com/merlresearch/cocktail-fork-separation", "revision": "19b3de827ebc4bfb014570cf92dd32b4ee3b6921" }, "approx_bytes": 466000000, "install_dir_env": "COCKTAIL_FORK_DIR", "setup_script": "cocktail_fork_setup.py" }, { "id": "stable-audio-sfx", "display_name": "Stable Audio Small-SFX (foley / SFX synth)", "author": "Stability AI", "canonical_source": "https://github.com/Stability-AI/stable-audio-3", "required": false, "default_install": true, "license_refs": ["stable-audio-community", "gemma-terms"], "license_note": "UNGATED via mirror. The setup clones stable-audio-3, uv-syncs a Python 3.10 venv, redirects the model repo-id to the ungated LTX mirror FatalErrorVXD/stable-audio-3-small-sfx (which bundles the T5Gemma text encoder; SAME-S piggybacks on the checkpoint), and pulls ~3.3 GB with NO Hugging Face login or license acceptance required. The Stability Community + Gemma terms are still surfaced on this consent screen (required by redistribution). CPU-resident (no GPU). Powers the generate_sfx MCP tool.", "source": { "type": "upstream-git", "repo": "https://github.com/Stability-AI/stable-audio-3" }, "approx_bytes": 3500000000, "install_dir_env": "SA_REPO_DIR", "setup_script": "stable_audio_setup.py" }, { "id": "mmaudio-foley", "display_name": "MMAudio V2A (auto-synced foley)", "author": "Sony AI / UIUC", "canonical_source": "https://github.com/SonyResearch/MMAudio", "required": false, "default_install": false, "license_refs": ["mmaudio-noncommercial"], "license_note": "Ungated. The setup clones MMAudio, makes a Python 3.11 venv with CUDA torch, pins huggingface_hub==0.26.5 (BigVGAN compat), and pulls the large_44k_v2 weights (~4.1 GB). GPU ~6 GB at runtime. 
Powers the generate_foley MCP tool.", "source": { "type": "upstream-git", "repo": "https://github.com/SonyResearch/MMAudio" }, "approx_bytes": 7000000000, "install_dir_env": "MM_REPO_DIR", "setup_script": "mmaudio_setup.py" }, { "id": "qwen3-vl-qc-llamacpp", "display_name": "Qwen3.6-VL Visual QC (in-process)", "required": false, "default_install": true, "license_refs": [], "source": { "type": "hf-direct", "repo": "HauhauCS/Qwen3.6-27B-Uncensored-HauhauCS-Balanced", "revision": "9a28c2fbd15f21fb8ed204074c6f58d5bc889941", "files": [ "Qwen3.6-27B-Uncensored-HauhauCS-Balanced-IQ4_XS.gguf", "mmproj-Qwen3.6-27B-Uncensored-HauhauCS-Balanced-f16.gguf" ], "_note": "v0.16.0+: in-process via llama-cpp-python (JamePeng cu128 wheel). Replaces the v0.15.x Ollama path so installs leave no third-party software, no system-tray icon, and no Apps & Features entry. Same uncensored Qwen3.6-27B-VL IQ4_XS model — just pulled direct from HauhauCS on HF instead of via Ollama." }, "approx_bytes": 16000000000, "install_dir_env": "QWEN_VL_ROOT", "setup_script": "qwen_vl_qc_setup.py" }, { "id": "loras-ltx-crisp-enhance", "display_name": "LTX 2.3 Crisp Enhance (stacked LoRA)", "author": "vrgamedevgirl", "canonical_source": "https://civitai.com/models/2535622/ltx-23-enhancers?modelVersionId=2849716", "required": false, "default_install": true, "license_refs": [], "license_note": "Inherits creator-set permissions on the CivitAI page above. 
Mirrored here for non-commercial use within LTX Desktop.", "source": { "type": "hf-mirror", "repo": "FatalErrorVXD/ltx-desktop-assets", "subpath": "loras/ltx/LTX2.3_Crisp_Enhance.safetensors" }, "approx_bytes": 705198392, "recommended_strength": 0.9, "install_dir_env": "LORA_DIR", "setup_script": null, "uploaded_at": "2026-05-23" }, { "id": "loras-ltx-anime90s", "display_name": "Retro 90s Anime Style LoRA LTX-2.3 v2.1 (stacked LoRA)", "author": "tazmannner379", "canonical_source": "https://civitai.com/models/2557755/retro-90s-anime-style-lora-ltx-23", "required": false, "default_install": false, "license_refs": [], "license_note": "Inherits creator-set permissions on the CivitAI page above. Trigger words include show-specific tokens (SHW_AKIRA, SHW_CWBY, etc.) that reference copyrighted IP — use with care for commercial-adjacent outputs.", "source": { "type": "hf-mirror", "repo": "FatalErrorVXD/ltx-desktop-assets", "subpath": "loras/ltx/anime90s-step00053000.comfy.safetensors" }, "approx_bytes": 705198960, "trigger_words": ["ANIMSTY"], "recommended_strength_range": [0.8, 1.0], "install_dir_env": "LORA_DIR", "setup_script": null, "uploaded_at": "2026-05-23" } ], "_notes": [ "Components handled entirely by the existing LTX Desktop installer (LTX-2.3 family, Z-Image-Turbo, Gemma-3 text encoder, DPT/YOLOX/DW-Pose) are NOT listed here — they're outside this manifest's scope.", "approx_bytes is used for the progress UI and the disk-space precheck. Real sizes are set at upload time.", "Each component's setup_script is the existing per-component installer in ltx-desktop-mcp/. The manifest only changes where it pulls from (this mirror vs. upstream) and inserts a license-consent step before any component whose license_refs is non-empty." ] }