diff --git a/demo/list_voices.py b/demo/list_voices.py
new file mode 100755
index 0000000..25e058b
--- /dev/null
+++ b/demo/list_voices.py
@@ -0,0 +1,276 @@
+#!/usr/bin/env python3
+"""
+VibeVoice Voice Listing Utility
+
+This script lists all available voice presets for VibeVoice models,
+including metadata like language and gender parsed from filenames.
+
+Usage:
+    python demo/list_voices.py [--format {table|json|simple}] [--lang LANG] [--voices-dir VOICES_DIR] [--stats]
+
+Examples:
+    # List all voices in table format (default)
+    python demo/list_voices.py
+
+    # List only English voices
+    python demo/list_voices.py --lang en
+
+    # Output as JSON for programmatic use
+    python demo/list_voices.py --format json
+
+    # Simple list of voice names only
+    python demo/list_voices.py --format simple
+"""
+
+import argparse
+import json
+import os
+from pathlib import Path
+from typing import Dict, List, Optional
+
+
+class VoiceInfo:
+    """Metadata for one voice preset, parsed from ``{lang}-{Speaker}_{gender}``."""
+
+    # Display names for the language codes used in preset filenames.
+    _LANGUAGE_NAMES = {
+        'en': 'English',
+        'de': 'German',
+        'fr': 'French',
+        'it': 'Italian',
+        'jp': 'Japanese',
+        'kr': 'Korean',
+        'nl': 'Dutch',
+        'pl': 'Polish',
+        'pt': 'Portuguese',
+        'sp': 'Spanish',
+        'in': 'International',
+    }
+
+    def __init__(self, filename: str, path: Path):
+        """Parse *filename* (given without extension) and record the size of *path*."""
+        self.filename = filename
+        self.path = path
+        self.name = filename  # Full name without extension
+
+        # Examples: en-Carter_man, de-Spk0_woman. Empty parts become 'unknown'.
+        lang, dash, speaker_part = filename.partition('-')
+        if dash:
+            self.language = lang or 'unknown'
+            # The gender is whatever follows the last underscore.
+            speaker, underscore, gender = speaker_part.rpartition('_')
+            if underscore:
+                self.speaker_name = speaker
+                self.gender = gender or 'unknown'
+            else:
+                self.speaker_name = speaker_part
+                self.gender = 'unknown'
+        else:
+            # Fallback for non-standard naming
+            self.language = 'unknown'
+            self.speaker_name = filename
+            self.gender = 'unknown'
+
+        # Size is best-effort: a missing or unreadable file is reported as 0 MB.
+        try:
+            self.size_mb = self.path.stat().st_size / (1024 * 1024)
+        except (OSError, ValueError):
+            self.size_mb = 0.0
+
+    def to_dict(self) -> Dict:
+        """Return the fields as a JSON-serializable dict (size rounded to 2 places)."""
+        return {
+            'name': self.name,
+            'language': self.language,
+            'speaker': self.speaker_name,
+            'gender': self.gender,
+            'size_mb': round(self.size_mb, 2),
+            'path': str(self.path),
+        }
+
+    @staticmethod
+    def get_language_name(code: str) -> str:
+        """Return the display name for *code* (case-insensitive), else the code upper-cased."""
+        return VoiceInfo._LANGUAGE_NAMES.get(code.lower(), code.upper())
+
+
+class VoiceManager:
+    """Discovers voice presets in a directory and lists or summarizes them.
+
+    Every ``*.pt`` file directly inside ``voices_dir`` becomes one ``VoiceInfo``.
+    """
+
+    def __init__(self, voices_dir: Optional[Path] = None):
+        """Load presets from *voices_dir* (default: ``voices/streaming_model`` beside this file)."""
+        if voices_dir is None:
+            # Default to demo/voices/streaming_model
+            voices_dir = Path(__file__).parent / "voices" / "streaming_model"
+
+        self.voices_dir = Path(voices_dir)
+        self.voices: List[VoiceInfo] = []
+        self._load_voices()
+
+    def _load_voices(self):
+        """Append a ``VoiceInfo`` to ``self.voices`` for each ``*.pt`` file, in sorted order."""
+        if not self.voices_dir.is_dir():
+            import sys  # local import: only this diagnostic needs it
+            # stderr keeps stdout clean for the json/simple output formats.
+            print(f"Warning: Voices directory not found at {self.voices_dir}", file=sys.stderr)
+            return
+
+        for pt_file in sorted(self.voices_dir.glob("*.pt")):
+            self.voices.append(VoiceInfo(pt_file.stem, pt_file))
+
+    def filter_by_language(self, lang_code: str) -> List[VoiceInfo]:
+        """Return the voices whose language code equals *lang_code*, ignoring case."""
+        wanted = lang_code.lower()
+        return [v for v in self.voices if v.language.lower() == wanted]
+
+    def get_by_name(self, name: str) -> Optional[VoiceInfo]:
+        """Return the first voice whose full or speaker name equals *name*, else None."""
+        for candidate in self.voices:
+            if name in (candidate.name, candidate.speaker_name):
+                return candidate
+        return None
+
+    def print_table(self, voices: Optional[List[VoiceInfo]] = None):
+        """Print *voices* (default: every loaded voice) as an aligned table."""
+        if voices is None:
+            voices = self.voices
+
+        if not voices:
+            print("No voices found.")
+            return
+
+        # Resolve display names once; they drive both the column width and the rows.
+        lang_names = [VoiceInfo.get_language_name(v.language) for v in voices]
+
+        # Widest cell plus 2 of padding, with a floor so short tables stay readable.
+        name_width = max(20, max(len(v.name) for v in voices) + 2)
+        speaker_width = max(15, max(len(v.speaker_name) for v in voices) + 2)
+        lang_width = max(12, max(len(n) for n in lang_names) + 2)
+
+        # Print header
+        print(f"\n{'Name':<{name_width}} {'Speaker':<{speaker_width}} {'Language':<{lang_width}} {'Gender':<8} {'Size (MB)':<10}")
+        print("=" * (name_width + speaker_width + lang_width + 28))
+
+        for voice, lang_name in zip(voices, lang_names):
+            print(f"{voice.name:<{name_width}} {voice.speaker_name:<{speaker_width}} {lang_name:<{lang_width}} {voice.gender:<8} {voice.size_mb:>8.2f}")
+
+        print(f"\nTotal: {len(voices)} voice(s)")
+
+    def print_simple(self, voices: Optional[List[VoiceInfo]] = None):
+        """Print one voice name per line (default: every loaded voice)."""
+        if voices is None:
+            voices = self.voices
+
+        for voice in voices:
+            print(voice.name)
+
+    def to_json(self, voices: Optional[List[VoiceInfo]] = None) -> str:
+        """Return *voices* (default: every loaded voice) as an indented JSON document."""
+        if voices is None:
+            voices = self.voices
+
+        data = {
+            'total': len(voices),
+            'voices_directory': str(self.voices_dir),
+            'voices': [v.to_dict() for v in voices]
+        }
+        return json.dumps(data, indent=2)
+
+    def get_statistics(self, voices: Optional[List[VoiceInfo]] = None) -> Dict:
+        """Count voices per language code and per gender.
+
+        Args:
+            voices: Voices to summarize; defaults to every loaded voice, like
+                the other listing methods, so a filtered list can be passed.
+
+        Returns:
+            A dict with ``total``, ``by_language`` and ``by_gender`` keys; the
+            two ``by_*`` values map each code/gender to its count.
+        """
+        if voices is None:
+            voices = self.voices
+
+        by_lang: Dict[str, int] = {}
+        by_gender: Dict[str, int] = {}
+        # One pass fills both tallies; an empty list simply leaves them empty.
+        for voice in voices:
+            by_lang[voice.language] = by_lang.get(voice.language, 0) + 1
+            by_gender[voice.gender] = by_gender.get(voice.gender, 0) + 1
+
+        return {
+            'total': len(voices),
+            'by_language': by_lang,
+            'by_gender': by_gender,
+        }
+
+
+def main():
+    """Parse the command line and print the voice listing or the ``--stats`` summary."""
+    import sys  # local import: only the "no match" diagnostic needs it
+
+    parser = argparse.ArgumentParser(
+        description="List available VibeVoice voice presets",
+        formatter_class=argparse.RawDescriptionHelpFormatter,
+        epilog=__doc__
+    )
+    parser.add_argument(
+        '--format',
+        choices=['table', 'json', 'simple'],
+        default='table',
+        help='Output format (default: table)'
+    )
+    parser.add_argument('--lang', type=str, help='Filter by language code (e.g., en, de, fr)')
+    parser.add_argument(
+        '--voices-dir',
+        type=Path,
+        help='Path to voices directory (default: demo/voices/streaming_model)'
+    )
+    parser.add_argument(
+        '--stats',
+        action='store_true',
+        help='Show statistics about available voices'
+    )
+    args = parser.parse_args()
+
+    manager = VoiceManager(voices_dir=args.voices_dir)
+
+    # Filter by language if specified
+    voices = manager.voices
+    if args.lang:
+        voices = manager.filter_by_language(args.lang)
+        if not voices:
+            # Diagnostics go to stderr so json/simple output stays parseable.
+            print(f"No voices found for language: {args.lang}", file=sys.stderr)
+            return
+
+    if args.stats:
+        # get_statistics() summarizes manager.voices, so narrow that list to
+        # the filtered voices; otherwise --stats would ignore --lang.
+        manager.voices = voices
+        stats = manager.get_statistics()
+        print("\n=== Voice Statistics ===")
+        print(f"Total voices: {stats['total']}")
+        print("\nBy Language:")
+        for lang, count in sorted(stats['by_language'].items()):
+            lang_name = VoiceInfo.get_language_name(lang)
+            print(f"  {lang_name} ({lang}): {count}")
+        print("\nBy Gender:")
+        for gender, count in sorted(stats['by_gender'].items()):
+            print(f"  {gender.capitalize()}: {count}")
+        print()
+        return
+
+    # Display in requested format
+    if args.format == 'table':
+        manager.print_table(voices)
+    elif args.format == 'json':
+        print(manager.to_json(voices))
+    elif args.format == 'simple':
+        manager.print_simple(voices)
+
+
+if __name__ == '__main__':  # run the CLI only when executed as a script, not on import
+    main()
diff --git a/demo/vibevoice_realtime_colab.ipynb b/demo/vibevoice_realtime_colab.ipynb
index 2f61407..bdacd8c 100644
--- a/demo/vibevoice_realtime_colab.ipynb
+++ b/demo/vibevoice_realtime_colab.ipynb
@@ -2,13 +2,12 @@
   "cells": [
     {
       "cell_type": "markdown",
-      "id": "d1785adb",
       "metadata": {
-        "colab_type": "text",
-        "id": "view-in-github"
+        "id": "view-in-github",
+        "colab_type": "text"
       },
       "source": [
-        "<a href=\"https://colab.research.google.com/github/microsoft/VibeVoice/blob/main/demo/vibevoice_realtime_colab.ipynb\" target=\"_parent\"><img src=\"https://colab.research.google.com/assets/colab-badge.svg\" alt=\"Open In Colab\"/></a>"
+        "<a href=\"https://colab.research.google.com/github/Finish-Him/VibeVoice/blob/main/demo/vibevoice_realtime_colab.ipynb\" target=\"_parent\"><img src=\"https://colab.research.google.com/assets/colab-badge.svg\" alt=\"Open In Colab\"/></a>"
       ]
     },
     {
@@ -34,12 +33,211 @@
     },
     {
       "cell_type": "code",
-      "execution_count": null,
+      "execution_count": 1,
       "id": "4wxJ6QHM-ZOb",
       "metadata": {
-        "id": "4wxJ6QHM-ZOb"
+        "id": "4wxJ6QHM-ZOb",
+        "outputId": "a9f42189-191e-484a-8cfb-5a272fce5b3e",
+        "colab": {
+          "base_uri": "https://localhost:8080/",
+          "height": 310,
+          "referenced_widgets": [
+            "6aa0514fe8e74f87a8d25e2a3ec7b249",
+            "2e77995f5e9b4c9d93a1e50482e63464",
+            "5bddb298cd604fbba0776657ef807664",
+            "398d6a88664b44c89b06610a1b5eb33e",
+            "23e9f1b01aa6454bb8f63b74aaa333f5",
+            "411a5e8e282b4257b561655c637836ab",
+            "a85f891d3eb946fa94af2eff7024bc76",
+            "f112df2ccc7b4861a27f5336d38ac86f",
+            "24d904f0c7f94a749af6d440b475bdeb",
+            "5e994c7530c64e8ab571751a12684217",
+            "52eb275fb2ef41e1ba008baef9378dfe",
+            "0d8d3ac2411048a7b846835d60e4f23d",
+            "bc3d23550b01450e94574975277bf5a2",
+            "0df051569bd540b7a19e3aefdc69f7cd",
+            "b4351182f3b7462cbf915b26863cf4de",
+            "dae8d2fe62bd41ea9d99c9ccc817de46",
+            "e35dd504906745b28846c07a644c3423",
+            "8171a7d8dcb9432881aa56fb52743e3d",
+            "2058d4fb6b1745a2a971491fcc747244",
+            "c3311a8331244551843472284c58f60f",
+            "ddd6507456c9496db1525c87994c5e4a",
+            "be663377d2864ba3a4c6832ed9d77a3d",
+            "06dd326664c2487f8195c15c56326273",
+            "45b8402a7ce240c5b3e84520af47e6e3",
+            "f6374d57d06f4234ba5b29acbbec7c8d",
+            "cde3a6c088e545cf94e2ccc73655eff2",
+            "60723c32638d47dd81281d31ddc5eb66",
+            "b79622d7dc0e46e28ebd17d730bfe91d",
+            "027f223a86a249dd88b1010dc85f679f",
+            "7bf175a6594a4417899953186dfa8a97",
+            "620f2c3ccaac4028bd2668a12dc57749",
+            "1186b85637f2496ba1366ab4d2d2a11d",
+            "6e0d9876d9f94fca889a959b09319474",
+            "422ea9b78c584d1ca555728cd01e861b",
+            "063ce9a58fc748e7929ed70a72c1b287",
+            "75ebd541b72941b3935a96da96615293",
+            "7c6ad8b88a7c49ca980f14bb03fd1463",
+            "eb94263072dc4ab78a2f125840a5dda5",
+            "81ae6a64fbee460ab6c15b5cc0448474",
+            "3607d7c97912499191b8b632f29bc31d",
+            "9006110b3b8043dfbe85d1c485242834",
+            "4ca65f86d3a344eeb43f1e10ce2bade7",
+            "8fee63d65695482f9c68294816a98a6b",
+            "73e3840872fe4245aa88c315fe266214",
+            "f133d8b35d8f461d9e3b0c099d56dc98",
+            "c6c3ec7e97554e3f930cdcab2e3002fa",
+            "73a5e9fc2808494485db6768fdb6ac6e",
+            "d30457cbc6fa4a54902bc92640af82ce",
+            "a9c4e87ff31e458187e09e93b23bcaed",
+            "0af92bfff186463ab480139f415b3f45",
+            "2974cc410d6e40d89cdb0a600943d70e",
+            "f48cf6761d6d493cb76c0030249baa11",
+            "3ea8f4b8b4e54b99a48d410fe9659f96",
+            "4a7829162a704c62b40823c359c5c86e",
+            "c23a9a4b3ab044d6af40f293d7249733",
+            "50ac88eac535450a8f249f52092d2406",
+            "9ab10fe6f69d40de8a90d924288611bd",
+            "94a9a23ebefa45ad9604bcf353844337",
+            "e687b3ff73cb4b42964d46ade98a2b65",
+            "c705ff6baaf5438b93dbc4107b1c4305",
+            "306e3356465c4898a5f2b5ccb29aaa7c",
+            "9ec13363e1f046368343d27f41b08f19",
+            "1350cc445a004aff895cab877697cc3c",
+            "48bc89fef2724841b2f182cc6eed35e0",
+            "68ffa713da0a4b01b2c42e0c8a27835e",
+            "a8e4a36558e04810b203b32cdd298ffb",
+            "5b08b3a3aa6b4c0fb19167850be8453d",
+            "884ec6a31fdf410e92c5ea89c0e1419b",
+            "3e99d2ab170c45fe844cb81fed3ee1d7",
+            "4e2e16fb3c5e41429a3660f65c488d8f",
+            "058a4595e6c042bfa0df510046f1109d",
+            "5c2b36b95d60431a8bbf553e408f4f51",
+            "a695abbe11304923bb22390b6b8d7af2",
+            "47885c9ca7c943d18b0f6529ca6a8238",
+            "772eb2290aef43e4947878efd7794ce7",
+            "53f6ef4e80384e8aa06628a35c354e8f",
+            "83077e8e24ef484ab79eb4eefd441c80"
+          ]
+        }
       },
-      "outputs": [],
+      "outputs": [
+        {
+          "output_type": "stream",
+          "name": "stdout",
+          "text": [
+            "✅ T4 GPU detected\n",
+            "✅ Cloned VibeVoice repository\n",
+            "✅ Installed dependencies\n"
+          ]
+        },
+        {
+          "output_type": "display_data",
+          "data": {
+            "text/plain": [
+              "Fetching 6 files:   0%|          | 0/6 [00:00<?, ?it/s]"
+            ],
+            "application/vnd.jupyter.widget-view+json": {
+              "version_major": 2,
+              "version_minor": 0,
+              "model_id": "6aa0514fe8e74f87a8d25e2a3ec7b249"
+            }
+          },
+          "metadata": {}
+        },
+        {
+          "output_type": "display_data",
+          "data": {
+            "text/plain": [
+              "figures/Fig1.png:   0%|          | 0.00/124k [00:00<?, ?B/s]"
+            ],
+            "application/vnd.jupyter.widget-view+json": {
+              "version_major": 2,
+              "version_minor": 0,
+              "model_id": "0d8d3ac2411048a7b846835d60e4f23d"
+            }
+          },
+          "metadata": {}
+        },
+        {
+          "output_type": "display_data",
+          "data": {
+            "text/plain": [
+              "model.safetensors:   0%|          | 0.00/2.04G [00:00<?, ?B/s]"
+            ],
+            "application/vnd.jupyter.widget-view+json": {
+              "version_major": 2,
+              "version_minor": 0,
+              "model_id": "06dd326664c2487f8195c15c56326273"
+            }
+          },
+          "metadata": {}
+        },
+        {
+          "output_type": "display_data",
+          "data": {
+            "text/plain": [
+              "config.json: 0.00B [00:00, ?B/s]"
+            ],
+            "application/vnd.jupyter.widget-view+json": {
+              "version_major": 2,
+              "version_minor": 0,
+              "model_id": "422ea9b78c584d1ca555728cd01e861b"
+            }
+          },
+          "metadata": {}
+        },
+        {
+          "output_type": "display_data",
+          "data": {
+            "text/plain": [
+              ".gitattributes: 0.00B [00:00, ?B/s]"
+            ],
+            "application/vnd.jupyter.widget-view+json": {
+              "version_major": 2,
+              "version_minor": 0,
+              "model_id": "f133d8b35d8f461d9e3b0c099d56dc98"
+            }
+          },
+          "metadata": {}
+        },
+        {
+          "output_type": "display_data",
+          "data": {
+            "text/plain": [
+              "preprocessor_config.json:   0%|          | 0.00/360 [00:00<?, ?B/s]"
+            ],
+            "application/vnd.jupyter.widget-view+json": {
+              "version_major": 2,
+              "version_minor": 0,
+              "model_id": "50ac88eac535450a8f249f52092d2406"
+            }
+          },
+          "metadata": {}
+        },
+        {
+          "output_type": "display_data",
+          "data": {
+            "text/plain": [
+              "README.md: 0.00B [00:00, ?B/s]"
+            ],
+            "application/vnd.jupyter.widget-view+json": {
+              "version_major": 2,
+              "version_minor": 0,
+              "model_id": "5b08b3a3aa6b4c0fb19167850be8453d"
+            }
+          },
+          "metadata": {}
+        },
+        {
+          "output_type": "stream",
+          "name": "stdout",
+          "text": [
+            "✅ Downloaded model: microsoft/VibeVoice-Realtime-0.5B\n"
+          ]
+        }
+      ],
       "source": [
         "# Check for T4 GPU\n",
         "import torch\n",
@@ -79,17 +277,63 @@
     {
       "cell_type": "markdown",
       "id": "88c727ab",
-      "metadata": {},
+      "metadata": {
+        "id": "88c727ab"
+      },
       "source": [
         "[Optional] If the download exceeds 1 minute, it is probably stuck. You can: (1) interrupt the execution, (2) log in to Hugging Face, and (3) try download again."
       ]
     },
     {
       "cell_type": "code",
-      "execution_count": null,
+      "execution_count": 2,
       "id": "dec6b870",
-      "metadata": {},
-      "outputs": [],
+      "metadata": {
+        "id": "dec6b870",
+        "outputId": "cdfbd4ed-b5fa-43cb-d839-c801bc04909b",
+        "colab": {
+          "base_uri": "https://localhost:8080/",
+          "height": 17,
+          "referenced_widgets": [
+            "9c57910a71314b5ab996439e5130adfe",
+            "caf8f6f8920d4f01aa2af4f9e6fcb3dc",
+            "afaace7433ee4538844cd73480589dda",
+            "70fadafd4db04a0783e329362ba8b87c",
+            "dfcc460d6f424736be2fb25530b09185",
+            "c004c599ecc943e18ee873d55ee630ea",
+            "8f96189e4dd146679c62ae79e1ecc4b1",
+            "687266971acc4ab1b03813bc8a3b8e76",
+            "4bde1aea8d194644b4e9021f09503800",
+            "fa49258b8fe3441a82c22e9b60a955df",
+            "40db57ec16eb4e4ba4cd506abaf4069b",
+            "b17a44ac600746f6a1825cbb0cc063be",
+            "683c557013424a18a85422835b75a8e3",
+            "2e5bc5e6f4ef48b0b00424049cec8a09",
+            "b13735cb5c4249a08d8c7cfa654ba106",
+            "161a12ab57aa41638a846a2238bf9642",
+            "0332ed76bfde46c49c9879f36e75f6f3",
+            "2d2751bc81ca4bd5bef927b23a99ee93",
+            "8deb0245c1164c0192ac324a38f32971",
+            "054055b8c233424d82c435f0d453fa56"
+          ]
+        }
+      },
+      "outputs": [
+        {
+          "output_type": "display_data",
+          "data": {
+            "text/plain": [
+              "VBox(children=(HTML(value='<center> <img\\nsrc=https://huggingface.co/front/assets/huggingface_logo-noborder.sv…"
+            ],
+            "application/vnd.jupyter.widget-view+json": {
+              "version_major": 2,
+              "version_minor": 0,
+              "model_id": "9c57910a71314b5ab996439e5130adfe"
+            }
+          },
+          "metadata": {}
+        }
+      ],
       "source": [
         "from huggingface_hub import login\n",
         "login()"
@@ -97,10 +341,52 @@
     },
     {
       "cell_type": "code",
-      "execution_count": null,
+      "execution_count": 3,
       "id": "c579654b",
-      "metadata": {},
-      "outputs": [],
+      "metadata": {
+        "id": "c579654b",
+        "outputId": "2a080db9-d5a2-40d4-bf3a-f8a33e0c5d1f",
+        "colab": {
+          "base_uri": "https://localhost:8080/",
+          "height": 66,
+          "referenced_widgets": [
+            "a6612ce289c246668325ec1c50b01a3e",
+            "c85a7873e70f4345a071cbe453bbe801",
+            "045a67c7b0cf467b8066370dd9e7ffef",
+            "8c84ea605447464f84e6b51f0790461b",
+            "9486fe93c26c4ab18b26c6c06d87c9f0",
+            "405497428efc4015932fc2e76ceb110f",
+            "a8d7ef0c5f18419983e1c3077deb4154",
+            "04a4242afe6c4fb19aed5282d9110df2",
+            "27adab0a48c24c3ba388c7ed0cbc8073",
+            "8987b61805774e3fbc660b1ddf477fff",
+            "9f543c4a97314ebd836f0f8ce3f525cb"
+          ]
+        }
+      },
+      "outputs": [
+        {
+          "output_type": "display_data",
+          "data": {
+            "text/plain": [
+              "Fetching 6 files:   0%|          | 0/6 [00:00<?, ?it/s]"
+            ],
+            "application/vnd.jupyter.widget-view+json": {
+              "version_major": 2,
+              "version_minor": 0,
+              "model_id": "a6612ce289c246668325ec1c50b01a3e"
+            }
+          },
+          "metadata": {}
+        },
+        {
+          "output_type": "stream",
+          "name": "stdout",
+          "text": [
+            "✅ Downloaded model: microsoft/VibeVoice-Realtime-0.5B\n"
+          ]
+        }
+      ],
       "source": [
         "snapshot_download(\"microsoft/VibeVoice-Realtime-0.5B\", local_dir=\"/content/models/VibeVoice-Realtime-0.5B\")\n",
         "print(\"✅ Downloaded model: microsoft/VibeVoice-Realtime-0.5B\")"
@@ -139,9 +425,708 @@
       "execution_count": null,
       "id": "Yc1N9EHswFxA",
       "metadata": {
-        "id": "Yc1N9EHswFxA"
+        "id": "Yc1N9EHswFxA",
+        "outputId": "67fffde3-7670-4787-ee33-0128b6fd3bf8",
+        "colab": {
+          "base_uri": "https://localhost:8080/"
+        }
       },
-      "outputs": [],
+      "outputs": [
+        {
+          "output_type": "stream",
+          "name": "stdout",
+          "text": [
+            "2025-12-15 10:18:26.163671: E external/local_xla/xla/stream_executor/cuda/cuda_fft.cc:467] Unable to register cuFFT factory: Attempting to register factory for plugin cuFFT when one has already been registered\n",
+            "WARNING: All log messages before absl::InitializeLog() is called are written to STDERR\n",
+            "E0000 00:00:1765793906.193886    1910 cuda_dnn.cc:8579] Unable to register cuDNN factory: Attempting to register factory for plugin cuDNN when one has already been registered\n",
+            "E0000 00:00:1765793906.202097    1910 cuda_blas.cc:1407] Unable to register cuBLAS factory: Attempting to register factory for plugin cuBLAS when one has already been registered\n",
+            "W0000 00:00:1765793906.222444    1910 computation_placer.cc:177] computation placer already registered. Please check linkage and avoid linking the same target more than once.\n",
+            "W0000 00:00:1765793906.222475    1910 computation_placer.cc:177] computation placer already registered. Please check linkage and avoid linking the same target more than once.\n",
+            "W0000 00:00:1765793906.222478    1910 computation_placer.cc:177] computation placer already registered. Please check linkage and avoid linking the same target more than once.\n",
+            "W0000 00:00:1765793906.222480    1910 computation_placer.cc:177] computation placer already registered. Please check linkage and avoid linking the same target more than once.\n",
+            "2025-12-15 10:18:26.229465: I tensorflow/core/platform/cpu_feature_guard.cc:210] This TensorFlow binary is optimized to use available CPU instructions in performance-critical operations.\n",
+            "To enable the following instructions: AVX2 AVX512F FMA, in other operations, rebuild TensorFlow with the appropriate compiler flags.\n",
+            "WARNING:vibevoice.modular.modular_vibevoice_tokenizer:APEX FusedRMSNorm not available, using native implementation\n",
+            "INFO:     Started server process [1910]\n",
+            "INFO:     Waiting for application startup.\n",
+            "The tokenizer class you load from this checkpoint is not the same type as the class this function is called from. It may result in unexpected tokenization.\n",
+            "The tokenizer class you load from this checkpoint is 'Qwen2Tokenizer'.\n",
+            "The class this function is called from is 'VibeVoiceTextTokenizerFast'.\n",
+            "INFO:     Application startup complete.\n",
+            "INFO:     Uvicorn running on http://0.0.0.0:8000 (Press CTRL+C to quit)\n",
+            "✅ Public URL: https://labels-thriller-recovered-switched.trycloudflare.com\n",
+            "\n",
+            "[startup] Loading processor from /content/models/VibeVoice-Realtime-0.5B\n",
+            "Using device: cuda, torch_dtype: torch.bfloat16, attn_implementation: flash_attention_2\n",
+            "Error loading the model. Trying to use SDPA. However, note that only flash_attention_2 has been fully tested, and using SDPA may result in lower audio quality.\n",
+            "Load model with SDPA successfully\n",
+            "[startup] Found 25 voice presets\n",
+            "[startup] Using fallback voice preset: de-Spk0_man\n",
+            "[startup] Loading voice preset de-Spk0_man from /content/VibeVoice/demo/voices/streaming_model/de-Spk0_man.pt\n",
+            "[startup] Loading prefilled prompt from /content/VibeVoice/demo/voices/streaming_model/de-Spk0_man.pt\n",
+            "[startup] Model ready.\n",
+            "INFO:     2804:b14:8104:2d70:7cd6:a747:afdf:1b51:0 - \"GET / HTTP/1.1\" 200 OK\n",
+            "INFO:     2804:b14:8104:2d70:7cd6:a747:afdf:1b51:0 - \"GET /config HTTP/1.1\" 200 OK\n",
+            "INFO:     2804:b14:8104:2d70:7cd6:a747:afdf:1b51:0 - \"GET /favicon.ico HTTP/1.1\" 404 Not Found\n",
+            "INFO:     2804:b14:8104:2d70:5108:55d0:5e0a:75b4:0 - \"GET / HTTP/1.1\" 200 OK\n",
+            "INFO:     2804:b14:8104:2d70:5108:55d0:5e0a:75b4:0 - \"GET /config HTTP/1.1\" 200 OK\n",
+            "INFO:     2804:b14:8104:2d70:5108:55d0:5e0a:75b4:0 - \"GET /favicon.ico HTTP/1.1\" 404 Not Found\n",
+            "INFO:     2804:b14:8104:2d70:5108:55d0:5e0a:75b4:0 - \"WebSocket /stream?text=Enter+your+text+here+and+click+%22Start%22+to+instantly+hear+the+VibeVoice-Realtime+TTS+output+audio.&cfg=1.500&steps=5&voice=de-Spk0_man\" [accepted]\n",
+            "INFO:     connection open\n",
+            "Client connected, text='Enter your text here and click \"Start\" to instantly hear the VibeVoice-Realtime TTS output audio.'\n",
+            "\n",
+            "Prefilled 510 tokens, current step (510 / 8192):   6%|▌         | 510/8192 [00:00<?, ?it/s]\n",
+            "Prefilled 5 text tokens, generated 0 speech tokens, current step (515 / 8192):   6%|▋         | 515/8192 [00:00<00:00, 17549.39it/s]\n",
+            "Prefilled 5 text tokens, generated 0 speech tokens, current step (515 / 8192):   6%|▋         | 516/8192 [00:01<21:48,  5.87it/s]\n",
+            "Prefilled 5 text tokens, generated 1 speech tokens, current step (516 / 8192):   6%|▋         | 516/8192 [00:01<21:48,  5.87it/s]\n",
+            "Prefilled 5 text tokens, generated 1 speech tokens, current step (516 / 8192):   6%|▋         | 517/8192 [00:01<22:13,  5.76it/s]\n",
+            "Prefilled 5 text tokens, generated 2 speech tokens, current step (517 / 8192):   6%|▋         | 517/8192 [00:01<22:13,  5.76it/s]\n",
+            "Prefilled 5 text tokens, generated 2 speech tokens, current step (517 / 8192):   6%|▋         | 518/8192 [00:01<21:17,  6.01it/s]\n",
+            "Prefilled 5 text tokens, generated 3 speech tokens, current step (518 / 8192):   6%|▋         | 518/8192 [00:01<21:17,  6.01it/s]\n",
+            "Prefilled 5 text tokens, generated 3 speech tokens, current step (518 / 8192):   6%|▋         | 519/8192 [00:01<19:58,  6.40it/s]\n",
+            "Prefilled 5 text tokens, generated 4 speech tokens, current step (519 / 8192):   6%|▋         | 519/8192 [00:01<19:58,  6.40it/s]\n",
+            "Prefilled 5 text tokens, generated 4 speech tokens, current step (519 / 8192):   6%|▋         | 520/8192 [00:01<19:09,  6.68it/s]\n",
+            "Prefilled 5 text tokens, generated 5 speech tokens, current step (520 / 8192):   6%|▋         | 520/8192 [00:01<19:09,  6.68it/s]\n",
+            "Prefilled 5 text tokens, generated 5 speech tokens, current step (520 / 8192):   6%|▋         | 521/8192 [00:01<17:46,  7.19it/s]\n",
+            "Prefilled 5 text tokens, generated 6 speech tokens, current step (521 / 8192):   6%|▋         | 521/8192 [00:01<17:46,  7.19it/s]\n",
+            "Prefilled 10 text tokens, generated 6 speech tokens, current step (526 / 8192):   6%|▋         | 526/8192 [00:01<17:45,  7.19it/s]\n",
+            "Prefilled 10 text tokens, generated 6 speech tokens, current step (526 / 8192):   6%|▋         | 527/8192 [00:01<07:35, 16.81it/s]\n",
+            "Prefilled 10 text tokens, generated 7 speech tokens, current step (527 / 8192):   6%|▋         | 527/8192 [00:01<07:35, 16.81it/s]\n",
+            "Prefilled 10 text tokens, generated 8 speech tokens, current step (528 / 8192):   6%|▋         | 528/8192 [00:01<07:35, 16.81it/s]\n",
+            "Prefilled 10 text tokens, generated 8 speech tokens, current step (528 / 8192):   6%|▋         | 529/8192 [00:02<09:05, 14.04it/s]\n",
+            "Prefilled 10 text tokens, generated 9 speech tokens, current step (529 / 8192):   6%|▋         | 529/8192 [00:02<09:05, 14.04it/s]\n",
+            "Prefilled 10 text tokens, generated 10 speech tokens, current step (530 / 8192):   6%|▋         | 530/8192 [00:02<09:05, 14.04it/s]\n",
+            "Prefilled 10 text tokens, generated 10 speech tokens, current step (530 / 8192):   6%|▋         | 531/8192 [00:02<10:05, 12.64it/s]\n",
+            "Prefilled 10 text tokens, generated 11 speech tokens, current step (531 / 8192):   6%|▋         | 531/8192 [00:02<10:05, 12.64it/s]\n",
+            "Prefilled 10 text tokens, generated 12 speech tokens, current step (532 / 8192):   6%|▋         | 532/8192 [00:02<10:05, 12.64it/s]\n",
+            "Prefilled 10 text tokens, generated 12 speech tokens, current step (532 / 8192):   7%|▋         | 537/8192 [00:02<06:28, 19.70it/s]\n",
+            "Prefilled 15 text tokens, generated 12 speech tokens, current step (537 / 8192):   7%|▋         | 537/8192 [00:02<06:28, 19.70it/s]\n",
+            "Prefilled 15 text tokens, generated 13 speech tokens, current step (538 / 8192):   7%|▋         | 538/8192 [00:02<06:28, 19.70it/s]\n",
+            "Prefilled 15 text tokens, generated 14 speech tokens, current step (539 / 8192):   7%|▋         | 539/8192 [00:02<06:28, 19.70it/s]\n",
+            "Prefilled 15 text tokens, generated 14 speech tokens, current step (539 / 8192):   7%|▋         | 540/8192 [00:02<08:11, 15.56it/s]\n",
+            "Prefilled 15 text tokens, generated 15 speech tokens, current step (540 / 8192):   7%|▋         | 540/8192 [00:02<08:11, 15.56it/s]\n",
+            "Prefilled 15 text tokens, generated 16 speech tokens, current step (541 / 8192):   7%|▋         | 541/8192 [00:02<08:11, 15.56it/s]\n",
+            "Prefilled 15 text tokens, generated 16 speech tokens, current step (541 / 8192):   7%|▋         | 542/8192 [00:02<09:12, 13.86it/s]\n",
+            "Prefilled 15 text tokens, generated 17 speech tokens, current step (542 / 8192):   7%|▋         | 542/8192 [00:02<09:12, 13.86it/s]\n",
+            "Prefilled 15 text tokens, generated 18 speech tokens, current step (543 / 8192):   7%|▋         | 543/8192 [00:03<09:11, 13.86it/s]\n",
+            "Prefilled 15 text tokens, generated 18 speech tokens, current step (543 / 8192):   7%|▋         | 548/8192 [00:03<06:23, 19.95it/s]\n",
+            "Prefilled 20 text tokens, generated 18 speech tokens, current step (548 / 8192):   7%|▋         | 548/8192 [00:03<06:23, 19.95it/s]\n",
+            "Prefilled 20 text tokens, generated 19 speech tokens, current step (549 / 8192):   7%|▋         | 549/8192 [00:03<06:23, 19.95it/s]\n",
+            "Prefilled 20 text tokens, generated 20 speech tokens, current step (550 / 8192):   7%|▋         | 550/8192 [00:03<06:23, 19.95it/s]\n",
+            "Prefilled 20 text tokens, generated 20 speech tokens, current step (550 / 8192):   7%|▋         | 551/8192 [00:03<07:53, 16.13it/s]\n",
+            "Prefilled 20 text tokens, generated 21 speech tokens, current step (551 / 8192):   7%|▋         | 551/8192 [00:03<07:53, 16.13it/s]\n",
+            "Prefilled 20 text tokens, generated 22 speech tokens, current step (552 / 8192):   7%|▋         | 552/8192 [00:03<07:53, 16.13it/s]\n",
+            "Prefilled 20 text tokens, generated 22 speech tokens, current step (552 / 8192):   7%|▋         | 553/8192 [00:03<09:01, 14.11it/s]\n",
+            "Prefilled 20 text tokens, generated 23 speech tokens, current step (553 / 8192):   7%|▋         | 553/8192 [00:03<09:01, 14.11it/s]\n",
+            "Prefilled 20 text tokens, generated 24 speech tokens, current step (554 / 8192):   7%|▋         | 554/8192 [00:03<09:01, 14.11it/s]\n",
+            "Prefilled 20 text tokens, generated 24 speech tokens, current step (554 / 8192):   7%|▋         | 558/8192 [00:03<07:00, 18.17it/s]\n",
+            "Prefilled 24 text tokens, generated 24 speech tokens, current step (558 / 8192):   7%|▋         | 558/8192 [00:03<07:00, 18.17it/s]\n",
+            "Prefilled 24 text tokens, generated 25 speech tokens, current step (559 / 8192):   7%|▋         | 559/8192 [00:03<07:00, 18.17it/s]\n",
+            "Prefilled 24 text tokens, generated 26 speech tokens, current step (560 / 8192):   7%|▋         | 560/8192 [00:03<06:59, 18.17it/s]\n",
+            "Prefilled 24 text tokens, generated 26 speech tokens, current step (560 / 8192):   7%|▋         | 561/8192 [00:04<08:42, 14.60it/s]\n",
+            "Prefilled 24 text tokens, generated 27 speech tokens, current step (561 / 8192):   7%|▋         | 561/8192 [00:04<08:42, 14.60it/s]\n",
+            "Prefilled 24 text tokens, generated 28 speech tokens, current step (562 / 8192):   7%|▋         | 562/8192 [00:04<08:42, 14.60it/s]\n",
+            "Prefilled 24 text tokens, generated 28 speech tokens, current step (562 / 8192):   7%|▋         | 563/8192 [00:04<09:42, 13.10it/s]\n",
+            "Prefilled 24 text tokens, generated 29 speech tokens, current step (563 / 8192):   7%|▋         | 563/8192 [00:04<09:42, 13.10it/s]\n",
+            "Prefilled 24 text tokens, generated 30 speech tokens, current step (564 / 8192):   7%|▋         | 564/8192 [00:04<09:42, 13.10it/s]\n",
+            "Prefilled 24 text tokens, generated 30 speech tokens, current step (564 / 8192):   7%|▋         | 565/8192 [00:04<10:31, 12.08it/s]\n",
+            "Prefilled 24 text tokens, generated 31 speech tokens, current step (565 / 8192):   7%|▋         | 565/8192 [00:04<10:31, 12.08it/s]\n",
+            "Prefilled 24 text tokens, generated 32 speech tokens, current step (566 / 8192):   7%|▋         | 566/8192 [00:04<10:31, 12.08it/s]\n",
+            "Prefilled 24 text tokens, generated 32 speech tokens, current step (566 / 8192):   7%|▋         | 567/8192 [00:04<11:19, 11.22it/s]\n",
+            "Prefilled 24 text tokens, generated 33 speech tokens, current step (567 / 8192):   7%|▋         | 567/8192 [00:04<11:19, 11.22it/s]\n",
+            "Prefilled 24 text tokens, generated 34 speech tokens, current step (568 / 8192):   7%|▋         | 568/8192 [00:04<11:19, 11.22it/s]\n",
+            "Prefilled 24 text tokens, generated 34 speech tokens, current step (568 / 8192):   7%|▋         | 569/8192 [00:04<11:56, 10.64it/s]\n",
+            "Prefilled 24 text tokens, generated 35 speech tokens, current step (569 / 8192):   7%|▋         | 569/8192 [00:04<11:56, 10.64it/s]\n",
+            "Prefilled 24 text tokens, generated 36 speech tokens, current step (570 / 8192):   7%|▋         | 570/8192 [00:05<11:56, 10.64it/s]\n",
+            "Prefilled 24 text tokens, generated 36 speech tokens, current step (570 / 8192):   7%|▋         | 571/8192 [00:05<13:08,  9.67it/s]\n",
+            "Prefilled 24 text tokens, generated 37 speech tokens, current step (571 / 8192):   7%|▋         | 571/8192 [00:05<13:08,  9.67it/s]\n",
+            "Prefilled 24 text tokens, generated 38 speech tokens, current step (572 / 8192):   7%|▋         | 572/8192 [00:05<13:08,  9.67it/s]\n",
+            "Prefilled 24 text tokens, generated 38 speech tokens, current step (572 / 8192):   7%|▋         | 573/8192 [00:05<14:15,  8.90it/s]\n",
+            "Prefilled 24 text tokens, generated 39 speech tokens, current step (573 / 8192):   7%|▋         | 573/8192 [00:05<14:15,  8.90it/s]\n",
+            "Prefilled 24 text tokens, generated 39 speech tokens, current step (573 / 8192):   7%|▋         | 574/8192 [00:05<14:31,  8.74it/s]\n",
+            "Prefilled 24 text tokens, generated 40 speech tokens, current step (574 / 8192):   7%|▋         | 574/8192 [00:05<14:31,  8.74it/s]\n",
+            "Prefilled 24 text tokens, generated 40 speech tokens, current step (574 / 8192):   7%|▋         | 575/8192 [00:05<15:13,  8.34it/s]\n",
+            "Prefilled 24 text tokens, generated 41 speech tokens, current step (575 / 8192):   7%|▋         | 575/8192 [00:05<15:13,  8.34it/s]\n",
+            "Prefilled 24 text tokens, generated 41 speech tokens, current step (575 / 8192):   7%|▋         | 576/8192 [00:05<15:24,  8.24it/s]\n",
+            "Prefilled 24 text tokens, generated 42 speech tokens, current step (576 / 8192):   7%|▋         | 576/8192 [00:05<15:24,  8.24it/s]\n",
+            "Prefilled 24 text tokens, generated 42 speech tokens, current step (576 / 8192):   7%|▋         | 577/8192 [00:05<15:44,  8.06it/s]\n",
+            "Prefilled 24 text tokens, generated 43 speech tokens, current step (577 / 8192):   7%|▋         | 577/8192 [00:05<15:44,  8.06it/s]INFO:     connection closed\n",
+            "\n",
+            "Prefilled 24 text tokens, generated 43 speech tokens, current step (577 / 8192):   7%|▋         | 578/8192 [00:06<15:44,  8.06it/s]\n",
+            "Prefilled 24 text tokens, generated 44 speech tokens, current step (578 / 8192):   7%|▋         | 578/8192 [00:06<15:44,  8.06it/s]\n",
+            "Prefilled 24 text tokens, generated 44 speech tokens, current step (578 / 8192):   7%|▋         | 579/8192 [00:06<15:47,  8.03it/s]\n",
+            "Prefilled 24 text tokens, generated 45 speech tokens, current step (579 / 8192):   7%|▋         | 579/8192 [00:06<15:47,  8.03it/s]\n",
+            "Prefilled 24 text tokens, generated 45 speech tokens, current step (579 / 8192):   7%|▋         | 580/8192 [00:06<15:47,  8.04it/s]\n",
+            "Prefilled 24 text tokens, generated 46 speech tokens, current step (580 / 8192):   7%|▋         | 580/8192 [00:06<15:47,  8.04it/s]\n",
+            "Prefilled 24 text tokens, generated 46 speech tokens, current step (580 / 8192):   7%|▋         | 581/8192 [00:06<16:21,  7.76it/s]\n",
+            "Prefilled 24 text tokens, generated 47 speech tokens, current step (581 / 8192):   7%|▋         | 581/8192 [00:06<16:21,  7.76it/s]\n",
+            "Prefilled 24 text tokens, generated 47 speech tokens, current step (581 / 8192):   7%|▋         | 582/8192 [00:06<16:18,  7.77it/s]\n",
+            "Prefilled 24 text tokens, generated 48 speech tokens, current step (582 / 8192):   7%|▋         | 582/8192 [00:06<16:18,  7.77it/s]\n",
+            "\n",
+            "ERROR:    Exception in ASGI application\n",
+            "Traceback (most recent call last):\n",
+            "File \"/usr/local/lib/python3.12/dist-packages/uvicorn/protocols/websockets/websockets_impl.py\", line 244, in run_asgi\n",
+            "result = await self.app(self.scope, self.asgi_receive, self.asgi_send)  # type: ignore[func-returns-value]\n",
+            "^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\n",
+            "File \"/usr/local/lib/python3.12/dist-packages/uvicorn/middleware/proxy_headers.py\", line 60, in __call__\n",
+            "return await self.app(scope, receive, send)\n",
+            "^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^\n",
+            "File \"/usr/local/lib/python3.12/dist-packages/fastapi/applications.py\", line 1133, in __call__\n",
+            "await super().__call__(scope, receive, send)\n",
+            "File \"/usr/local/lib/python3.12/dist-packages/starlette/applications.py\", line 113, in __call__\n",
+            "await self.middleware_stack(scope, receive, send)\n",
+            "File \"/usr/local/lib/python3.12/dist-packages/starlette/middleware/errors.py\", line 151, in __call__\n",
+            "await self.app(scope, receive, send)\n",
+            "File \"/usr/local/lib/python3.12/dist-packages/starlette/middleware/exceptions.py\", line 63, in __call__\n",
+            "await wrap_app_handling_exceptions(self.app, conn)(scope, receive, send)\n",
+            "File \"/usr/local/lib/python3.12/dist-packages/starlette/_exception_handler.py\", line 53, in wrapped_app\n",
+            "raise exc\n",
+            "File \"/usr/local/lib/python3.12/dist-packages/starlette/_exception_handler.py\", line 42, in wrapped_app\n",
+            "await app(scope, receive, sender)\n",
+            "File \"/usr/local/lib/python3.12/dist-packages/fastapi/middleware/asyncexitstack.py\", line 18, in __call__\n",
+            "await self.app(scope, receive, send)\n",
+            "File \"/usr/local/lib/python3.12/dist-packages/starlette/routing.py\", line 716, in __call__\n",
+            "await self.middleware_stack(scope, receive, send)\n",
+            "File \"/usr/local/lib/python3.12/dist-packages/starlette/routing.py\", line 736, in app\n",
+            "await route.handle(scope, receive, send)\n",
+            "File \"/usr/local/lib/python3.12/dist-packages/starlette/routing.py\", line 364, in handle\n",
+            "await self.app(scope, receive, send)\n",
+            "File \"/usr/local/lib/python3.12/dist-packages/fastapi/routing.py\", line 149, in app\n",
+            "await wrap_app_handling_exceptions(app, session)(scope, receive, send)\n",
+            "File \"/usr/local/lib/python3.12/dist-packages/starlette/_exception_handler.py\", line 53, in wrapped_app\n",
+            "raise exc\n",
+            "File \"/usr/local/lib/python3.12/dist-packages/starlette/_exception_handler.py\", line 42, in wrapped_app\n",
+            "await app(scope, receive, sender)\n",
+            "File \"/usr/local/lib/python3.12/dist-packages/fastapi/routing.py\", line 146, in app\n",
+            "await func(session)\n",
+            "File \"/usr/local/lib/python3.12/dist-packages/fastapi/routing.py\", line 459, in app\n",
+            "await dependant.call(**solved_result.values)\n",
+            "File \"/content/VibeVoice/demo/web/app.py\", line 487, in websocket_stream\n",
+            "await ws.close()\n",
+            "File \"/usr/local/lib/python3.12/dist-packages/starlette/websockets.py\", line 181, in close\n",
+            "await self.send({\"type\": \"websocket.close\", \"code\": code, \"reason\": reason or \"\"})\n",
+            "File \"/usr/local/lib/python3.12/dist-packages/starlette/websockets.py\", line 98, in send\n",
+            "raise RuntimeError('Cannot call \"send\" once a close message has been sent.')\n",
+            "RuntimeError: Cannot call \"send\" once a close message has been sent.\n",
+            "INFO:     2804:b14:8104:2d70:5108:55d0:5e0a:75b4:0 - \"WebSocket /stream?text=Enter+your+text+here+and+click+%22Start%22+to+instantly+hear+the+VibeVoice-Realtime+TTS+output+audio.&cfg=1.500&steps=5&voice=pt-Spk1_man\" [accepted]\n",
+            "INFO:     connection open\n",
+            "Client disconnected (WebSocketDisconnect)\n",
+            "Client connected, text='Enter your text here and click \"Start\" to instantly hear the VibeVoice-Realtime TTS output audio.'\n",
+            "[startup] Loading voice preset pt-Spk1_man from /content/VibeVoice/demo/voices/streaming_model/pt-Spk1_man.pt\n",
+            "[startup] Loading prefilled prompt from /content/VibeVoice/demo/voices/streaming_model/pt-Spk1_man.pt\n",
+            "\n",
+            "Prefilled 259 tokens, current step (259 / 8192):   3%|▎         | 259/8192 [00:00<?, ?it/s]\n",
+            "Prefilled 5 text tokens, generated 0 speech tokens, current step (264 / 8192):   3%|▎         | 264/8192 [00:00<00:00, 32716.88it/s]\n",
+            "Prefilled 5 text tokens, generated 0 speech tokens, current step (264 / 8192):   3%|▎         | 265/8192 [00:00<03:29, 37.92it/s]\n",
+            "Prefilled 5 text tokens, generated 1 speech tokens, current step (265 / 8192):   3%|▎         | 265/8192 [00:00<03:29, 37.92it/s]\n",
+            "Prefilled 5 text tokens, generated 2 speech tokens, current step (266 / 8192):   3%|▎         | 266/8192 [00:00<03:29, 37.92it/s]\n",
+            "Prefilled 5 text tokens, generated 3 speech tokens, current step (267 / 8192):   3%|▎         | 267/8192 [00:00<03:28, 37.92it/s]\n",
+            "Prefilled 5 text tokens, generated 4 speech tokens, current step (268 / 8192):   3%|▎         | 268/8192 [00:00<03:28, 37.92it/s]\n",
+            "Prefilled 5 text tokens, generated 4 speech tokens, current step (268 / 8192):   3%|▎         | 269/8192 [00:00<09:05, 14.52it/s]\n",
+            "Prefilled 5 text tokens, generated 5 speech tokens, current step (269 / 8192):   3%|▎         | 269/8192 [00:00<09:05, 14.52it/s]\n",
+            "Prefilled 5 text tokens, generated 6 speech tokens, current step (270 / 8192):   3%|▎         | 270/8192 [00:00<09:05, 14.52it/s]\n",
+            "Prefilled 5 text tokens, generated 6 speech tokens, current step (270 / 8192):   3%|▎         | 275/8192 [00:00<06:20, 20.81it/s]\n",
+            "Prefilled 10 text tokens, generated 6 speech tokens, current step (275 / 8192):   3%|▎         | 275/8192 [00:00<06:20, 20.81it/s]\n",
+            "Prefilled 10 text tokens, generated 7 speech tokens, current step (276 / 8192):   3%|▎         | 276/8192 [00:00<06:20, 20.81it/s]\n",
+            "Prefilled 10 text tokens, generated 8 speech tokens, current step (277 / 8192):   3%|▎         | 277/8192 [00:00<06:20, 20.81it/s]\n",
+            "Prefilled 10 text tokens, generated 8 speech tokens, current step (277 / 8192):   3%|▎         | 278/8192 [00:01<08:21, 15.77it/s]\n",
+            "Prefilled 10 text tokens, generated 9 speech tokens, current step (278 / 8192):   3%|▎         | 278/8192 [00:01<08:21, 15.77it/s]\n",
+            "Prefilled 10 text tokens, generated 10 speech tokens, current step (279 / 8192):   3%|▎         | 279/8192 [00:01<08:21, 15.77it/s]\n",
+            "Prefilled 10 text tokens, generated 11 speech tokens, current step (280 / 8192):   3%|▎         | 280/8192 [00:01<08:21, 15.77it/s]\n",
+            "Prefilled 10 text tokens, generated 11 speech tokens, current step (280 / 8192):   3%|▎         | 281/8192 [00:01<09:55, 13.28it/s]\n",
+            "Prefilled 10 text tokens, generated 12 speech tokens, current step (281 / 8192):   3%|▎         | 281/8192 [00:01<09:55, 13.28it/s]\n",
+            "Prefilled 15 text tokens, generated 12 speech tokens, current step (286 / 8192):   3%|▎         | 286/8192 [00:01<09:55, 13.28it/s]\n",
+            "Prefilled 15 text tokens, generated 12 speech tokens, current step (286 / 8192):   4%|▎         | 287/8192 [00:01<06:53, 19.11it/s]\n",
+            "Prefilled 15 text tokens, generated 13 speech tokens, current step (287 / 8192):   4%|▎         | 287/8192 [00:01<06:53, 19.11it/s]\n",
+            "Prefilled 15 text tokens, generated 14 speech tokens, current step (288 / 8192):   4%|▎         | 288/8192 [00:01<06:53, 19.11it/s]\n",
+            "Prefilled 15 text tokens, generated 15 speech tokens, current step (289 / 8192):   4%|▎         | 289/8192 [00:01<06:53, 19.11it/s]\n",
+            "Prefilled 15 text tokens, generated 15 speech tokens, current step (289 / 8192):   4%|▎         | 290/8192 [00:01<08:30, 15.47it/s]\n",
+            "Prefilled 15 text tokens, generated 16 speech tokens, current step (290 / 8192):   4%|▎         | 290/8192 [00:01<08:30, 15.47it/s]\n",
+            "Prefilled 15 text tokens, generated 17 speech tokens, current step (291 / 8192):   4%|▎         | 291/8192 [00:01<08:30, 15.47it/s]\n",
+            "Prefilled 15 text tokens, generated 18 speech tokens, current step (292 / 8192):   4%|▎         | 292/8192 [00:02<08:30, 15.47it/s]\n",
+            "Prefilled 15 text tokens, generated 18 speech tokens, current step (292 / 8192):   4%|▎         | 297/8192 [00:02<07:00, 18.79it/s]\n",
+            "Prefilled 20 text tokens, generated 18 speech tokens, current step (297 / 8192):   4%|▎         | 297/8192 [00:02<07:00, 18.79it/s]\n",
+            "Prefilled 20 text tokens, generated 19 speech tokens, current step (298 / 8192):   4%|▎         | 298/8192 [00:02<07:00, 18.79it/s]\n",
+            "Prefilled 20 text tokens, generated 20 speech tokens, current step (299 / 8192):   4%|▎         | 299/8192 [00:02<07:00, 18.79it/s]\n",
+            "Prefilled 20 text tokens, generated 20 speech tokens, current step (299 / 8192):   4%|▎         | 300/8192 [00:02<08:19, 15.80it/s]\n",
+            "Prefilled 20 text tokens, generated 21 speech tokens, current step (300 / 8192):   4%|▎         | 300/8192 [00:02<08:19, 15.80it/s]\n",
+            "Prefilled 20 text tokens, generated 22 speech tokens, current step (301 / 8192):   4%|▎         | 301/8192 [00:02<08:19, 15.80it/s]\n",
+            "Prefilled 20 text tokens, generated 22 speech tokens, current step (301 / 8192):   4%|▎         | 302/8192 [00:02<09:16, 14.17it/s]\n",
+            "Prefilled 20 text tokens, generated 23 speech tokens, current step (302 / 8192):   4%|▎         | 302/8192 [00:02<09:16, 14.17it/s]\n",
+            "Prefilled 20 text tokens, generated 24 speech tokens, current step (303 / 8192):   4%|▎         | 303/8192 [00:02<09:16, 14.17it/s]\n",
+            "Prefilled 20 text tokens, generated 24 speech tokens, current step (303 / 8192):   4%|▎         | 307/8192 [00:02<07:21, 17.88it/s]\n",
+            "Prefilled 24 text tokens, generated 24 speech tokens, current step (307 / 8192):   4%|▎         | 307/8192 [00:02<07:21, 17.88it/s]\n",
+            "Prefilled 24 text tokens, generated 25 speech tokens, current step (308 / 8192):   4%|▍         | 308/8192 [00:02<07:20, 17.88it/s]\n",
+            "Prefilled 24 text tokens, generated 26 speech tokens, current step (309 / 8192):   4%|▍         | 309/8192 [00:03<07:20, 17.88it/s]\n",
+            "Prefilled 24 text tokens, generated 26 speech tokens, current step (309 / 8192):   4%|▍         | 310/8192 [00:03<08:51, 14.83it/s]\n",
+            "Prefilled 24 text tokens, generated 27 speech tokens, current step (310 / 8192):   4%|▍         | 310/8192 [00:03<08:51, 14.83it/s]\n",
+            "Prefilled 24 text tokens, generated 28 speech tokens, current step (311 / 8192):   4%|▍         | 311/8192 [00:03<08:51, 14.83it/s]\n",
+            "Prefilled 24 text tokens, generated 28 speech tokens, current step (311 / 8192):   4%|▍         | 312/8192 [00:03<09:55, 13.24it/s]\n",
+            "Prefilled 24 text tokens, generated 29 speech tokens, current step (312 / 8192):   4%|▍         | 312/8192 [00:03<09:55, 13.24it/s]\n",
+            "Prefilled 24 text tokens, generated 30 speech tokens, current step (313 / 8192):   4%|▍         | 313/8192 [00:03<09:55, 13.24it/s]\n",
+            "Prefilled 24 text tokens, generated 30 speech tokens, current step (313 / 8192):   4%|▍         | 314/8192 [00:03<10:41, 12.28it/s]\n",
+            "Prefilled 24 text tokens, generated 31 speech tokens, current step (314 / 8192):   4%|▍         | 314/8192 [00:03<10:41, 12.28it/s]\n",
+            "Prefilled 24 text tokens, generated 32 speech tokens, current step (315 / 8192):   4%|▍         | 315/8192 [00:03<10:41, 12.28it/s]\n",
+            "Prefilled 24 text tokens, generated 32 speech tokens, current step (315 / 8192):   4%|▍         | 316/8192 [00:03<11:24, 11.51it/s]\n",
+            "Prefilled 24 text tokens, generated 33 speech tokens, current step (316 / 8192):   4%|▍         | 316/8192 [00:03<11:24, 11.51it/s]\n",
+            "Prefilled 24 text tokens, generated 34 speech tokens, current step (317 / 8192):   4%|▍         | 317/8192 [00:03<11:24, 11.51it/s]\n",
+            "Prefilled 24 text tokens, generated 34 speech tokens, current step (317 / 8192):   4%|▍         | 318/8192 [00:03<11:59, 10.95it/s]\n",
+            "Prefilled 24 text tokens, generated 35 speech tokens, current step (318 / 8192):   4%|▍         | 318/8192 [00:03<11:59, 10.95it/s]\n",
+            "Prefilled 24 text tokens, generated 36 speech tokens, current step (319 / 8192):   4%|▍         | 319/8192 [00:04<11:59, 10.95it/s]\n",
+            "Prefilled 24 text tokens, generated 36 speech tokens, current step (319 / 8192):   4%|▍         | 320/8192 [00:04<12:26, 10.55it/s]\n",
+            "Prefilled 24 text tokens, generated 37 speech tokens, current step (320 / 8192):   4%|▍         | 320/8192 [00:04<12:26, 10.55it/s]\n",
+            "Prefilled 24 text tokens, generated 38 speech tokens, current step (321 / 8192):   4%|▍         | 321/8192 [00:04<12:26, 10.55it/s]\n",
+            "Prefilled 24 text tokens, generated 38 speech tokens, current step (321 / 8192):   4%|▍         | 322/8192 [00:04<12:46, 10.27it/s]\n",
+            "Prefilled 24 text tokens, generated 39 speech tokens, current step (322 / 8192):   4%|▍         | 322/8192 [00:04<12:46, 10.27it/s]\n",
+            "Prefilled 24 text tokens, generated 40 speech tokens, current step (323 / 8192):   4%|▍         | 323/8192 [00:04<12:45, 10.27it/s]\n",
+            "Prefilled 24 text tokens, generated 40 speech tokens, current step (323 / 8192):   4%|▍         | 324/8192 [00:04<13:06, 10.00it/s]\n",
+            "Prefilled 24 text tokens, generated 41 speech tokens, current step (324 / 8192):   4%|▍         | 324/8192 [00:04<13:06, 10.00it/s]\n",
+            "Prefilled 24 text tokens, generated 42 speech tokens, current step (325 / 8192):   4%|▍         | 325/8192 [00:04<13:06, 10.00it/s]\n",
+            "Prefilled 24 text tokens, generated 42 speech tokens, current step (325 / 8192):   4%|▍         | 326/8192 [00:04<13:19,  9.84it/s]\n",
+            "Prefilled 24 text tokens, generated 43 speech tokens, current step (326 / 8192):   4%|▍         | 326/8192 [00:04<13:19,  9.84it/s]\n",
+            "Prefilled 24 text tokens, generated 43 speech tokens, current step (326 / 8192):   4%|▍         | 327/8192 [00:04<13:28,  9.72it/s]\n",
+            "Prefilled 24 text tokens, generated 44 speech tokens, current step (327 / 8192):   4%|▍         | 327/8192 [00:04<13:28,  9.72it/s]\n",
+            "Prefilled 24 text tokens, generated 44 speech tokens, current step (327 / 8192):   4%|▍         | 328/8192 [00:05<13:24,  9.77it/s]\n",
+            "Prefilled 24 text tokens, generated 45 speech tokens, current step (328 / 8192):   4%|▍         | 328/8192 [00:05<13:24,  9.77it/s]\n",
+            "Prefilled 24 text tokens, generated 45 speech tokens, current step (328 / 8192):   4%|▍         | 329/8192 [00:05<13:49,  9.48it/s]\n",
+            "Prefilled 24 text tokens, generated 46 speech tokens, current step (329 / 8192):   4%|▍         | 329/8192 [00:05<13:49,  9.48it/s]\n",
+            "Prefilled 24 text tokens, generated 46 speech tokens, current step (329 / 8192):   4%|▍         | 330/8192 [00:05<13:54,  9.42it/s]\n",
+            "Prefilled 24 text tokens, generated 47 speech tokens, current step (330 / 8192):   4%|▍         | 330/8192 [00:05<13:54,  9.42it/s]\n",
+            "Prefilled 24 text tokens, generated 47 speech tokens, current step (330 / 8192):   4%|▍         | 331/8192 [00:05<13:44,  9.53it/s]\n",
+            "Prefilled 24 text tokens, generated 48 speech tokens, current step (331 / 8192):   4%|▍         | 331/8192 [00:05<13:44,  9.53it/s]\n",
+            "Prefilled 24 text tokens, generated 48 speech tokens, current step (331 / 8192):   4%|▍         | 332/8192 [00:05<13:35,  9.63it/s]\n",
+            "Prefilled 24 text tokens, generated 49 speech tokens, current step (332 / 8192):   4%|▍         | 332/8192 [00:05<13:35,  9.63it/s]\n",
+            "Prefilled 24 text tokens, generated 49 speech tokens, current step (332 / 8192):   4%|▍         | 333/8192 [00:05<13:36,  9.63it/s]\n",
+            "Prefilled 24 text tokens, generated 50 speech tokens, current step (333 / 8192):   4%|▍         | 333/8192 [00:05<13:36,  9.63it/s]\n",
+            "Prefilled 24 text tokens, generated 50 speech tokens, current step (333 / 8192):   4%|▍         | 334/8192 [00:05<13:40,  9.57it/s]\n",
+            "Prefilled 24 text tokens, generated 51 speech tokens, current step (334 / 8192):   4%|▍         | 334/8192 [00:05<13:40,  9.57it/s]\n",
+            "Prefilled 24 text tokens, generated 51 speech tokens, current step (334 / 8192):   4%|▍         | 335/8192 [00:05<13:43,  9.54it/s]\n",
+            "Prefilled 24 text tokens, generated 52 speech tokens, current step (335 / 8192):   4%|▍         | 335/8192 [00:05<13:43,  9.54it/s]\n",
+            "Prefilled 24 text tokens, generated 52 speech tokens, current step (335 / 8192):   4%|▍         | 336/8192 [00:05<13:41,  9.56it/s]\n",
+            "Prefilled 24 text tokens, generated 53 speech tokens, current step (336 / 8192):   4%|▍         | 336/8192 [00:05<13:41,  9.56it/s]\n",
+            "Prefilled 24 text tokens, generated 53 speech tokens, current step (336 / 8192):   4%|▍         | 337/8192 [00:05<13:40,  9.57it/s]\n",
+            "Prefilled 24 text tokens, generated 54 speech tokens, current step (337 / 8192):   4%|▍         | 337/8192 [00:05<13:40,  9.57it/s]\n",
+            "Prefilled 24 text tokens, generated 54 speech tokens, current step (337 / 8192):   4%|▍         | 338/8192 [00:06<13:33,  9.65it/s]\n",
+            "Prefilled 24 text tokens, generated 55 speech tokens, current step (338 / 8192):   4%|▍         | 338/8192 [00:06<13:33,  9.65it/s]\n",
+            "Prefilled 24 text tokens, generated 55 speech tokens, current step (338 / 8192):   4%|▍         | 339/8192 [00:06<14:16,  9.17it/s]\n",
+            "Prefilled 24 text tokens, generated 56 speech tokens, current step (339 / 8192):   4%|▍         | 339/8192 [00:06<14:16,  9.17it/s]\n",
+            "Prefilled 24 text tokens, generated 56 speech tokens, current step (339 / 8192):   4%|▍         | 340/8192 [00:06<14:09,  9.24it/s]\n",
+            "Prefilled 24 text tokens, generated 57 speech tokens, current step (340 / 8192):   4%|▍         | 340/8192 [00:06<14:09,  9.24it/s]\n",
+            "Prefilled 24 text tokens, generated 57 speech tokens, current step (340 / 8192):   4%|▍         | 341/8192 [00:06<13:57,  9.37it/s]\n",
+            "Prefilled 24 text tokens, generated 58 speech tokens, current step (341 / 8192):   4%|▍         | 341/8192 [00:06<13:57,  9.37it/s]\n",
+            "Prefilled 24 text tokens, generated 59 speech tokens, current step (342 / 8192):   4%|▍         | 342/8192 [00:06<13:57,  9.37it/s]\n",
+            "Prefilled 24 text tokens, generated 59 speech tokens, current step (342 / 8192):   4%|▍         | 343/8192 [00:06<13:29,  9.69it/s]\n",
+            "Prefilled 24 text tokens, generated 60 speech tokens, current step (343 / 8192):   4%|▍         | 343/8192 [00:06<13:29,  9.69it/s]\n",
+            "\n",
+            "INFO:     connection closed\n",
+            "INFO:     2804:b14:8104:2d70:5108:55d0:5e0a:75b4:0 - \"WebSocket /stream?text=Enter+your+text+here+and+click+%22Start%22+to+instantly+hear+the+VibeVoice-Realtime+TTS+output+audio.&cfg=1.500&steps=5&voice=pt-Spk1_man\" [accepted]\n",
+            "INFO:     connection open\n",
+            "WS handler exit\n",
+            "Client connected, text='Enter your text here and click \"Start\" to instantly hear the VibeVoice-Realtime TTS output audio.'\n",
+            "\n",
+            "Prefilled 259 tokens, current step (259 / 8192):   3%|▎         | 259/8192 [00:00<?, ?it/s]\n",
+            "Prefilled 5 text tokens, generated 0 speech tokens, current step (264 / 8192):   3%|▎         | 264/8192 [00:00<00:00, 32665.92it/s]\n",
+            "Prefilled 5 text tokens, generated 0 speech tokens, current step (264 / 8192):   3%|▎         | 265/8192 [00:00<03:28, 38.04it/s]\n",
+            "Prefilled 5 text tokens, generated 1 speech tokens, current step (265 / 8192):   3%|▎         | 265/8192 [00:00<03:28, 38.04it/s]\n",
+            "Prefilled 5 text tokens, generated 2 speech tokens, current step (266 / 8192):   3%|▎         | 266/8192 [00:00<03:28, 38.04it/s]\n",
+            "Prefilled 5 text tokens, generated 3 speech tokens, current step (267 / 8192):   3%|▎         | 267/8192 [00:00<03:28, 38.04it/s]\n",
+            "Prefilled 5 text tokens, generated 4 speech tokens, current step (268 / 8192):   3%|▎         | 268/8192 [00:00<03:28, 38.04it/s]\n",
+            "Prefilled 5 text tokens, generated 4 speech tokens, current step (268 / 8192):   3%|▎         | 269/8192 [00:00<09:39, 13.67it/s]\n",
+            "Prefilled 5 text tokens, generated 5 speech tokens, current step (269 / 8192):   3%|▎         | 269/8192 [00:00<09:39, 13.67it/s]\n",
+            "Prefilled 5 text tokens, generated 6 speech tokens, current step (270 / 8192):   3%|▎         | 270/8192 [00:00<09:39, 13.67it/s]\n",
+            "Prefilled 5 text tokens, generated 6 speech tokens, current step (270 / 8192):   3%|▎         | 275/8192 [00:00<06:36, 19.96it/s]\n",
+            "Prefilled 10 text tokens, generated 6 speech tokens, current step (275 / 8192):   3%|▎         | 275/8192 [00:00<06:36, 19.96it/s]\n",
+            "Prefilled 10 text tokens, generated 7 speech tokens, current step (276 / 8192):   3%|▎         | 276/8192 [00:00<06:36, 19.96it/s]\n",
+            "Prefilled 10 text tokens, generated 8 speech tokens, current step (277 / 8192):   3%|▎         | 277/8192 [00:01<06:36, 19.96it/s]\n",
+            "Prefilled 10 text tokens, generated 8 speech tokens, current step (277 / 8192):   3%|▎         | 278/8192 [00:01<08:25, 15.67it/s]\n",
+            "Prefilled 10 text tokens, generated 9 speech tokens, current step (278 / 8192):   3%|▎         | 278/8192 [00:01<08:25, 15.67it/s]\n",
+            "Prefilled 10 text tokens, generated 10 speech tokens, current step (279 / 8192):   3%|▎         | 279/8192 [00:01<08:25, 15.67it/s]\n",
+            "Prefilled 10 text tokens, generated 11 speech tokens, current step (280 / 8192):   3%|▎         | 280/8192 [00:01<08:24, 15.67it/s]\n",
+            "Prefilled 10 text tokens, generated 11 speech tokens, current step (280 / 8192):   3%|▎         | 281/8192 [00:01<10:02, 13.13it/s]\n",
+            "Prefilled 10 text tokens, generated 12 speech tokens, current step (281 / 8192):   3%|▎         | 281/8192 [00:01<10:02, 13.13it/s]\n",
+            "Prefilled 15 text tokens, generated 12 speech tokens, current step (286 / 8192):   3%|▎         | 286/8192 [00:01<10:02, 13.13it/s]\n",
+            "Prefilled 15 text tokens, generated 12 speech tokens, current step (286 / 8192):   4%|▎         | 287/8192 [00:01<06:59, 18.84it/s]\n",
+            "Prefilled 15 text tokens, generated 13 speech tokens, current step (287 / 8192):   4%|▎         | 287/8192 [00:01<06:59, 18.84it/s]\n",
+            "Prefilled 15 text tokens, generated 14 speech tokens, current step (288 / 8192):   4%|▎         | 288/8192 [00:01<06:59, 18.84it/s]\n",
+            "Prefilled 15 text tokens, generated 15 speech tokens, current step (289 / 8192):   4%|▎         | 289/8192 [00:01<06:59, 18.84it/s]\n",
+            "Prefilled 15 text tokens, generated 15 speech tokens, current step (289 / 8192):   4%|▎         | 290/8192 [00:01<08:37, 15.26it/s]\n",
+            "Prefilled 15 text tokens, generated 16 speech tokens, current step (290 / 8192):   4%|▎         | 290/8192 [00:01<08:37, 15.26it/s]\n",
+            "Prefilled 15 text tokens, generated 17 speech tokens, current step (291 / 8192):   4%|▎         | 291/8192 [00:02<08:37, 15.26it/s]\n",
+            "Prefilled 15 text tokens, generated 17 speech tokens, current step (291 / 8192):   4%|▎         | 292/8192 [00:02<09:39, 13.63it/s]\n",
+            "Prefilled 15 text tokens, generated 18 speech tokens, current step (292 / 8192):   4%|▎         | 292/8192 [00:02<09:39, 13.63it/s]\n",
+            "Prefilled 20 text tokens, generated 18 speech tokens, current step (297 / 8192):   4%|▎         | 297/8192 [00:02<09:39, 13.63it/s]\n",
+            "Prefilled 20 text tokens, generated 18 speech tokens, current step (297 / 8192):   4%|▎         | 298/8192 [00:02<06:45, 19.45it/s]\n",
+            "Prefilled 20 text tokens, generated 19 speech tokens, current step (298 / 8192):   4%|▎         | 298/8192 [00:02<06:45, 19.45it/s]\n",
+            "Prefilled 20 text tokens, generated 20 speech tokens, current step (299 / 8192):   4%|▎         | 299/8192 [00:02<06:45, 19.45it/s]\n",
+            "Prefilled 20 text tokens, generated 21 speech tokens, current step (300 / 8192):   4%|▎         | 300/8192 [00:02<06:45, 19.45it/s]\n",
+            "Prefilled 20 text tokens, generated 21 speech tokens, current step (300 / 8192):   4%|▎         | 301/8192 [00:02<08:35, 15.30it/s]\n",
+            "Prefilled 20 text tokens, generated 22 speech tokens, current step (301 / 8192):   4%|▎         | 301/8192 [00:02<08:35, 15.30it/s]\n",
+            "Prefilled 20 text tokens, generated 23 speech tokens, current step (302 / 8192):   4%|▎         | 302/8192 [00:02<08:35, 15.30it/s]\n",
+            "Prefilled 20 text tokens, generated 23 speech tokens, current step (302 / 8192):   4%|▎         | 303/8192 [00:02<09:32, 13.77it/s]\n",
+            "Prefilled 20 text tokens, generated 24 speech tokens, current step (303 / 8192):   4%|▎         | 303/8192 [00:02<09:32, 13.77it/s]\n",
+            "Prefilled 24 text tokens, generated 24 speech tokens, current step (307 / 8192):   4%|▎         | 307/8192 [00:02<09:32, 13.77it/s]\n",
+            "Prefilled 24 text tokens, generated 24 speech tokens, current step (307 / 8192):   4%|▍         | 308/8192 [00:02<07:11, 18.29it/s]\n",
+            "Prefilled 24 text tokens, generated 25 speech tokens, current step (308 / 8192):   4%|▍         | 308/8192 [00:02<07:11, 18.29it/s]\n",
+            "Prefilled 24 text tokens, generated 26 speech tokens, current step (309 / 8192):   4%|▍         | 309/8192 [00:03<07:11, 18.29it/s]\n",
+            "Prefilled 24 text tokens, generated 27 speech tokens, current step (310 / 8192):   4%|▍         | 310/8192 [00:03<07:10, 18.29it/s]\n",
+            "Prefilled 24 text tokens, generated 27 speech tokens, current step (310 / 8192):   4%|▍         | 311/8192 [00:03<08:53, 14.76it/s]\n",
+            "Prefilled 24 text tokens, generated 28 speech tokens, current step (311 / 8192):   4%|▍         | 311/8192 [00:03<08:53, 14.76it/s]\n",
+            "Prefilled 24 text tokens, generated 29 speech tokens, current step (312 / 8192):   4%|▍         | 312/8192 [00:03<08:53, 14.76it/s]\n",
+            "Prefilled 24 text tokens, generated 29 speech tokens, current step (312 / 8192):   4%|▍         | 313/8192 [00:03<09:58, 13.15it/s]\n",
+            "Prefilled 24 text tokens, generated 30 speech tokens, current step (313 / 8192):   4%|▍         | 313/8192 [00:03<09:58, 13.15it/s]\n",
+            "Prefilled 24 text tokens, generated 31 speech tokens, current step (314 / 8192):   4%|▍         | 314/8192 [00:03<09:58, 13.15it/s]\n",
+            "Prefilled 24 text tokens, generated 31 speech tokens, current step (314 / 8192):   4%|▍         | 315/8192 [00:03<10:42, 12.27it/s]\n",
+            "Prefilled 24 text tokens, generated 32 speech tokens, current step (315 / 8192):   4%|▍         | 315/8192 [00:03<10:42, 12.27it/s]\n",
+            "Prefilled 24 text tokens, generated 33 speech tokens, current step (316 / 8192):   4%|▍         | 316/8192 [00:03<10:42, 12.27it/s]\n",
+            "Prefilled 24 text tokens, generated 33 speech tokens, current step (316 / 8192):   4%|▍         | 317/8192 [00:03<11:20, 11.57it/s]\n",
+            "Prefilled 24 text tokens, generated 34 speech tokens, current step (317 / 8192):   4%|▍         | 317/8192 [00:03<11:20, 11.57it/s]\n",
+            "Prefilled 24 text tokens, generated 35 speech tokens, current step (318 / 8192):   4%|▍         | 318/8192 [00:03<11:20, 11.57it/s]\n",
+            "Prefilled 24 text tokens, generated 35 speech tokens, current step (318 / 8192):   4%|▍         | 319/8192 [00:04<11:50, 11.09it/s]\n",
+            "Prefilled 24 text tokens, generated 36 speech tokens, current step (319 / 8192):   4%|▍         | 319/8192 [00:04<11:50, 11.09it/s]\n",
+            "Prefilled 24 text tokens, generated 37 speech tokens, current step (320 / 8192):   4%|▍         | 320/8192 [00:04<11:50, 11.09it/s]\n",
+            "Prefilled 24 text tokens, generated 37 speech tokens, current step (320 / 8192):   4%|▍         | 321/8192 [00:04<12:21, 10.61it/s]\n",
+            "Prefilled 24 text tokens, generated 38 speech tokens, current step (321 / 8192):   4%|▍         | 321/8192 [00:04<12:21, 10.61it/s]\n",
+            "Prefilled 24 text tokens, generated 39 speech tokens, current step (322 / 8192):   4%|▍         | 322/8192 [00:04<12:21, 10.61it/s]\n",
+            "Prefilled 24 text tokens, generated 39 speech tokens, current step (322 / 8192):   4%|▍         | 323/8192 [00:04<13:00, 10.09it/s]\n",
+            "Prefilled 24 text tokens, generated 40 speech tokens, current step (323 / 8192):   4%|▍         | 323/8192 [00:04<13:00, 10.09it/s]\n",
+            "Prefilled 24 text tokens, generated 41 speech tokens, current step (324 / 8192):   4%|▍         | 324/8192 [00:04<12:59, 10.09it/s]\n",
+            "Prefilled 24 text tokens, generated 41 speech tokens, current step (324 / 8192):   4%|▍         | 325/8192 [00:04<13:17,  9.87it/s]\n",
+            "Prefilled 24 text tokens, generated 42 speech tokens, current step (325 / 8192):   4%|▍         | 325/8192 [00:04<13:17,  9.87it/s]\n",
+            "Prefilled 24 text tokens, generated 43 speech tokens, current step (326 / 8192):   4%|▍         | 326/8192 [00:04<13:17,  9.87it/s]\n",
+            "Prefilled 24 text tokens, generated 43 speech tokens, current step (326 / 8192):   4%|▍         | 327/8192 [00:04<13:13,  9.91it/s]\n",
+            "Prefilled 24 text tokens, generated 44 speech tokens, current step (327 / 8192):   4%|▍         | 327/8192 [00:04<13:13,  9.91it/s]\n",
+            "Prefilled 24 text tokens, generated 45 speech tokens, current step (328 / 8192):   4%|▍         | 328/8192 [00:05<13:13,  9.91it/s]\n",
+            "Prefilled 24 text tokens, generated 45 speech tokens, current step (328 / 8192):   4%|▍         | 329/8192 [00:05<13:18,  9.85it/s]\n",
+            "Prefilled 24 text tokens, generated 46 speech tokens, current step (329 / 8192):   4%|▍         | 329/8192 [00:05<13:18,  9.85it/s]\n",
+            "Prefilled 24 text tokens, generated 47 speech tokens, current step (330 / 8192):   4%|▍         | 330/8192 [00:05<13:18,  9.85it/s]\n",
+            "Prefilled 24 text tokens, generated 47 speech tokens, current step (330 / 8192):   4%|▍         | 331/8192 [00:05<13:08,  9.98it/s]\n",
+            "Prefilled 24 text tokens, generated 48 speech tokens, current step (331 / 8192):   4%|▍         | 331/8192 [00:05<13:08,  9.98it/s]\n",
+            "\n",
+            "INFO:     connection closed\n",
+            "INFO:     2804:b14:8104:2d70:5108:55d0:5e0a:75b4:0 - \"WebSocket /stream?text=Eu+consigo+falar+aqui+por+texto+e+me+falando+e+falando+e+a%C3%AD+vai+pegar+e+vai+passar+por+algum+outro+tipo+de+an%C3%A1lise+ou+n%C3%A3o+%C3%A9+s%C3%B3+%0A&cfg=1.500&steps=5&voice=pt-Spk1_man\" [accepted]\n",
+            "INFO:     connection open\n",
+            "WS handler exit\n",
+            "Client connected, text='Eu consigo falar aqui por texto e me falando e falando e aí vai pegar e vai passar por algum outro tipo de análise ou não é só \\n'\n",
+            "\n",
+            "Prefilled 259 tokens, current step (259 / 8192):   3%|▎         | 259/8192 [00:00<?, ?it/s]\n",
+            "Prefilled 5 text tokens, generated 0 speech tokens, current step (264 / 8192):   3%|▎         | 264/8192 [00:00<00:00, 31536.12it/s]\n",
+            "Prefilled 5 text tokens, generated 0 speech tokens, current step (264 / 8192):   3%|▎         | 265/8192 [00:00<03:31, 37.48it/s]\n",
+            "Prefilled 5 text tokens, generated 1 speech tokens, current step (265 / 8192):   3%|▎         | 265/8192 [00:00<03:31, 37.48it/s]\n",
+            "Prefilled 5 text tokens, generated 2 speech tokens, current step (266 / 8192):   3%|▎         | 266/8192 [00:00<03:31, 37.48it/s]\n",
+            "Prefilled 5 text tokens, generated 3 speech tokens, current step (267 / 8192):   3%|▎         | 267/8192 [00:00<03:31, 37.48it/s]\n",
+            "Prefilled 5 text tokens, generated 4 speech tokens, current step (268 / 8192):   3%|▎         | 268/8192 [00:00<03:31, 37.48it/s]\n",
+            "Prefilled 5 text tokens, generated 4 speech tokens, current step (268 / 8192):   3%|▎         | 269/8192 [00:00<09:40, 13.66it/s]\n",
+            "Prefilled 5 text tokens, generated 5 speech tokens, current step (269 / 8192):   3%|▎         | 269/8192 [00:00<09:40, 13.66it/s]\n",
+            "Prefilled 5 text tokens, generated 6 speech tokens, current step (270 / 8192):   3%|▎         | 270/8192 [00:00<09:40, 13.66it/s]\n",
+            "Prefilled 5 text tokens, generated 6 speech tokens, current step (270 / 8192):   3%|▎         | 275/8192 [00:00<06:36, 19.96it/s]\n",
+            "Prefilled 10 text tokens, generated 6 speech tokens, current step (275 / 8192):   3%|▎         | 275/8192 [00:00<06:36, 19.96it/s]\n",
+            "Prefilled 10 text tokens, generated 7 speech tokens, current step (276 / 8192):   3%|▎         | 276/8192 [00:00<06:36, 19.96it/s]\n",
+            "Prefilled 10 text tokens, generated 8 speech tokens, current step (277 / 8192):   3%|▎         | 277/8192 [00:01<06:36, 19.96it/s]\n",
+            "Prefilled 10 text tokens, generated 8 speech tokens, current step (277 / 8192):   3%|▎         | 278/8192 [00:01<08:30, 15.50it/s]\n",
+            "Prefilled 10 text tokens, generated 9 speech tokens, current step (278 / 8192):   3%|▎         | 278/8192 [00:01<08:30, 15.50it/s]\n",
+            "Prefilled 10 text tokens, generated 10 speech tokens, current step (279 / 8192):   3%|▎         | 279/8192 [00:01<08:30, 15.50it/s]\n",
+            "Prefilled 10 text tokens, generated 11 speech tokens, current step (280 / 8192):   3%|▎         | 280/8192 [00:01<08:30, 15.50it/s]\n",
+            "Prefilled 10 text tokens, generated 11 speech tokens, current step (280 / 8192):   3%|▎         | 281/8192 [00:01<10:06, 13.04it/s]\n",
+            "Prefilled 10 text tokens, generated 12 speech tokens, current step (281 / 8192):   3%|▎         | 281/8192 [00:01<10:06, 13.04it/s]\n",
+            "Prefilled 15 text tokens, generated 12 speech tokens, current step (286 / 8192):   3%|▎         | 286/8192 [00:01<10:06, 13.04it/s]\n",
+            "Prefilled 15 text tokens, generated 12 speech tokens, current step (286 / 8192):   4%|▎         | 287/8192 [00:01<07:02, 18.72it/s]\n",
+            "Prefilled 15 text tokens, generated 13 speech tokens, current step (287 / 8192):   4%|▎         | 287/8192 [00:01<07:02, 18.72it/s]\n",
+            "Prefilled 15 text tokens, generated 14 speech tokens, current step (288 / 8192):   4%|▎         | 288/8192 [00:01<07:02, 18.72it/s]\n",
+            "Prefilled 15 text tokens, generated 15 speech tokens, current step (289 / 8192):   4%|▎         | 289/8192 [00:01<07:02, 18.72it/s]\n",
+            "Prefilled 15 text tokens, generated 15 speech tokens, current step (289 / 8192):   4%|▎         | 290/8192 [00:01<08:46, 15.00it/s]\n",
+            "Prefilled 15 text tokens, generated 16 speech tokens, current step (290 / 8192):   4%|▎         | 290/8192 [00:01<08:46, 15.00it/s]\n",
+            "Prefilled 15 text tokens, generated 17 speech tokens, current step (291 / 8192):   4%|▎         | 291/8192 [00:02<08:46, 15.00it/s]\n",
+            "Prefilled 15 text tokens, generated 17 speech tokens, current step (291 / 8192):   4%|▎         | 292/8192 [00:02<09:46, 13.46it/s]\n",
+            "Prefilled 15 text tokens, generated 18 speech tokens, current step (292 / 8192):   4%|▎         | 292/8192 [00:02<09:46, 13.46it/s]\n",
+            "Prefilled 20 text tokens, generated 18 speech tokens, current step (297 / 8192):   4%|▎         | 297/8192 [00:02<09:46, 13.46it/s]\n",
+            "Prefilled 20 text tokens, generated 18 speech tokens, current step (297 / 8192):   4%|▎         | 298/8192 [00:02<06:51, 19.19it/s]\n",
+            "Prefilled 20 text tokens, generated 19 speech tokens, current step (298 / 8192):   4%|▎         | 298/8192 [00:02<06:51, 19.19it/s]\n",
+            "Prefilled 20 text tokens, generated 20 speech tokens, current step (299 / 8192):   4%|▎         | 299/8192 [00:02<06:51, 19.19it/s]\n",
+            "Prefilled 20 text tokens, generated 21 speech tokens, current step (300 / 8192):   4%|▎         | 300/8192 [00:02<06:51, 19.19it/s]\n",
+            "Prefilled 20 text tokens, generated 21 speech tokens, current step (300 / 8192):   4%|▎         | 301/8192 [00:02<08:41, 15.14it/s]\n",
+            "Prefilled 20 text tokens, generated 22 speech tokens, current step (301 / 8192):   4%|▎         | 301/8192 [00:02<08:41, 15.14it/s]\n",
+            "Prefilled 20 text tokens, generated 23 speech tokens, current step (302 / 8192):   4%|▎         | 302/8192 [00:02<08:41, 15.14it/s]\n",
+            "Prefilled 20 text tokens, generated 23 speech tokens, current step (302 / 8192):   4%|▎         | 303/8192 [00:02<09:37, 13.66it/s]\n",
+            "Prefilled 20 text tokens, generated 24 speech tokens, current step (303 / 8192):   4%|▎         | 303/8192 [00:02<09:37, 13.66it/s]\n",
+            "Prefilled 25 text tokens, generated 24 speech tokens, current step (308 / 8192):   4%|▍         | 308/8192 [00:02<09:37, 13.66it/s]\n",
+            "Prefilled 25 text tokens, generated 24 speech tokens, current step (308 / 8192):   4%|▍         | 309/8192 [00:02<06:41, 19.65it/s]\n",
+            "Prefilled 25 text tokens, generated 25 speech tokens, current step (309 / 8192):   4%|▍         | 309/8192 [00:02<06:41, 19.65it/s]\n",
+            "Prefilled 25 text tokens, generated 26 speech tokens, current step (310 / 8192):   4%|▍         | 310/8192 [00:03<06:41, 19.65it/s]\n",
+            "Prefilled 25 text tokens, generated 27 speech tokens, current step (311 / 8192):   4%|▍         | 311/8192 [00:03<06:41, 19.65it/s]\n",
+            "Prefilled 25 text tokens, generated 27 speech tokens, current step (311 / 8192):   4%|▍         | 312/8192 [00:03<08:45, 14.99it/s]\n",
+            "Prefilled 25 text tokens, generated 28 speech tokens, current step (312 / 8192):   4%|▍         | 312/8192 [00:03<08:45, 14.99it/s]\n",
+            "Prefilled 25 text tokens, generated 29 speech tokens, current step (313 / 8192):   4%|▍         | 313/8192 [00:03<08:45, 14.99it/s]\n",
+            "Prefilled 25 text tokens, generated 29 speech tokens, current step (313 / 8192):   4%|▍         | 314/8192 [00:03<09:45, 13.46it/s]\n",
+            "Prefilled 25 text tokens, generated 30 speech tokens, current step (314 / 8192):   4%|▍         | 314/8192 [00:03<09:45, 13.46it/s]\n",
+            "Prefilled 30 text tokens, generated 30 speech tokens, current step (319 / 8192):   4%|▍         | 319/8192 [00:03<09:44, 13.46it/s]\n",
+            "Prefilled 30 text tokens, generated 30 speech tokens, current step (319 / 8192):   4%|▍         | 320/8192 [00:03<06:45, 19.42it/s]\n",
+            "Prefilled 30 text tokens, generated 31 speech tokens, current step (320 / 8192):   4%|▍         | 320/8192 [00:03<06:45, 19.42it/s]\n",
+            "Prefilled 30 text tokens, generated 32 speech tokens, current step (321 / 8192):   4%|▍         | 321/8192 [00:03<06:45, 19.42it/s]\n",
+            "Prefilled 30 text tokens, generated 33 speech tokens, current step (322 / 8192):   4%|▍         | 322/8192 [00:03<06:45, 19.42it/s]\n",
+            "Prefilled 30 text tokens, generated 33 speech tokens, current step (322 / 8192):   4%|▍         | 323/8192 [00:03<08:28, 15.47it/s]\n",
+            "Prefilled 30 text tokens, generated 34 speech tokens, current step (323 / 8192):   4%|▍         | 323/8192 [00:03<08:28, 15.47it/s]\n",
+            "Prefilled 30 text tokens, generated 35 speech tokens, current step (324 / 8192):   4%|▍         | 324/8192 [00:04<08:28, 15.47it/s]\n",
+            "Prefilled 30 text tokens, generated 36 speech tokens, current step (325 / 8192):   4%|▍         | 325/8192 [00:04<08:28, 15.47it/s]\n",
+            "Prefilled 30 text tokens, generated 36 speech tokens, current step (325 / 8192):   4%|▍         | 330/8192 [00:04<06:56, 18.89it/s]\n",
+            "Prefilled 35 text tokens, generated 36 speech tokens, current step (330 / 8192):   4%|▍         | 330/8192 [00:04<06:56, 18.89it/s]\n",
+            "Prefilled 35 text tokens, generated 37 speech tokens, current step (331 / 8192):   4%|▍         | 331/8192 [00:04<06:56, 18.89it/s]\n",
+            "Prefilled 35 text tokens, generated 38 speech tokens, current step (332 / 8192):   4%|▍         | 332/8192 [00:04<06:56, 18.89it/s]\n",
+            "Prefilled 35 text tokens, generated 38 speech tokens, current step (332 / 8192):   4%|▍         | 333/8192 [00:04<08:19, 15.73it/s]\n",
+            "Prefilled 35 text tokens, generated 39 speech tokens, current step (333 / 8192):   4%|▍         | 333/8192 [00:04<08:19, 15.73it/s]\n",
+            "Prefilled 35 text tokens, generated 40 speech tokens, current step (334 / 8192):   4%|▍         | 334/8192 [00:04<08:19, 15.73it/s]\n",
+            "Prefilled 35 text tokens, generated 40 speech tokens, current step (334 / 8192):   4%|▍         | 335/8192 [00:04<09:08, 14.32it/s]\n",
+            "Prefilled 35 text tokens, generated 41 speech tokens, current step (335 / 8192):   4%|▍         | 335/8192 [00:04<09:08, 14.32it/s]\n",
+            "Prefilled 35 text tokens, generated 42 speech tokens, current step (336 / 8192):   4%|▍         | 336/8192 [00:04<09:08, 14.32it/s]\n",
+            "Prefilled 35 text tokens, generated 42 speech tokens, current step (336 / 8192):   4%|▍         | 337/8192 [00:04<09:24, 13.92it/s]\n",
+            "Prefilled 36 text tokens, generated 42 speech tokens, current step (337 / 8192):   4%|▍         | 337/8192 [00:04<09:24, 13.92it/s]\n",
+            "Prefilled 36 text tokens, generated 43 speech tokens, current step (338 / 8192):   4%|▍         | 338/8192 [00:05<09:24, 13.92it/s]\n",
+            "Prefilled 36 text tokens, generated 43 speech tokens, current step (338 / 8192):   4%|▍         | 339/8192 [00:05<10:04, 12.98it/s]\n",
+            "Prefilled 36 text tokens, generated 44 speech tokens, current step (339 / 8192):   4%|▍         | 339/8192 [00:05<10:04, 12.98it/s]\n",
+            "Prefilled 36 text tokens, generated 45 speech tokens, current step (340 / 8192):   4%|▍         | 340/8192 [00:05<10:04, 12.98it/s]\n",
+            "Prefilled 36 text tokens, generated 45 speech tokens, current step (340 / 8192):   4%|▍         | 341/8192 [00:05<10:59, 11.90it/s]\n",
+            "Prefilled 36 text tokens, generated 46 speech tokens, current step (341 / 8192):   4%|▍         | 341/8192 [00:05<10:59, 11.90it/s]\n",
+            "Prefilled 36 text tokens, generated 47 speech tokens, current step (342 / 8192):   4%|▍         | 342/8192 [00:05<10:59, 11.90it/s]\n",
+            "Prefilled 36 text tokens, generated 47 speech tokens, current step (342 / 8192):   4%|▍         | 343/8192 [00:05<11:58, 10.92it/s]\n",
+            "Prefilled 36 text tokens, generated 48 speech tokens, current step (343 / 8192):   4%|▍         | 343/8192 [00:05<11:58, 10.92it/s]\n",
+            "Prefilled 36 text tokens, generated 49 speech tokens, current step (344 / 8192):   4%|▍         | 344/8192 [00:05<11:58, 10.92it/s]\n",
+            "Prefilled 36 text tokens, generated 49 speech tokens, current step (344 / 8192):   4%|▍         | 345/8192 [00:05<12:24, 10.53it/s]\n",
+            "Prefilled 36 text tokens, generated 50 speech tokens, current step (345 / 8192):   4%|▍         | 345/8192 [00:05<12:24, 10.53it/s]\n",
+            "Prefilled 36 text tokens, generated 51 speech tokens, current step (346 / 8192):   4%|▍         | 346/8192 [00:05<12:24, 10.53it/s]\n",
+            "Prefilled 36 text tokens, generated 51 speech tokens, current step (346 / 8192):   4%|▍         | 347/8192 [00:05<12:39, 10.33it/s]\n",
+            "Prefilled 36 text tokens, generated 52 speech tokens, current step (347 / 8192):   4%|▍         | 347/8192 [00:05<12:39, 10.33it/s]\n",
+            "Prefilled 36 text tokens, generated 53 speech tokens, current step (348 / 8192):   4%|▍         | 348/8192 [00:06<12:39, 10.33it/s]\n",
+            "Prefilled 36 text tokens, generated 53 speech tokens, current step (348 / 8192):   4%|▍         | 349/8192 [00:06<12:56, 10.10it/s]\n",
+            "Prefilled 36 text tokens, generated 54 speech tokens, current step (349 / 8192):   4%|▍         | 349/8192 [00:06<12:56, 10.10it/s]\n",
+            "\n",
+            "INFO:     connection closed\n",
+            "INFO:     2804:b14:8104:2d70:5108:55d0:5e0a:75b4:0 - \"WebSocket /stream?text=Esse+modo+de+vibra%C3%A7%C3%A3o+viber+code+vai+ser+muito+muito+interessante+porque+d%C3%A1+para+eu+organizar+todas+as+ideias+do+caderno+da+cabe%C3%A7a+de+qualquer+lugar+s%C3%B3+usando+isso+aqui+como+backlog+o+meu+backlog+ia+ser+o+backlog+Premiere+talvez+ainda+seja+esse+esse+neg%C3%B3cio+por%C3%A9m+agora+eu+vou+realmente+focar+mais+de+couro+hein+%0A&cfg=2.000&steps=5&voice=pt-Spk1_man\" [accepted]\n",
+            "INFO:     connection open\n",
+            "WS handler exit\n",
+            "Client connected, text='Esse modo de vibração viber code vai ser muito muito interessante porque dá para eu organizar todas as ideias do caderno da cabeça de qualquer lugar só usando isso aqui como backlog o meu backlog ia ser o backlog Premiere talvez ainda seja esse esse negócio porém agora eu vou realmente focar mais de couro hein \\n'\n",
+            "\n",
+            "Prefilled 259 tokens, current step (259 / 8192):   3%|▎         | 259/8192 [00:00<?, ?it/s]\n",
+            "Prefilled 5 text tokens, generated 0 speech tokens, current step (264 / 8192):   3%|▎         | 264/8192 [00:00<00:00, 32017.59it/s]\n",
+            "Prefilled 5 text tokens, generated 0 speech tokens, current step (264 / 8192):   3%|▎         | 265/8192 [00:00<03:22, 39.12it/s]\n",
+            "Prefilled 5 text tokens, generated 1 speech tokens, current step (265 / 8192):   3%|▎         | 265/8192 [00:00<03:22, 39.12it/s]\n",
+            "Prefilled 5 text tokens, generated 2 speech tokens, current step (266 / 8192):   3%|▎         | 266/8192 [00:00<03:22, 39.12it/s]\n",
+            "Prefilled 5 text tokens, generated 3 speech tokens, current step (267 / 8192):   3%|▎         | 267/8192 [00:00<03:22, 39.12it/s]\n",
+            "Prefilled 5 text tokens, generated 4 speech tokens, current step (268 / 8192):   3%|▎         | 268/8192 [00:00<03:22, 39.12it/s]\n",
+            "Prefilled 5 text tokens, generated 4 speech tokens, current step (268 / 8192):   3%|▎         | 269/8192 [00:00<09:14, 14.28it/s]\n",
+            "Prefilled 5 text tokens, generated 5 speech tokens, current step (269 / 8192):   3%|▎         | 269/8192 [00:00<09:14, 14.28it/s]\n",
+            "Prefilled 5 text tokens, generated 6 speech tokens, current step (270 / 8192):   3%|▎         | 270/8192 [00:00<09:14, 14.28it/s]\n",
+            "Prefilled 5 text tokens, generated 6 speech tokens, current step (270 / 8192):   3%|▎         | 275/8192 [00:00<06:18, 20.91it/s]\n",
+            "Prefilled 10 text tokens, generated 6 speech tokens, current step (275 / 8192):   3%|▎         | 275/8192 [00:00<06:18, 20.91it/s]\n",
+            "Prefilled 10 text tokens, generated 7 speech tokens, current step (276 / 8192):   3%|▎         | 276/8192 [00:00<06:18, 20.91it/s]\n",
+            "Prefilled 10 text tokens, generated 8 speech tokens, current step (277 / 8192):   3%|▎         | 277/8192 [00:00<06:18, 20.91it/s]\n",
+            "Prefilled 10 text tokens, generated 8 speech tokens, current step (277 / 8192):   3%|▎         | 278/8192 [00:01<08:10, 16.12it/s]\n",
+            "Prefilled 10 text tokens, generated 9 speech tokens, current step (278 / 8192):   3%|▎         | 278/8192 [00:01<08:10, 16.12it/s]\n",
+            "Prefilled 10 text tokens, generated 10 speech tokens, current step (279 / 8192):   3%|▎         | 279/8192 [00:01<08:10, 16.12it/s]\n",
+            "Prefilled 10 text tokens, generated 11 speech tokens, current step (280 / 8192):   3%|▎         | 280/8192 [00:01<08:10, 16.12it/s]\n",
+            "Prefilled 10 text tokens, generated 11 speech tokens, current step (280 / 8192):   3%|▎         | 281/8192 [00:01<09:39, 13.66it/s]\n",
+            "Prefilled 10 text tokens, generated 12 speech tokens, current step (281 / 8192):   3%|▎         | 281/8192 [00:01<09:39, 13.66it/s]\n",
+            "Prefilled 15 text tokens, generated 12 speech tokens, current step (286 / 8192):   3%|▎         | 286/8192 [00:01<09:38, 13.66it/s]\n",
+            "Prefilled 15 text tokens, generated 12 speech tokens, current step (286 / 8192):   4%|▎         | 287/8192 [00:01<06:42, 19.62it/s]\n",
+            "Prefilled 15 text tokens, generated 13 speech tokens, current step (287 / 8192):   4%|▎         | 287/8192 [00:01<06:42, 19.62it/s]\n",
+            "Prefilled 15 text tokens, generated 14 speech tokens, current step (288 / 8192):   4%|▎         | 288/8192 [00:01<06:42, 19.62it/s]\n",
+            "Prefilled 15 text tokens, generated 15 speech tokens, current step (289 / 8192):   4%|▎         | 289/8192 [00:01<06:42, 19.62it/s]\n",
+            "Prefilled 15 text tokens, generated 15 speech tokens, current step (289 / 8192):   4%|▎         | 290/8192 [00:01<09:10, 14.37it/s]\n",
+            "Prefilled 15 text tokens, generated 16 speech tokens, current step (290 / 8192):   4%|▎         | 290/8192 [00:01<09:10, 14.37it/s]\n",
+            "Prefilled 15 text tokens, generated 17 speech tokens, current step (291 / 8192):   4%|▎         | 291/8192 [00:02<09:09, 14.37it/s]\n",
+            "Prefilled 15 text tokens, generated 18 speech tokens, current step (292 / 8192):   4%|▎         | 292/8192 [00:02<09:09, 14.37it/s]\n",
+            "Prefilled 15 text tokens, generated 18 speech tokens, current step (292 / 8192):   4%|▎         | 297/8192 [00:02<07:57, 16.52it/s]\n",
+            "Prefilled 20 text tokens, generated 18 speech tokens, current step (297 / 8192):   4%|▎         | 297/8192 [00:02<07:57, 16.52it/s]\n",
+            "Prefilled 20 text tokens, generated 19 speech tokens, current step (298 / 8192):   4%|▎         | 298/8192 [00:02<07:57, 16.52it/s]\n",
+            "Prefilled 20 text tokens, generated 20 speech tokens, current step (299 / 8192):   4%|▎         | 299/8192 [00:02<07:57, 16.52it/s]\n",
+            "Prefilled 20 text tokens, generated 20 speech tokens, current step (299 / 8192):   4%|▎         | 300/8192 [00:02<09:39, 13.61it/s]\n",
+            "Prefilled 20 text tokens, generated 21 speech tokens, current step (300 / 8192):   4%|▎         | 300/8192 [00:02<09:39, 13.61it/s]\n",
+            "Prefilled 20 text tokens, generated 22 speech tokens, current step (301 / 8192):   4%|▎         | 301/8192 [00:02<09:39, 13.61it/s]\n",
+            "Prefilled 20 text tokens, generated 22 speech tokens, current step (301 / 8192):   4%|▎         | 302/8192 [00:02<10:46, 12.21it/s]\n",
+            "Prefilled 20 text tokens, generated 23 speech tokens, current step (302 / 8192):   4%|▎         | 302/8192 [00:02<10:46, 12.21it/s]\n",
+            "Prefilled 20 text tokens, generated 24 speech tokens, current step (303 / 8192):   4%|▎         | 303/8192 [00:03<10:45, 12.21it/s]\n",
+            "Prefilled 20 text tokens, generated 24 speech tokens, current step (303 / 8192):   4%|▍         | 308/8192 [00:03<08:12, 16.02it/s]\n",
+            "Prefilled 25 text tokens, generated 24 speech tokens, current step (308 / 8192):   4%|▍         | 308/8192 [00:03<08:12, 16.02it/s]\n",
+            "Prefilled 25 text tokens, generated 25 speech tokens, current step (309 / 8192):   4%|▍         | 309/8192 [00:03<08:12, 16.02it/s]\n",
+            "Prefilled 25 text tokens, generated 25 speech tokens, current step (309 / 8192):   4%|▍         | 310/8192 [00:03<09:39, 13.60it/s]\n",
+            "Prefilled 25 text tokens, generated 26 speech tokens, current step (310 / 8192):   4%|▍         | 310/8192 [00:03<09:39, 13.60it/s]\n",
+            "Prefilled 25 text tokens, generated 27 speech tokens, current step (311 / 8192):   4%|▍         | 311/8192 [00:03<09:39, 13.60it/s]\n",
+            "Prefilled 25 text tokens, generated 27 speech tokens, current step (311 / 8192):   4%|▍         | 312/8192 [00:03<11:02, 11.90it/s]\n",
+            "Prefilled 25 text tokens, generated 28 speech tokens, current step (312 / 8192):   4%|▍         | 312/8192 [00:03<11:02, 11.90it/s]\n",
+            "Prefilled 25 text tokens, generated 29 speech tokens, current step (313 / 8192):   4%|▍         | 313/8192 [00:03<11:02, 11.90it/s]\n",
+            "Prefilled 25 text tokens, generated 29 speech tokens, current step (313 / 8192):   4%|▍         | 314/8192 [00:03<12:49, 10.24it/s]\n",
+            "Prefilled 25 text tokens, generated 30 speech tokens, current step (314 / 8192):   4%|▍         | 314/8192 [00:03<12:49, 10.24it/s]\n",
+            "Prefilled 30 text tokens, generated 30 speech tokens, current step (319 / 8192):   4%|▍         | 319/8192 [00:03<12:48, 10.24it/s]\n",
+            "Prefilled 30 text tokens, generated 30 speech tokens, current step (319 / 8192):   4%|▍         | 320/8192 [00:04<09:01, 14.55it/s]\n",
+            "Prefilled 30 text tokens, generated 31 speech tokens, current step (320 / 8192):   4%|▍         | 320/8192 [00:04<09:01, 14.55it/s]\n",
+            "Prefilled 30 text tokens, generated 32 speech tokens, current step (321 / 8192):   4%|▍         | 321/8192 [00:04<09:01, 14.55it/s]\n",
+            "Prefilled 30 text tokens, generated 32 speech tokens, current step (321 / 8192):   4%|▍         | 322/8192 [00:04<10:57, 11.97it/s]\n",
+            "Prefilled 30 text tokens, generated 33 speech tokens, current step (322 / 8192):   4%|▍         | 322/8192 [00:04<10:57, 11.97it/s]\n",
+            "Prefilled 30 text tokens, generated 34 speech tokens, current step (323 / 8192):   4%|▍         | 323/8192 [00:04<10:57, 11.97it/s]\n",
+            "Prefilled 30 text tokens, generated 34 speech tokens, current step (323 / 8192):   4%|▍         | 324/8192 [00:04<11:38, 11.27it/s]\n",
+            "Prefilled 30 text tokens, generated 35 speech tokens, current step (324 / 8192):   4%|▍         | 324/8192 [00:04<11:38, 11.27it/s]\n",
+            "Prefilled 30 text tokens, generated 36 speech tokens, current step (325 / 8192):   4%|▍         | 325/8192 [00:04<11:38, 11.27it/s]\n",
+            "Prefilled 30 text tokens, generated 36 speech tokens, current step (325 / 8192):   4%|▍         | 330/8192 [00:04<07:48, 16.79it/s]\n",
+            "Prefilled 35 text tokens, generated 36 speech tokens, current step (330 / 8192):   4%|▍         | 330/8192 [00:04<07:48, 16.79it/s]\n",
+            "Prefilled 35 text tokens, generated 37 speech tokens, current step (331 / 8192):   4%|▍         | 331/8192 [00:04<07:48, 16.79it/s]\n",
+            "Prefilled 35 text tokens, generated 37 speech tokens, current step (331 / 8192):   4%|▍         | 332/8192 [00:04<08:39, 15.14it/s]\n",
+            "Prefilled 35 text tokens, generated 38 speech tokens, current step (332 / 8192):   4%|▍         | 332/8192 [00:04<08:39, 15.14it/s]\n",
+            "Prefilled 35 text tokens, generated 39 speech tokens, current step (333 / 8192):   4%|▍         | 333/8192 [00:05<08:39, 15.14it/s]\n",
+            "Prefilled 35 text tokens, generated 39 speech tokens, current step (333 / 8192):   4%|▍         | 334/8192 [00:05<09:50, 13.30it/s]\n",
+            "Prefilled 35 text tokens, generated 40 speech tokens, current step (334 / 8192):   4%|▍         | 334/8192 [00:05<09:50, 13.30it/s]\n",
+            "Prefilled 35 text tokens, generated 41 speech tokens, current step (335 / 8192):   4%|▍         | 335/8192 [00:05<09:50, 13.30it/s]\n",
+            "Prefilled 35 text tokens, generated 41 speech tokens, current step (335 / 8192):   4%|▍         | 336/8192 [00:05<10:40, 12.27it/s]\n",
+            "Prefilled 35 text tokens, generated 42 speech tokens, current step (336 / 8192):   4%|▍         | 336/8192 [00:05<10:40, 12.27it/s]\n",
+            "Prefilled 40 text tokens, generated 42 speech tokens, current step (341 / 8192):   4%|▍         | 341/8192 [00:05<10:39, 12.27it/s]\n",
+            "Prefilled 40 text tokens, generated 42 speech tokens, current step (341 / 8192):   4%|▍         | 342/8192 [00:05<06:51, 19.09it/s]\n",
+            "Prefilled 40 text tokens, generated 43 speech tokens, current step (342 / 8192):   4%|▍         | 342/8192 [00:05<06:51, 19.09it/s]\n",
+            "Prefilled 40 text tokens, generated 44 speech tokens, current step (343 / 8192):   4%|▍         | 343/8192 [00:05<06:51, 19.09it/s]\n",
+            "Prefilled 40 text tokens, generated 45 speech tokens, current step (344 / 8192):   4%|▍         | 344/8192 [00:05<06:51, 19.09it/s]\n",
+            "Prefilled 40 text tokens, generated 45 speech tokens, current step (344 / 8192):   4%|▍         | 345/8192 [00:05<08:33, 15.27it/s]\n",
+            "Prefilled 40 text tokens, generated 46 speech tokens, current step (345 / 8192):   4%|▍         | 345/8192 [00:05<08:33, 15.27it/s]\n",
+            "Prefilled 40 text tokens, generated 47 speech tokens, current step (346 / 8192):   4%|▍         | 346/8192 [00:05<08:33, 15.27it/s]\n",
+            "Prefilled 40 text tokens, generated 47 speech tokens, current step (346 / 8192):   4%|▍         | 347/8192 [00:06<09:35, 13.63it/s]\n",
+            "Prefilled 40 text tokens, generated 48 speech tokens, current step (347 / 8192):   4%|▍         | 347/8192 [00:06<09:35, 13.63it/s]\n",
+            "Prefilled 45 text tokens, generated 48 speech tokens, current step (352 / 8192):   4%|▍         | 352/8192 [00:06<09:35, 13.63it/s]\n",
+            "Prefilled 45 text tokens, generated 48 speech tokens, current step (352 / 8192):   4%|▍         | 353/8192 [00:06<06:46, 19.29it/s]\n",
+            "Prefilled 45 text tokens, generated 49 speech tokens, current step (353 / 8192):   4%|▍         | 353/8192 [00:06<06:46, 19.29it/s]\n",
+            "Prefilled 45 text tokens, generated 50 speech tokens, current step (354 / 8192):   4%|▍         | 354/8192 [00:06<06:46, 19.29it/s]\n",
+            "Prefilled 45 text tokens, generated 51 speech tokens, current step (355 / 8192):   4%|▍         | 355/8192 [00:06<06:46, 19.29it/s]\n",
+            "Prefilled 45 text tokens, generated 51 speech tokens, current step (355 / 8192):   4%|▍         | 356/8192 [00:06<08:28, 15.42it/s]\n",
+            "Prefilled 45 text tokens, generated 52 speech tokens, current step (356 / 8192):   4%|▍         | 356/8192 [00:06<08:28, 15.42it/s]\n",
+            "Prefilled 45 text tokens, generated 53 speech tokens, current step (357 / 8192):   4%|▍         | 357/8192 [00:06<08:28, 15.42it/s]\n",
+            "Prefilled 45 text tokens, generated 53 speech tokens, current step (357 / 8192):   4%|▍         | 358/8192 [00:06<09:32, 13.69it/s]\n",
+            "Prefilled 45 text tokens, generated 54 speech tokens, current step (358 / 8192):   4%|▍         | 358/8192 [00:06<09:32, 13.69it/s]\n",
+            "Prefilled 50 text tokens, generated 54 speech tokens, current step (363 / 8192):   4%|▍         | 363/8192 [00:06<09:32, 13.69it/s]\n",
+            "Prefilled 50 text tokens, generated 54 speech tokens, current step (363 / 8192):   4%|▍         | 364/8192 [00:06<06:40, 19.55it/s]\n",
+            "Prefilled 50 text tokens, generated 55 speech tokens, current step (364 / 8192):   4%|▍         | 364/8192 [00:06<06:40, 19.55it/s]\n",
+            "Prefilled 50 text tokens, generated 56 speech tokens, current step (365 / 8192):   4%|▍         | 365/8192 [00:06<06:40, 19.55it/s]\n",
+            "Prefilled 50 text tokens, generated 57 speech tokens, current step (366 / 8192):   4%|▍         | 366/8192 [00:07<06:40, 19.55it/s]\n",
+            "Prefilled 50 text tokens, generated 57 speech tokens, current step (366 / 8192):   4%|▍         | 367/8192 [00:07<08:29, 15.36it/s]\n",
+            "Prefilled 50 text tokens, generated 58 speech tokens, current step (367 / 8192):   4%|▍         | 367/8192 [00:07<08:29, 15.36it/s]\n",
+            "Prefilled 50 text tokens, generated 59 speech tokens, current step (368 / 8192):   4%|▍         | 368/8192 [00:07<08:29, 15.36it/s]\n",
+            "Prefilled 50 text tokens, generated 59 speech tokens, current step (368 / 8192):   5%|▍         | 369/8192 [00:07<09:21, 13.92it/s]\n",
+            "Prefilled 50 text tokens, generated 60 speech tokens, current step (369 / 8192):   5%|▍         | 369/8192 [00:07<09:21, 13.92it/s]\n",
+            "Prefilled 55 text tokens, generated 60 speech tokens, current step (374 / 8192):   5%|▍         | 374/8192 [00:07<09:21, 13.92it/s]\n",
+            "Prefilled 55 text tokens, generated 60 speech tokens, current step (374 / 8192):   5%|▍         | 375/8192 [00:07<06:32, 19.90it/s]\n",
+            "Prefilled 55 text tokens, generated 61 speech tokens, current step (375 / 8192):   5%|▍         | 375/8192 [00:07<06:32, 19.90it/s]\n",
+            "Prefilled 55 text tokens, generated 62 speech tokens, current step (376 / 8192):   5%|▍         | 376/8192 [00:07<06:32, 19.90it/s]\n",
+            "Prefilled 55 text tokens, generated 63 speech tokens, current step (377 / 8192):   5%|▍         | 377/8192 [00:07<06:32, 19.90it/s]\n",
+            "Prefilled 55 text tokens, generated 63 speech tokens, current step (377 / 8192):   5%|▍         | 378/8192 [00:07<08:14, 15.81it/s]\n",
+            "Prefilled 55 text tokens, generated 64 speech tokens, current step (378 / 8192):   5%|▍         | 378/8192 [00:07<08:14, 15.81it/s]\n",
+            "Prefilled 55 text tokens, generated 65 speech tokens, current step (379 / 8192):   5%|▍         | 379/8192 [00:07<08:14, 15.81it/s]\n",
+            "Prefilled 55 text tokens, generated 65 speech tokens, current step (379 / 8192):   5%|▍         | 380/8192 [00:08<09:13, 14.11it/s]\n",
+            "Prefilled 55 text tokens, generated 66 speech tokens, current step (380 / 8192):   5%|▍         | 380/8192 [00:08<09:13, 14.11it/s]\n",
+            "Prefilled 60 text tokens, generated 66 speech tokens, current step (385 / 8192):   5%|▍         | 385/8192 [00:08<09:13, 14.11it/s]\n",
+            "Prefilled 60 text tokens, generated 66 speech tokens, current step (385 / 8192):   5%|▍         | 386/8192 [00:08<06:32, 19.90it/s]\n",
+            "Prefilled 60 text tokens, generated 67 speech tokens, current step (386 / 8192):   5%|▍         | 386/8192 [00:08<06:32, 19.90it/s]\n",
+            "Prefilled 60 text tokens, generated 68 speech tokens, current step (387 / 8192):   5%|▍         | 387/8192 [00:08<06:32, 19.90it/s]\n",
+            "Prefilled 60 text tokens, generated 69 speech tokens, current step (388 / 8192):   5%|▍         | 388/8192 [00:08<06:32, 19.90it/s]\n",
+            "Prefilled 60 text tokens, generated 69 speech tokens, current step (388 / 8192):   5%|▍         | 389/8192 [00:08<08:12, 15.85it/s]\n",
+            "Prefilled 60 text tokens, generated 70 speech tokens, current step (389 / 8192):   5%|▍         | 389/8192 [00:08<08:12, 15.85it/s]\n",
+            "Prefilled 60 text tokens, generated 71 speech tokens, current step (390 / 8192):   5%|▍         | 390/8192 [00:08<08:12, 15.85it/s]\n",
+            "Prefilled 60 text tokens, generated 71 speech tokens, current step (390 / 8192):   5%|▍         | 391/8192 [00:08<09:11, 14.15it/s]\n",
+            "Prefilled 60 text tokens, generated 72 speech tokens, current step (391 / 8192):   5%|▍         | 391/8192 [00:08<09:11, 14.15it/s]\n",
+            "Prefilled 65 text tokens, generated 72 speech tokens, current step (396 / 8192):   5%|▍         | 396/8192 [00:08<09:11, 14.15it/s]\n",
+            "Prefilled 65 text tokens, generated 72 speech tokens, current step (396 / 8192):   5%|▍         | 397/8192 [00:08<06:24, 20.28it/s]\n",
+            "Prefilled 65 text tokens, generated 73 speech tokens, current step (397 / 8192):   5%|▍         | 397/8192 [00:08<06:24, 20.28it/s]\n",
+            "Prefilled 65 text tokens, generated 74 speech tokens, current step (398 / 8192):   5%|▍         | 398/8192 [00:08<06:24, 20.28it/s]\n",
+            "Prefilled 65 text tokens, generated 75 speech tokens, current step (399 / 8192):   5%|▍         | 399/8192 [00:09<06:24, 20.28it/s]\n",
+            "Prefilled 65 text tokens, generated 75 speech tokens, current step (399 / 8192):   5%|▍         | 400/8192 [00:09<08:04, 16.10it/s]\n",
+            "Prefilled 65 text tokens, generated 76 speech tokens, current step (400 / 8192):   5%|▍         | 400/8192 [00:09<08:04, 16.10it/s]\n",
+            "Prefilled 65 text tokens, generated 77 speech tokens, current step (401 / 8192):   5%|▍         | 401/8192 [00:09<08:03, 16.10it/s]\n",
+            "Prefilled 65 text tokens, generated 78 speech tokens, current step (402 / 8192):   5%|▍         | 402/8192 [00:09<08:03, 16.10it/s]\n",
+            "Prefilled 65 text tokens, generated 78 speech tokens, current step (402 / 8192):   5%|▍         | 406/8192 [00:09<07:14, 17.93it/s]\n",
+            "Prefilled 69 text tokens, generated 78 speech tokens, current step (406 / 8192):   5%|▍         | 406/8192 [00:09<07:14, 17.93it/s]\n",
+            "Prefilled 69 text tokens, generated 79 speech tokens, current step (407 / 8192):   5%|▍         | 407/8192 [00:09<07:14, 17.93it/s]\n",
+            "Prefilled 69 text tokens, generated 80 speech tokens, current step (408 / 8192):   5%|▍         | 408/8192 [00:09<07:14, 17.93it/s]\n",
+            "Prefilled 69 text tokens, generated 80 speech tokens, current step (408 / 8192):   5%|▍         | 409/8192 [00:09<08:25, 15.40it/s]\n",
+            "Prefilled 69 text tokens, generated 81 speech tokens, current step (409 / 8192):   5%|▍         | 409/8192 [00:09<08:25, 15.40it/s]\n",
+            "Prefilled 69 text tokens, generated 82 speech tokens, current step (410 / 8192):   5%|▌         | 410/8192 [00:09<08:25, 15.40it/s]\n",
+            "Prefilled 69 text tokens, generated 82 speech tokens, current step (410 / 8192):   5%|▌         | 411/8192 [00:09<09:19, 13.91it/s]\n",
+            "Prefilled 69 text tokens, generated 83 speech tokens, current step (411 / 8192):   5%|▌         | 411/8192 [00:09<09:19, 13.91it/s]\n",
+            "Prefilled 69 text tokens, generated 84 speech tokens, current step (412 / 8192):   5%|▌         | 412/8192 [00:10<09:19, 13.91it/s]\n",
+            "Prefilled 69 text tokens, generated 84 speech tokens, current step (412 / 8192):   5%|▌         | 413/8192 [00:10<10:14, 12.66it/s]\n",
+            "Prefilled 69 text tokens, generated 85 speech tokens, current step (413 / 8192):   5%|▌         | 413/8192 [00:10<10:14, 12.66it/s]\n",
+            "Prefilled 69 text tokens, generated 86 speech tokens, current step (414 / 8192):   5%|▌         | 414/8192 [00:10<10:14, 12.66it/s]\n",
+            "Prefilled 69 text tokens, generated 86 speech tokens, current step (414 / 8192):   5%|▌         | 415/8192 [00:10<11:04, 11.69it/s]\n",
+            "Prefilled 69 text tokens, generated 87 speech tokens, current step (415 / 8192):   5%|▌         | 415/8192 [00:10<11:04, 11.69it/s]\n",
+            "Prefilled 69 text tokens, generated 88 speech tokens, current step (416 / 8192):   5%|▌         | 416/8192 [00:10<11:04, 11.69it/s]\n",
+            "Prefilled 69 text tokens, generated 88 speech tokens, current step (416 / 8192):   5%|▌         | 417/8192 [00:10<11:36, 11.17it/s]\n",
+            "Prefilled 69 text tokens, generated 89 speech tokens, current step (417 / 8192):   5%|▌         | 417/8192 [00:10<11:36, 11.17it/s]\n",
+            "Prefilled 69 text tokens, generated 90 speech tokens, current step (418 / 8192):   5%|▌         | 418/8192 [00:10<11:36, 11.17it/s]\n",
+            "Prefilled 69 text tokens, generated 90 speech tokens, current step (418 / 8192):   5%|▌         | 419/8192 [00:10<12:08, 10.67it/s]\n",
+            "Prefilled 69 text tokens, generated 91 speech tokens, current step (419 / 8192):   5%|▌         | 419/8192 [00:10<12:08, 10.67it/s]\n",
+            "Prefilled 69 text tokens, generated 92 speech tokens, current step (420 / 8192):   5%|▌         | 420/8192 [00:10<12:08, 10.67it/s]\n",
+            "Prefilled 69 text tokens, generated 92 speech tokens, current step (420 / 8192):   5%|▌         | 421/8192 [00:11<12:30, 10.36it/s]\n",
+            "Prefilled 69 text tokens, generated 93 speech tokens, current step (421 / 8192):   5%|▌         | 421/8192 [00:11<12:30, 10.36it/s]\n",
+            "Prefilled 69 text tokens, generated 94 speech tokens, current step (422 / 8192):   5%|▌         | 422/8192 [00:11<12:30, 10.36it/s]\n",
+            "Prefilled 69 text tokens, generated 94 speech tokens, current step (422 / 8192):   5%|▌         | 423/8192 [00:11<12:51, 10.08it/s]\n",
+            "Prefilled 69 text tokens, generated 95 speech tokens, current step (423 / 8192):   5%|▌         | 423/8192 [00:11<12:51, 10.08it/s]\n",
+            "Prefilled 69 text tokens, generated 96 speech tokens, current step (424 / 8192):   5%|▌         | 424/8192 [00:11<12:51, 10.08it/s]\n",
+            "Prefilled 69 text tokens, generated 96 speech tokens, current step (424 / 8192):   5%|▌         | 425/8192 [00:11<13:04,  9.90it/s]\n",
+            "Prefilled 69 text tokens, generated 97 speech tokens, current step (425 / 8192):   5%|▌         | 425/8192 [00:11<13:04,  9.90it/s]\n",
+            "Prefilled 69 text tokens, generated 97 speech tokens, current step (425 / 8192):   5%|▌         | 426/8192 [00:11<13:03,  9.91it/s]\n",
+            "Prefilled 69 text tokens, generated 98 speech tokens, current step (426 / 8192):   5%|▌         | 426/8192 [00:11<13:03,  9.91it/s]\n",
+            "Prefilled 69 text tokens, generated 98 speech tokens, current step (426 / 8192):   5%|▌         | 427/8192 [00:11<13:12,  9.80it/s]\n",
+            "Prefilled 69 text tokens, generated 99 speech tokens, current step (427 / 8192):   5%|▌         | 427/8192 [00:11<13:12,  9.80it/s]\n",
+            "Prefilled 69 text tokens, generated 99 speech tokens, current step (427 / 8192):   5%|▌         | 428/8192 [00:11<13:18,  9.73it/s]\n",
+            "Prefilled 69 text tokens, generated 100 speech tokens, current step (428 / 8192):   5%|▌         | 428/8192 [00:11<13:18,  9.73it/s]\n",
+            "Prefilled 69 text tokens, generated 100 speech tokens, current step (428 / 8192):   5%|▌         | 429/8192 [00:11<13:15,  9.76it/s]\n",
+            "Prefilled 69 text tokens, generated 101 speech tokens, current step (429 / 8192):   5%|▌         | 429/8192 [00:11<13:15,  9.76it/s]\n",
+            "Prefilled 69 text tokens, generated 101 speech tokens, current step (429 / 8192):   5%|▌         | 430/8192 [00:11<13:18,  9.72it/s]\n",
+            "Prefilled 69 text tokens, generated 102 speech tokens, current step (430 / 8192):   5%|▌         | 430/8192 [00:11<13:18,  9.72it/s]\n",
+            "Prefilled 69 text tokens, generated 102 speech tokens, current step (430 / 8192):   5%|▌         | 431/8192 [00:12<13:18,  9.71it/s]\n",
+            "Prefilled 69 text tokens, generated 103 speech tokens, current step (431 / 8192):   5%|▌         | 431/8192 [00:12<13:18,  9.71it/s]\n",
+            "Prefilled 69 text tokens, generated 103 speech tokens, current step (431 / 8192):   5%|▌         | 432/8192 [00:12<13:18,  9.72it/s]\n",
+            "Prefilled 69 text tokens, generated 104 speech tokens, current step (432 / 8192):   5%|▌         | 432/8192 [00:12<13:18,  9.72it/s]\n",
+            "Prefilled 69 text tokens, generated 104 speech tokens, current step (432 / 8192):   5%|▌         | 433/8192 [00:12<13:31,  9.56it/s]\n",
+            "Prefilled 69 text tokens, generated 105 speech tokens, current step (433 / 8192):   5%|▌         | 433/8192 [00:12<13:31,  9.56it/s]\n",
+            "Prefilled 69 text tokens, generated 105 speech tokens, current step (433 / 8192):   5%|▌         | 434/8192 [00:12<13:52,  9.32it/s]\n",
+            "Prefilled 69 text tokens, generated 106 speech tokens, current step (434 / 8192):   5%|▌         | 434/8192 [00:12<13:52,  9.32it/s]\n",
+            "Prefilled 69 text tokens, generated 106 speech tokens, current step (434 / 8192):   5%|▌         | 435/8192 [00:12<13:48,  9.36it/s]\n",
+            "Prefilled 69 text tokens, generated 107 speech tokens, current step (435 / 8192):   5%|▌         | 435/8192 [00:12<13:48,  9.36it/s]\n",
+            "Prefilled 69 text tokens, generated 107 speech tokens, current step (435 / 8192):   5%|▌         | 436/8192 [00:12<13:39,  9.46it/s]\n",
+            "Prefilled 69 text tokens, generated 108 speech tokens, current step (436 / 8192):   5%|▌         | 436/8192 [00:12<13:39,  9.46it/s]\n",
+            "Prefilled 69 text tokens, generated 108 speech tokens, current step (436 / 8192):   5%|▌         | 437/8192 [00:12<13:34,  9.52it/s]\n",
+            "Prefilled 69 text tokens, generated 109 speech tokens, current step (437 / 8192):   5%|▌         | 437/8192 [00:12<13:34,  9.52it/s]\n",
+            "Prefilled 69 text tokens, generated 109 speech tokens, current step (437 / 8192):   5%|▌         | 438/8192 [00:12<13:31,  9.55it/s]\n",
+            "Prefilled 69 text tokens, generated 110 speech tokens, current step (438 / 8192):   5%|▌         | 438/8192 [00:12<13:31,  9.55it/s]\n",
+            "Prefilled 69 text tokens, generated 110 speech tokens, current step (438 / 8192):   5%|▌         | 439/8192 [00:12<13:22,  9.67it/s]\n",
+            "Prefilled 69 text tokens, generated 111 speech tokens, current step (439 / 8192):   5%|▌         | 439/8192 [00:12<13:22,  9.67it/s]\n",
+            "Prefilled 69 text tokens, generated 111 speech tokens, current step (439 / 8192):   5%|▌         | 440/8192 [00:13<13:15,  9.74it/s]\n",
+            "Prefilled 69 text tokens, generated 112 speech tokens, current step (440 / 8192):   5%|▌         | 440/8192 [00:13<13:15,  9.74it/s]\n",
+            "Prefilled 69 text tokens, generated 112 speech tokens, current step (440 / 8192):   5%|▌         | 441/8192 [00:13<13:18,  9.70it/s]\n",
+            "Prefilled 69 text tokens, generated 113 speech tokens, current step (441 / 8192):   5%|▌         | 441/8192 [00:13<13:18,  9.70it/s]\n",
+            "Prefilled 69 text tokens, generated 113 speech tokens, current step (441 / 8192):   5%|▌         | 442/8192 [00:13<13:23,  9.64it/s]\n",
+            "Prefilled 69 text tokens, generated 114 speech tokens, current step (442 / 8192):   5%|▌         | 442/8192 [00:13<13:23,  9.64it/s]\n",
+            "Prefilled 69 text tokens, generated 114 speech tokens, current step (442 / 8192):   5%|▌         | 443/8192 [00:13<13:19,  9.69it/s]\n",
+            "Prefilled 69 text tokens, generated 115 speech tokens, current step (443 / 8192):   5%|▌         | 443/8192 [00:13<13:19,  9.69it/s]\n",
+            "Prefilled 69 text tokens, generated 115 speech tokens, current step (443 / 8192):   5%|▌         | 444/8192 [00:13<13:54,  9.29it/s]\n",
+            "Prefilled 69 text tokens, generated 116 speech tokens, current step (444 / 8192):   5%|▌         | 444/8192 [00:13<13:54,  9.29it/s]\n",
+            "Prefilled 69 text tokens, generated 116 speech tokens, current step (444 / 8192):   5%|▌         | 445/8192 [00:13<13:56,  9.26it/s]\n",
+            "Prefilled 69 text tokens, generated 117 speech tokens, current step (445 / 8192):   5%|▌         | 445/8192 [00:13<13:56,  9.26it/s]\n",
+            "Prefilled 69 text tokens, generated 117 speech tokens, current step (445 / 8192):   5%|▌         | 446/8192 [00:13<14:03,  9.19it/s]\n",
+            "Prefilled 69 text tokens, generated 118 speech tokens, current step (446 / 8192):   5%|▌         | 446/8192 [00:13<14:03,  9.19it/s]\n",
+            "Prefilled 69 text tokens, generated 118 speech tokens, current step (446 / 8192):   5%|▌         | 447/8192 [00:13<13:59,  9.23it/s]\n",
+            "Prefilled 69 text tokens, generated 119 speech tokens, current step (447 / 8192):   5%|▌         | 447/8192 [00:13<13:59,  9.23it/s]\n",
+            "Prefilled 69 text tokens, generated 119 speech tokens, current step (447 / 8192):   5%|▌         | 448/8192 [00:13<13:50,  9.33it/s]\n",
+            "Prefilled 69 text tokens, generated 120 speech tokens, current step (448 / 8192):   5%|▌         | 448/8192 [00:13<13:50,  9.33it/s]\n",
+            "Prefilled 69 text tokens, generated 120 speech tokens, current step (448 / 8192):   5%|▌         | 449/8192 [00:13<13:43,  9.41it/s]\n",
+            "Prefilled 69 text tokens, generated 121 speech tokens, current step (449 / 8192):   5%|▌         | 449/8192 [00:13<13:43,  9.41it/s]\n",
+            "Prefilled 69 text tokens, generated 121 speech tokens, current step (449 / 8192):   5%|▌         | 450/8192 [00:14<13:39,  9.45it/s]\n",
+            "Prefilled 69 text tokens, generated 122 speech tokens, current step (450 / 8192):   5%|▌         | 450/8192 [00:14<13:39,  9.45it/s]\n",
+            "Prefilled 69 text tokens, generated 122 speech tokens, current step (450 / 8192):   6%|▌         | 451/8192 [00:14<13:41,  9.42it/s]\n",
+            "Prefilled 69 text tokens, generated 123 speech tokens, current step (451 / 8192):   6%|▌         | 451/8192 [00:14<13:41,  9.42it/s]\n",
+            "Prefilled 69 text tokens, generated 123 speech tokens, current step (451 / 8192):   6%|▌         | 452/8192 [00:14<13:51,  9.31it/s]\n",
+            "Prefilled 69 text tokens, generated 124 speech tokens, current step (452 / 8192):   6%|▌         | 452/8192 [00:14<13:51,  9.31it/s]\n",
+            "Prefilled 69 text tokens, generated 124 speech tokens, current step (452 / 8192):   6%|▌         | 453/8192 [00:14<14:39,  8.80it/s]\n",
+            "Prefilled 69 text tokens, generated 125 speech tokens, current step (453 / 8192):   6%|▌         | 453/8192 [00:14<14:39,  8.80it/s]\n",
+            "Prefilled 69 text tokens, generated 125 speech tokens, current step (453 / 8192):   6%|▌         | 454/8192 [00:14<15:39,  8.24it/s]\n",
+            "Prefilled 69 text tokens, generated 126 speech tokens, current step (454 / 8192):   6%|▌         | 454/8192 [00:14<15:39,  8.24it/s]\n",
+            "\n",
+            "INFO:     connection closed\n"
+          ]
+        }
+      ],
       "source": [
         "import subprocess, re, time, threading\n",
         "\n",
@@ -189,10 +1174,10 @@
     "accelerator": "GPU",
     "colab": {
       "gpuType": "T4",
-      "include_colab_link": true,
       "machine_shape": "hm",
       "name": "VibeVoice_Colab.ipynb",
-      "provenance": []
+      "provenance": [],
+      "include_colab_link": true
     },
     "kernelspec": {
       "display_name": "Python 3",
@@ -209,8 +1194,3351 @@
       "nbconvert_exporter": "python",
       "pygments_lexer": "ipython3",
       "version": "3.10.11"
+    },
+    "widgets": {
+      "application/vnd.jupyter.widget-state+json": {
+        "6aa0514fe8e74f87a8d25e2a3ec7b249": {
+          "model_module": "@jupyter-widgets/controls",
+          "model_name": "HBoxModel",
+          "model_module_version": "1.5.0",
+          "state": {
+            "_dom_classes": [],
+            "_model_module": "@jupyter-widgets/controls",
+            "_model_module_version": "1.5.0",
+            "_model_name": "HBoxModel",
+            "_view_count": null,
+            "_view_module": "@jupyter-widgets/controls",
+            "_view_module_version": "1.5.0",
+            "_view_name": "HBoxView",
+            "box_style": "",
+            "children": [
+              "IPY_MODEL_2e77995f5e9b4c9d93a1e50482e63464",
+              "IPY_MODEL_5bddb298cd604fbba0776657ef807664",
+              "IPY_MODEL_398d6a88664b44c89b06610a1b5eb33e"
+            ],
+            "layout": "IPY_MODEL_23e9f1b01aa6454bb8f63b74aaa333f5"
+          }
+        },
+        "2e77995f5e9b4c9d93a1e50482e63464": {
+          "model_module": "@jupyter-widgets/controls",
+          "model_name": "HTMLModel",
+          "model_module_version": "1.5.0",
+          "state": {
+            "_dom_classes": [],
+            "_model_module": "@jupyter-widgets/controls",
+            "_model_module_version": "1.5.0",
+            "_model_name": "HTMLModel",
+            "_view_count": null,
+            "_view_module": "@jupyter-widgets/controls",
+            "_view_module_version": "1.5.0",
+            "_view_name": "HTMLView",
+            "description": "",
+            "description_tooltip": null,
+            "layout": "IPY_MODEL_411a5e8e282b4257b561655c637836ab",
+            "placeholder": "​",
+            "style": "IPY_MODEL_a85f891d3eb946fa94af2eff7024bc76",
+            "value": "Fetching 6 files: 100%"
+          }
+        },
+        "5bddb298cd604fbba0776657ef807664": {
+          "model_module": "@jupyter-widgets/controls",
+          "model_name": "FloatProgressModel",
+          "model_module_version": "1.5.0",
+          "state": {
+            "_dom_classes": [],
+            "_model_module": "@jupyter-widgets/controls",
+            "_model_module_version": "1.5.0",
+            "_model_name": "FloatProgressModel",
+            "_view_count": null,
+            "_view_module": "@jupyter-widgets/controls",
+            "_view_module_version": "1.5.0",
+            "_view_name": "ProgressView",
+            "bar_style": "success",
+            "description": "",
+            "description_tooltip": null,
+            "layout": "IPY_MODEL_f112df2ccc7b4861a27f5336d38ac86f",
+            "max": 6,
+            "min": 0,
+            "orientation": "horizontal",
+            "style": "IPY_MODEL_24d904f0c7f94a749af6d440b475bdeb",
+            "value": 6
+          }
+        },
+        "398d6a88664b44c89b06610a1b5eb33e": {
+          "model_module": "@jupyter-widgets/controls",
+          "model_name": "HTMLModel",
+          "model_module_version": "1.5.0",
+          "state": {
+            "_dom_classes": [],
+            "_model_module": "@jupyter-widgets/controls",
+            "_model_module_version": "1.5.0",
+            "_model_name": "HTMLModel",
+            "_view_count": null,
+            "_view_module": "@jupyter-widgets/controls",
+            "_view_module_version": "1.5.0",
+            "_view_name": "HTMLView",
+            "description": "",
+            "description_tooltip": null,
+            "layout": "IPY_MODEL_5e994c7530c64e8ab571751a12684217",
+            "placeholder": "​",
+            "style": "IPY_MODEL_52eb275fb2ef41e1ba008baef9378dfe",
+            "value": " 6/6 [00:15&lt;00:00,  4.20s/it]"
+          }
+        },
+        "23e9f1b01aa6454bb8f63b74aaa333f5": {
+          "model_module": "@jupyter-widgets/base",
+          "model_name": "LayoutModel",
+          "model_module_version": "1.2.0",
+          "state": {
+            "_model_module": "@jupyter-widgets/base",
+            "_model_module_version": "1.2.0",
+            "_model_name": "LayoutModel",
+            "_view_count": null,
+            "_view_module": "@jupyter-widgets/base",
+            "_view_module_version": "1.2.0",
+            "_view_name": "LayoutView",
+            "align_content": null,
+            "align_items": null,
+            "align_self": null,
+            "border": null,
+            "bottom": null,
+            "display": null,
+            "flex": null,
+            "flex_flow": null,
+            "grid_area": null,
+            "grid_auto_columns": null,
+            "grid_auto_flow": null,
+            "grid_auto_rows": null,
+            "grid_column": null,
+            "grid_gap": null,
+            "grid_row": null,
+            "grid_template_areas": null,
+            "grid_template_columns": null,
+            "grid_template_rows": null,
+            "height": null,
+            "justify_content": null,
+            "justify_items": null,
+            "left": null,
+            "margin": null,
+            "max_height": null,
+            "max_width": null,
+            "min_height": null,
+            "min_width": null,
+            "object_fit": null,
+            "object_position": null,
+            "order": null,
+            "overflow": null,
+            "overflow_x": null,
+            "overflow_y": null,
+            "padding": null,
+            "right": null,
+            "top": null,
+            "visibility": null,
+            "width": null
+          }
+        },
+        "411a5e8e282b4257b561655c637836ab": {
+          "model_module": "@jupyter-widgets/base",
+          "model_name": "LayoutModel",
+          "model_module_version": "1.2.0",
+          "state": {
+            "_model_module": "@jupyter-widgets/base",
+            "_model_module_version": "1.2.0",
+            "_model_name": "LayoutModel",
+            "_view_count": null,
+            "_view_module": "@jupyter-widgets/base",
+            "_view_module_version": "1.2.0",
+            "_view_name": "LayoutView",
+            "align_content": null,
+            "align_items": null,
+            "align_self": null,
+            "border": null,
+            "bottom": null,
+            "display": null,
+            "flex": null,
+            "flex_flow": null,
+            "grid_area": null,
+            "grid_auto_columns": null,
+            "grid_auto_flow": null,
+            "grid_auto_rows": null,
+            "grid_column": null,
+            "grid_gap": null,
+            "grid_row": null,
+            "grid_template_areas": null,
+            "grid_template_columns": null,
+            "grid_template_rows": null,
+            "height": null,
+            "justify_content": null,
+            "justify_items": null,
+            "left": null,
+            "margin": null,
+            "max_height": null,
+            "max_width": null,
+            "min_height": null,
+            "min_width": null,
+            "object_fit": null,
+            "object_position": null,
+            "order": null,
+            "overflow": null,
+            "overflow_x": null,
+            "overflow_y": null,
+            "padding": null,
+            "right": null,
+            "top": null,
+            "visibility": null,
+            "width": null
+          }
+        },
+        "a85f891d3eb946fa94af2eff7024bc76": {
+          "model_module": "@jupyter-widgets/controls",
+          "model_name": "DescriptionStyleModel",
+          "model_module_version": "1.5.0",
+          "state": {
+            "_model_module": "@jupyter-widgets/controls",
+            "_model_module_version": "1.5.0",
+            "_model_name": "DescriptionStyleModel",
+            "_view_count": null,
+            "_view_module": "@jupyter-widgets/base",
+            "_view_module_version": "1.2.0",
+            "_view_name": "StyleView",
+            "description_width": ""
+          }
+        },
+        "f112df2ccc7b4861a27f5336d38ac86f": {
+          "model_module": "@jupyter-widgets/base",
+          "model_name": "LayoutModel",
+          "model_module_version": "1.2.0",
+          "state": {
+            "_model_module": "@jupyter-widgets/base",
+            "_model_module_version": "1.2.0",
+            "_model_name": "LayoutModel",
+            "_view_count": null,
+            "_view_module": "@jupyter-widgets/base",
+            "_view_module_version": "1.2.0",
+            "_view_name": "LayoutView",
+            "align_content": null,
+            "align_items": null,
+            "align_self": null,
+            "border": null,
+            "bottom": null,
+            "display": null,
+            "flex": null,
+            "flex_flow": null,
+            "grid_area": null,
+            "grid_auto_columns": null,
+            "grid_auto_flow": null,
+            "grid_auto_rows": null,
+            "grid_column": null,
+            "grid_gap": null,
+            "grid_row": null,
+            "grid_template_areas": null,
+            "grid_template_columns": null,
+            "grid_template_rows": null,
+            "height": null,
+            "justify_content": null,
+            "justify_items": null,
+            "left": null,
+            "margin": null,
+            "max_height": null,
+            "max_width": null,
+            "min_height": null,
+            "min_width": null,
+            "object_fit": null,
+            "object_position": null,
+            "order": null,
+            "overflow": null,
+            "overflow_x": null,
+            "overflow_y": null,
+            "padding": null,
+            "right": null,
+            "top": null,
+            "visibility": null,
+            "width": null
+          }
+        },
+        "24d904f0c7f94a749af6d440b475bdeb": {
+          "model_module": "@jupyter-widgets/controls",
+          "model_name": "ProgressStyleModel",
+          "model_module_version": "1.5.0",
+          "state": {
+            "_model_module": "@jupyter-widgets/controls",
+            "_model_module_version": "1.5.0",
+            "_model_name": "ProgressStyleModel",
+            "_view_count": null,
+            "_view_module": "@jupyter-widgets/base",
+            "_view_module_version": "1.2.0",
+            "_view_name": "StyleView",
+            "bar_color": null,
+            "description_width": ""
+          }
+        },
+        "5e994c7530c64e8ab571751a12684217": {
+          "model_module": "@jupyter-widgets/base",
+          "model_name": "LayoutModel",
+          "model_module_version": "1.2.0",
+          "state": {
+            "_model_module": "@jupyter-widgets/base",
+            "_model_module_version": "1.2.0",
+            "_model_name": "LayoutModel",
+            "_view_count": null,
+            "_view_module": "@jupyter-widgets/base",
+            "_view_module_version": "1.2.0",
+            "_view_name": "LayoutView",
+            "align_content": null,
+            "align_items": null,
+            "align_self": null,
+            "border": null,
+            "bottom": null,
+            "display": null,
+            "flex": null,
+            "flex_flow": null,
+            "grid_area": null,
+            "grid_auto_columns": null,
+            "grid_auto_flow": null,
+            "grid_auto_rows": null,
+            "grid_column": null,
+            "grid_gap": null,
+            "grid_row": null,
+            "grid_template_areas": null,
+            "grid_template_columns": null,
+            "grid_template_rows": null,
+            "height": null,
+            "justify_content": null,
+            "justify_items": null,
+            "left": null,
+            "margin": null,
+            "max_height": null,
+            "max_width": null,
+            "min_height": null,
+            "min_width": null,
+            "object_fit": null,
+            "object_position": null,
+            "order": null,
+            "overflow": null,
+            "overflow_x": null,
+            "overflow_y": null,
+            "padding": null,
+            "right": null,
+            "top": null,
+            "visibility": null,
+            "width": null
+          }
+        },
+        "52eb275fb2ef41e1ba008baef9378dfe": {
+          "model_module": "@jupyter-widgets/controls",
+          "model_name": "DescriptionStyleModel",
+          "model_module_version": "1.5.0",
+          "state": {
+            "_model_module": "@jupyter-widgets/controls",
+            "_model_module_version": "1.5.0",
+            "_model_name": "DescriptionStyleModel",
+            "_view_count": null,
+            "_view_module": "@jupyter-widgets/base",
+            "_view_module_version": "1.2.0",
+            "_view_name": "StyleView",
+            "description_width": ""
+          }
+        },
+        "0d8d3ac2411048a7b846835d60e4f23d": {
+          "model_module": "@jupyter-widgets/controls",
+          "model_name": "HBoxModel",
+          "model_module_version": "1.5.0",
+          "state": {
+            "_dom_classes": [],
+            "_model_module": "@jupyter-widgets/controls",
+            "_model_module_version": "1.5.0",
+            "_model_name": "HBoxModel",
+            "_view_count": null,
+            "_view_module": "@jupyter-widgets/controls",
+            "_view_module_version": "1.5.0",
+            "_view_name": "HBoxView",
+            "box_style": "",
+            "children": [
+              "IPY_MODEL_bc3d23550b01450e94574975277bf5a2",
+              "IPY_MODEL_0df051569bd540b7a19e3aefdc69f7cd",
+              "IPY_MODEL_b4351182f3b7462cbf915b26863cf4de"
+            ],
+            "layout": "IPY_MODEL_dae8d2fe62bd41ea9d99c9ccc817de46"
+          }
+        },
+        "bc3d23550b01450e94574975277bf5a2": {
+          "model_module": "@jupyter-widgets/controls",
+          "model_name": "HTMLModel",
+          "model_module_version": "1.5.0",
+          "state": {
+            "_dom_classes": [],
+            "_model_module": "@jupyter-widgets/controls",
+            "_model_module_version": "1.5.0",
+            "_model_name": "HTMLModel",
+            "_view_count": null,
+            "_view_module": "@jupyter-widgets/controls",
+            "_view_module_version": "1.5.0",
+            "_view_name": "HTMLView",
+            "description": "",
+            "description_tooltip": null,
+            "layout": "IPY_MODEL_e35dd504906745b28846c07a644c3423",
+            "placeholder": "​",
+            "style": "IPY_MODEL_8171a7d8dcb9432881aa56fb52743e3d",
+            "value": "figures/Fig1.png: 100%"
+          }
+        },
+        "0df051569bd540b7a19e3aefdc69f7cd": {
+          "model_module": "@jupyter-widgets/controls",
+          "model_name": "FloatProgressModel",
+          "model_module_version": "1.5.0",
+          "state": {
+            "_dom_classes": [],
+            "_model_module": "@jupyter-widgets/controls",
+            "_model_module_version": "1.5.0",
+            "_model_name": "FloatProgressModel",
+            "_view_count": null,
+            "_view_module": "@jupyter-widgets/controls",
+            "_view_module_version": "1.5.0",
+            "_view_name": "ProgressView",
+            "bar_style": "success",
+            "description": "",
+            "description_tooltip": null,
+            "layout": "IPY_MODEL_2058d4fb6b1745a2a971491fcc747244",
+            "max": 123543,
+            "min": 0,
+            "orientation": "horizontal",
+            "style": "IPY_MODEL_c3311a8331244551843472284c58f60f",
+            "value": 123543
+          }
+        },
+        "b4351182f3b7462cbf915b26863cf4de": {
+          "model_module": "@jupyter-widgets/controls",
+          "model_name": "HTMLModel",
+          "model_module_version": "1.5.0",
+          "state": {
+            "_dom_classes": [],
+            "_model_module": "@jupyter-widgets/controls",
+            "_model_module_version": "1.5.0",
+            "_model_name": "HTMLModel",
+            "_view_count": null,
+            "_view_module": "@jupyter-widgets/controls",
+            "_view_module_version": "1.5.0",
+            "_view_name": "HTMLView",
+            "description": "",
+            "description_tooltip": null,
+            "layout": "IPY_MODEL_ddd6507456c9496db1525c87994c5e4a",
+            "placeholder": "​",
+            "style": "IPY_MODEL_be663377d2864ba3a4c6832ed9d77a3d",
+            "value": " 124k/124k [00:00&lt;00:00, 278kB/s]"
+          }
+        },
+        "dae8d2fe62bd41ea9d99c9ccc817de46": {
+          "model_module": "@jupyter-widgets/base",
+          "model_name": "LayoutModel",
+          "model_module_version": "1.2.0",
+          "state": {
+            "_model_module": "@jupyter-widgets/base",
+            "_model_module_version": "1.2.0",
+            "_model_name": "LayoutModel",
+            "_view_count": null,
+            "_view_module": "@jupyter-widgets/base",
+            "_view_module_version": "1.2.0",
+            "_view_name": "LayoutView",
+            "align_content": null,
+            "align_items": null,
+            "align_self": null,
+            "border": null,
+            "bottom": null,
+            "display": null,
+            "flex": null,
+            "flex_flow": null,
+            "grid_area": null,
+            "grid_auto_columns": null,
+            "grid_auto_flow": null,
+            "grid_auto_rows": null,
+            "grid_column": null,
+            "grid_gap": null,
+            "grid_row": null,
+            "grid_template_areas": null,
+            "grid_template_columns": null,
+            "grid_template_rows": null,
+            "height": null,
+            "justify_content": null,
+            "justify_items": null,
+            "left": null,
+            "margin": null,
+            "max_height": null,
+            "max_width": null,
+            "min_height": null,
+            "min_width": null,
+            "object_fit": null,
+            "object_position": null,
+            "order": null,
+            "overflow": null,
+            "overflow_x": null,
+            "overflow_y": null,
+            "padding": null,
+            "right": null,
+            "top": null,
+            "visibility": null,
+            "width": null
+          }
+        },
+        "e35dd504906745b28846c07a644c3423": {
+          "model_module": "@jupyter-widgets/base",
+          "model_name": "LayoutModel",
+          "model_module_version": "1.2.0",
+          "state": {
+            "_model_module": "@jupyter-widgets/base",
+            "_model_module_version": "1.2.0",
+            "_model_name": "LayoutModel",
+            "_view_count": null,
+            "_view_module": "@jupyter-widgets/base",
+            "_view_module_version": "1.2.0",
+            "_view_name": "LayoutView",
+            "align_content": null,
+            "align_items": null,
+            "align_self": null,
+            "border": null,
+            "bottom": null,
+            "display": null,
+            "flex": null,
+            "flex_flow": null,
+            "grid_area": null,
+            "grid_auto_columns": null,
+            "grid_auto_flow": null,
+            "grid_auto_rows": null,
+            "grid_column": null,
+            "grid_gap": null,
+            "grid_row": null,
+            "grid_template_areas": null,
+            "grid_template_columns": null,
+            "grid_template_rows": null,
+            "height": null,
+            "justify_content": null,
+            "justify_items": null,
+            "left": null,
+            "margin": null,
+            "max_height": null,
+            "max_width": null,
+            "min_height": null,
+            "min_width": null,
+            "object_fit": null,
+            "object_position": null,
+            "order": null,
+            "overflow": null,
+            "overflow_x": null,
+            "overflow_y": null,
+            "padding": null,
+            "right": null,
+            "top": null,
+            "visibility": null,
+            "width": null
+          }
+        },
+        "8171a7d8dcb9432881aa56fb52743e3d": {
+          "model_module": "@jupyter-widgets/controls",
+          "model_name": "DescriptionStyleModel",
+          "model_module_version": "1.5.0",
+          "state": {
+            "_model_module": "@jupyter-widgets/controls",
+            "_model_module_version": "1.5.0",
+            "_model_name": "DescriptionStyleModel",
+            "_view_count": null,
+            "_view_module": "@jupyter-widgets/base",
+            "_view_module_version": "1.2.0",
+            "_view_name": "StyleView",
+            "description_width": ""
+          }
+        },
+        "2058d4fb6b1745a2a971491fcc747244": {
+          "model_module": "@jupyter-widgets/base",
+          "model_name": "LayoutModel",
+          "model_module_version": "1.2.0",
+          "state": {
+            "_model_module": "@jupyter-widgets/base",
+            "_model_module_version": "1.2.0",
+            "_model_name": "LayoutModel",
+            "_view_count": null,
+            "_view_module": "@jupyter-widgets/base",
+            "_view_module_version": "1.2.0",
+            "_view_name": "LayoutView",
+            "align_content": null,
+            "align_items": null,
+            "align_self": null,
+            "border": null,
+            "bottom": null,
+            "display": null,
+            "flex": null,
+            "flex_flow": null,
+            "grid_area": null,
+            "grid_auto_columns": null,
+            "grid_auto_flow": null,
+            "grid_auto_rows": null,
+            "grid_column": null,
+            "grid_gap": null,
+            "grid_row": null,
+            "grid_template_areas": null,
+            "grid_template_columns": null,
+            "grid_template_rows": null,
+            "height": null,
+            "justify_content": null,
+            "justify_items": null,
+            "left": null,
+            "margin": null,
+            "max_height": null,
+            "max_width": null,
+            "min_height": null,
+            "min_width": null,
+            "object_fit": null,
+            "object_position": null,
+            "order": null,
+            "overflow": null,
+            "overflow_x": null,
+            "overflow_y": null,
+            "padding": null,
+            "right": null,
+            "top": null,
+            "visibility": null,
+            "width": null
+          }
+        },
+        "c3311a8331244551843472284c58f60f": {
+          "model_module": "@jupyter-widgets/controls",
+          "model_name": "ProgressStyleModel",
+          "model_module_version": "1.5.0",
+          "state": {
+            "_model_module": "@jupyter-widgets/controls",
+            "_model_module_version": "1.5.0",
+            "_model_name": "ProgressStyleModel",
+            "_view_count": null,
+            "_view_module": "@jupyter-widgets/base",
+            "_view_module_version": "1.2.0",
+            "_view_name": "StyleView",
+            "bar_color": null,
+            "description_width": ""
+          }
+        },
+        "ddd6507456c9496db1525c87994c5e4a": {
+          "model_module": "@jupyter-widgets/base",
+          "model_name": "LayoutModel",
+          "model_module_version": "1.2.0",
+          "state": {
+            "_model_module": "@jupyter-widgets/base",
+            "_model_module_version": "1.2.0",
+            "_model_name": "LayoutModel",
+            "_view_count": null,
+            "_view_module": "@jupyter-widgets/base",
+            "_view_module_version": "1.2.0",
+            "_view_name": "LayoutView",
+            "align_content": null,
+            "align_items": null,
+            "align_self": null,
+            "border": null,
+            "bottom": null,
+            "display": null,
+            "flex": null,
+            "flex_flow": null,
+            "grid_area": null,
+            "grid_auto_columns": null,
+            "grid_auto_flow": null,
+            "grid_auto_rows": null,
+            "grid_column": null,
+            "grid_gap": null,
+            "grid_row": null,
+            "grid_template_areas": null,
+            "grid_template_columns": null,
+            "grid_template_rows": null,
+            "height": null,
+            "justify_content": null,
+            "justify_items": null,
+            "left": null,
+            "margin": null,
+            "max_height": null,
+            "max_width": null,
+            "min_height": null,
+            "min_width": null,
+            "object_fit": null,
+            "object_position": null,
+            "order": null,
+            "overflow": null,
+            "overflow_x": null,
+            "overflow_y": null,
+            "padding": null,
+            "right": null,
+            "top": null,
+            "visibility": null,
+            "width": null
+          }
+        },
+        "be663377d2864ba3a4c6832ed9d77a3d": {
+          "model_module": "@jupyter-widgets/controls",
+          "model_name": "DescriptionStyleModel",
+          "model_module_version": "1.5.0",
+          "state": {
+            "_model_module": "@jupyter-widgets/controls",
+            "_model_module_version": "1.5.0",
+            "_model_name": "DescriptionStyleModel",
+            "_view_count": null,
+            "_view_module": "@jupyter-widgets/base",
+            "_view_module_version": "1.2.0",
+            "_view_name": "StyleView",
+            "description_width": ""
+          }
+        },
+        "06dd326664c2487f8195c15c56326273": {
+          "model_module": "@jupyter-widgets/controls",
+          "model_name": "HBoxModel",
+          "model_module_version": "1.5.0",
+          "state": {
+            "_dom_classes": [],
+            "_model_module": "@jupyter-widgets/controls",
+            "_model_module_version": "1.5.0",
+            "_model_name": "HBoxModel",
+            "_view_count": null,
+            "_view_module": "@jupyter-widgets/controls",
+            "_view_module_version": "1.5.0",
+            "_view_name": "HBoxView",
+            "box_style": "",
+            "children": [
+              "IPY_MODEL_45b8402a7ce240c5b3e84520af47e6e3",
+              "IPY_MODEL_f6374d57d06f4234ba5b29acbbec7c8d",
+              "IPY_MODEL_cde3a6c088e545cf94e2ccc73655eff2"
+            ],
+            "layout": "IPY_MODEL_60723c32638d47dd81281d31ddc5eb66"
+          }
+        },
+        "45b8402a7ce240c5b3e84520af47e6e3": {
+          "model_module": "@jupyter-widgets/controls",
+          "model_name": "HTMLModel",
+          "model_module_version": "1.5.0",
+          "state": {
+            "_dom_classes": [],
+            "_model_module": "@jupyter-widgets/controls",
+            "_model_module_version": "1.5.0",
+            "_model_name": "HTMLModel",
+            "_view_count": null,
+            "_view_module": "@jupyter-widgets/controls",
+            "_view_module_version": "1.5.0",
+            "_view_name": "HTMLView",
+            "description": "",
+            "description_tooltip": null,
+            "layout": "IPY_MODEL_b79622d7dc0e46e28ebd17d730bfe91d",
+            "placeholder": "​",
+            "style": "IPY_MODEL_027f223a86a249dd88b1010dc85f679f",
+            "value": "model.safetensors: 100%"
+          }
+        },
+        "f6374d57d06f4234ba5b29acbbec7c8d": {
+          "model_module": "@jupyter-widgets/controls",
+          "model_name": "FloatProgressModel",
+          "model_module_version": "1.5.0",
+          "state": {
+            "_dom_classes": [],
+            "_model_module": "@jupyter-widgets/controls",
+            "_model_module_version": "1.5.0",
+            "_model_name": "FloatProgressModel",
+            "_view_count": null,
+            "_view_module": "@jupyter-widgets/controls",
+            "_view_module_version": "1.5.0",
+            "_view_name": "ProgressView",
+            "bar_style": "success",
+            "description": "",
+            "description_tooltip": null,
+            "layout": "IPY_MODEL_7bf175a6594a4417899953186dfa8a97",
+            "max": 2035332888,
+            "min": 0,
+            "orientation": "horizontal",
+            "style": "IPY_MODEL_620f2c3ccaac4028bd2668a12dc57749",
+            "value": 2035332888
+          }
+        },
+        "cde3a6c088e545cf94e2ccc73655eff2": {
+          "model_module": "@jupyter-widgets/controls",
+          "model_name": "HTMLModel",
+          "model_module_version": "1.5.0",
+          "state": {
+            "_dom_classes": [],
+            "_model_module": "@jupyter-widgets/controls",
+            "_model_module_version": "1.5.0",
+            "_model_name": "HTMLModel",
+            "_view_count": null,
+            "_view_module": "@jupyter-widgets/controls",
+            "_view_module_version": "1.5.0",
+            "_view_name": "HTMLView",
+            "description": "",
+            "description_tooltip": null,
+            "layout": "IPY_MODEL_1186b85637f2496ba1366ab4d2d2a11d",
+            "placeholder": "​",
+            "style": "IPY_MODEL_6e0d9876d9f94fca889a959b09319474",
+            "value": " 2.04G/2.04G [00:15&lt;00:00, 98.2MB/s]"
+          }
+        },
+        "60723c32638d47dd81281d31ddc5eb66": {
+          "model_module": "@jupyter-widgets/base",
+          "model_name": "LayoutModel",
+          "model_module_version": "1.2.0",
+          "state": {
+            "_model_module": "@jupyter-widgets/base",
+            "_model_module_version": "1.2.0",
+            "_model_name": "LayoutModel",
+            "_view_count": null,
+            "_view_module": "@jupyter-widgets/base",
+            "_view_module_version": "1.2.0",
+            "_view_name": "LayoutView",
+            "align_content": null,
+            "align_items": null,
+            "align_self": null,
+            "border": null,
+            "bottom": null,
+            "display": null,
+            "flex": null,
+            "flex_flow": null,
+            "grid_area": null,
+            "grid_auto_columns": null,
+            "grid_auto_flow": null,
+            "grid_auto_rows": null,
+            "grid_column": null,
+            "grid_gap": null,
+            "grid_row": null,
+            "grid_template_areas": null,
+            "grid_template_columns": null,
+            "grid_template_rows": null,
+            "height": null,
+            "justify_content": null,
+            "justify_items": null,
+            "left": null,
+            "margin": null,
+            "max_height": null,
+            "max_width": null,
+            "min_height": null,
+            "min_width": null,
+            "object_fit": null,
+            "object_position": null,
+            "order": null,
+            "overflow": null,
+            "overflow_x": null,
+            "overflow_y": null,
+            "padding": null,
+            "right": null,
+            "top": null,
+            "visibility": null,
+            "width": null
+          }
+        },
+        "b79622d7dc0e46e28ebd17d730bfe91d": {
+          "model_module": "@jupyter-widgets/base",
+          "model_name": "LayoutModel",
+          "model_module_version": "1.2.0",
+          "state": {
+            "_model_module": "@jupyter-widgets/base",
+            "_model_module_version": "1.2.0",
+            "_model_name": "LayoutModel",
+            "_view_count": null,
+            "_view_module": "@jupyter-widgets/base",
+            "_view_module_version": "1.2.0",
+            "_view_name": "LayoutView",
+            "align_content": null,
+            "align_items": null,
+            "align_self": null,
+            "border": null,
+            "bottom": null,
+            "display": null,
+            "flex": null,
+            "flex_flow": null,
+            "grid_area": null,
+            "grid_auto_columns": null,
+            "grid_auto_flow": null,
+            "grid_auto_rows": null,
+            "grid_column": null,
+            "grid_gap": null,
+            "grid_row": null,
+            "grid_template_areas": null,
+            "grid_template_columns": null,
+            "grid_template_rows": null,
+            "height": null,
+            "justify_content": null,
+            "justify_items": null,
+            "left": null,
+            "margin": null,
+            "max_height": null,
+            "max_width": null,
+            "min_height": null,
+            "min_width": null,
+            "object_fit": null,
+            "object_position": null,
+            "order": null,
+            "overflow": null,
+            "overflow_x": null,
+            "overflow_y": null,
+            "padding": null,
+            "right": null,
+            "top": null,
+            "visibility": null,
+            "width": null
+          }
+        },
+        "027f223a86a249dd88b1010dc85f679f": {
+          "model_module": "@jupyter-widgets/controls",
+          "model_name": "DescriptionStyleModel",
+          "model_module_version": "1.5.0",
+          "state": {
+            "_model_module": "@jupyter-widgets/controls",
+            "_model_module_version": "1.5.0",
+            "_model_name": "DescriptionStyleModel",
+            "_view_count": null,
+            "_view_module": "@jupyter-widgets/base",
+            "_view_module_version": "1.2.0",
+            "_view_name": "StyleView",
+            "description_width": ""
+          }
+        },
+        "7bf175a6594a4417899953186dfa8a97": {
+          "model_module": "@jupyter-widgets/base",
+          "model_name": "LayoutModel",
+          "model_module_version": "1.2.0",
+          "state": {
+            "_model_module": "@jupyter-widgets/base",
+            "_model_module_version": "1.2.0",
+            "_model_name": "LayoutModel",
+            "_view_count": null,
+            "_view_module": "@jupyter-widgets/base",
+            "_view_module_version": "1.2.0",
+            "_view_name": "LayoutView",
+            "align_content": null,
+            "align_items": null,
+            "align_self": null,
+            "border": null,
+            "bottom": null,
+            "display": null,
+            "flex": null,
+            "flex_flow": null,
+            "grid_area": null,
+            "grid_auto_columns": null,
+            "grid_auto_flow": null,
+            "grid_auto_rows": null,
+            "grid_column": null,
+            "grid_gap": null,
+            "grid_row": null,
+            "grid_template_areas": null,
+            "grid_template_columns": null,
+            "grid_template_rows": null,
+            "height": null,
+            "justify_content": null,
+            "justify_items": null,
+            "left": null,
+            "margin": null,
+            "max_height": null,
+            "max_width": null,
+            "min_height": null,
+            "min_width": null,
+            "object_fit": null,
+            "object_position": null,
+            "order": null,
+            "overflow": null,
+            "overflow_x": null,
+            "overflow_y": null,
+            "padding": null,
+            "right": null,
+            "top": null,
+            "visibility": null,
+            "width": null
+          }
+        },
+        "620f2c3ccaac4028bd2668a12dc57749": {
+          "model_module": "@jupyter-widgets/controls",
+          "model_name": "ProgressStyleModel",
+          "model_module_version": "1.5.0",
+          "state": {
+            "_model_module": "@jupyter-widgets/controls",
+            "_model_module_version": "1.5.0",
+            "_model_name": "ProgressStyleModel",
+            "_view_count": null,
+            "_view_module": "@jupyter-widgets/base",
+            "_view_module_version": "1.2.0",
+            "_view_name": "StyleView",
+            "bar_color": null,
+            "description_width": ""
+          }
+        },
+        "1186b85637f2496ba1366ab4d2d2a11d": {
+          "model_module": "@jupyter-widgets/base",
+          "model_name": "LayoutModel",
+          "model_module_version": "1.2.0",
+          "state": {
+            "_model_module": "@jupyter-widgets/base",
+            "_model_module_version": "1.2.0",
+            "_model_name": "LayoutModel",
+            "_view_count": null,
+            "_view_module": "@jupyter-widgets/base",
+            "_view_module_version": "1.2.0",
+            "_view_name": "LayoutView",
+            "align_content": null,
+            "align_items": null,
+            "align_self": null,
+            "border": null,
+            "bottom": null,
+            "display": null,
+            "flex": null,
+            "flex_flow": null,
+            "grid_area": null,
+            "grid_auto_columns": null,
+            "grid_auto_flow": null,
+            "grid_auto_rows": null,
+            "grid_column": null,
+            "grid_gap": null,
+            "grid_row": null,
+            "grid_template_areas": null,
+            "grid_template_columns": null,
+            "grid_template_rows": null,
+            "height": null,
+            "justify_content": null,
+            "justify_items": null,
+            "left": null,
+            "margin": null,
+            "max_height": null,
+            "max_width": null,
+            "min_height": null,
+            "min_width": null,
+            "object_fit": null,
+            "object_position": null,
+            "order": null,
+            "overflow": null,
+            "overflow_x": null,
+            "overflow_y": null,
+            "padding": null,
+            "right": null,
+            "top": null,
+            "visibility": null,
+            "width": null
+          }
+        },
+        "6e0d9876d9f94fca889a959b09319474": {
+          "model_module": "@jupyter-widgets/controls",
+          "model_name": "DescriptionStyleModel",
+          "model_module_version": "1.5.0",
+          "state": {
+            "_model_module": "@jupyter-widgets/controls",
+            "_model_module_version": "1.5.0",
+            "_model_name": "DescriptionStyleModel",
+            "_view_count": null,
+            "_view_module": "@jupyter-widgets/base",
+            "_view_module_version": "1.2.0",
+            "_view_name": "StyleView",
+            "description_width": ""
+          }
+        },
+        "422ea9b78c584d1ca555728cd01e861b": {
+          "model_module": "@jupyter-widgets/controls",
+          "model_name": "HBoxModel",
+          "model_module_version": "1.5.0",
+          "state": {
+            "_dom_classes": [],
+            "_model_module": "@jupyter-widgets/controls",
+            "_model_module_version": "1.5.0",
+            "_model_name": "HBoxModel",
+            "_view_count": null,
+            "_view_module": "@jupyter-widgets/controls",
+            "_view_module_version": "1.5.0",
+            "_view_name": "HBoxView",
+            "box_style": "",
+            "children": [
+              "IPY_MODEL_063ce9a58fc748e7929ed70a72c1b287",
+              "IPY_MODEL_75ebd541b72941b3935a96da96615293",
+              "IPY_MODEL_7c6ad8b88a7c49ca980f14bb03fd1463"
+            ],
+            "layout": "IPY_MODEL_eb94263072dc4ab78a2f125840a5dda5"
+          }
+        },
+        "063ce9a58fc748e7929ed70a72c1b287": {
+          "model_module": "@jupyter-widgets/controls",
+          "model_name": "HTMLModel",
+          "model_module_version": "1.5.0",
+          "state": {
+            "_dom_classes": [],
+            "_model_module": "@jupyter-widgets/controls",
+            "_model_module_version": "1.5.0",
+            "_model_name": "HTMLModel",
+            "_view_count": null,
+            "_view_module": "@jupyter-widgets/controls",
+            "_view_module_version": "1.5.0",
+            "_view_name": "HTMLView",
+            "description": "",
+            "description_tooltip": null,
+            "layout": "IPY_MODEL_81ae6a64fbee460ab6c15b5cc0448474",
+            "placeholder": "​",
+            "style": "IPY_MODEL_3607d7c97912499191b8b632f29bc31d",
+            "value": "config.json: "
+          }
+        },
+        "75ebd541b72941b3935a96da96615293": {
+          "model_module": "@jupyter-widgets/controls",
+          "model_name": "FloatProgressModel",
+          "model_module_version": "1.5.0",
+          "state": {
+            "_dom_classes": [],
+            "_model_module": "@jupyter-widgets/controls",
+            "_model_module_version": "1.5.0",
+            "_model_name": "FloatProgressModel",
+            "_view_count": null,
+            "_view_module": "@jupyter-widgets/controls",
+            "_view_module_version": "1.5.0",
+            "_view_name": "ProgressView",
+            "bar_style": "success",
+            "description": "",
+            "description_tooltip": null,
+            "layout": "IPY_MODEL_9006110b3b8043dfbe85d1c485242834",
+            "max": 1,
+            "min": 0,
+            "orientation": "horizontal",
+            "style": "IPY_MODEL_4ca65f86d3a344eeb43f1e10ce2bade7",
+            "value": 1
+          }
+        },
+        "7c6ad8b88a7c49ca980f14bb03fd1463": {
+          "model_module": "@jupyter-widgets/controls",
+          "model_name": "HTMLModel",
+          "model_module_version": "1.5.0",
+          "state": {
+            "_dom_classes": [],
+            "_model_module": "@jupyter-widgets/controls",
+            "_model_module_version": "1.5.0",
+            "_model_name": "HTMLModel",
+            "_view_count": null,
+            "_view_module": "@jupyter-widgets/controls",
+            "_view_module_version": "1.5.0",
+            "_view_name": "HTMLView",
+            "description": "",
+            "description_tooltip": null,
+            "layout": "IPY_MODEL_8fee63d65695482f9c68294816a98a6b",
+            "placeholder": "​",
+            "style": "IPY_MODEL_73e3840872fe4245aa88c315fe266214",
+            "value": " 2.12k/? [00:00&lt;00:00, 179kB/s]"
+          }
+        },
+        "eb94263072dc4ab78a2f125840a5dda5": {
+          "model_module": "@jupyter-widgets/base",
+          "model_name": "LayoutModel",
+          "model_module_version": "1.2.0",
+          "state": {
+            "_model_module": "@jupyter-widgets/base",
+            "_model_module_version": "1.2.0",
+            "_model_name": "LayoutModel",
+            "_view_count": null,
+            "_view_module": "@jupyter-widgets/base",
+            "_view_module_version": "1.2.0",
+            "_view_name": "LayoutView",
+            "align_content": null,
+            "align_items": null,
+            "align_self": null,
+            "border": null,
+            "bottom": null,
+            "display": null,
+            "flex": null,
+            "flex_flow": null,
+            "grid_area": null,
+            "grid_auto_columns": null,
+            "grid_auto_flow": null,
+            "grid_auto_rows": null,
+            "grid_column": null,
+            "grid_gap": null,
+            "grid_row": null,
+            "grid_template_areas": null,
+            "grid_template_columns": null,
+            "grid_template_rows": null,
+            "height": null,
+            "justify_content": null,
+            "justify_items": null,
+            "left": null,
+            "margin": null,
+            "max_height": null,
+            "max_width": null,
+            "min_height": null,
+            "min_width": null,
+            "object_fit": null,
+            "object_position": null,
+            "order": null,
+            "overflow": null,
+            "overflow_x": null,
+            "overflow_y": null,
+            "padding": null,
+            "right": null,
+            "top": null,
+            "visibility": null,
+            "width": null
+          }
+        },
+        "81ae6a64fbee460ab6c15b5cc0448474": {
+          "model_module": "@jupyter-widgets/base",
+          "model_name": "LayoutModel",
+          "model_module_version": "1.2.0",
+          "state": {
+            "_model_module": "@jupyter-widgets/base",
+            "_model_module_version": "1.2.0",
+            "_model_name": "LayoutModel",
+            "_view_count": null,
+            "_view_module": "@jupyter-widgets/base",
+            "_view_module_version": "1.2.0",
+            "_view_name": "LayoutView",
+            "align_content": null,
+            "align_items": null,
+            "align_self": null,
+            "border": null,
+            "bottom": null,
+            "display": null,
+            "flex": null,
+            "flex_flow": null,
+            "grid_area": null,
+            "grid_auto_columns": null,
+            "grid_auto_flow": null,
+            "grid_auto_rows": null,
+            "grid_column": null,
+            "grid_gap": null,
+            "grid_row": null,
+            "grid_template_areas": null,
+            "grid_template_columns": null,
+            "grid_template_rows": null,
+            "height": null,
+            "justify_content": null,
+            "justify_items": null,
+            "left": null,
+            "margin": null,
+            "max_height": null,
+            "max_width": null,
+            "min_height": null,
+            "min_width": null,
+            "object_fit": null,
+            "object_position": null,
+            "order": null,
+            "overflow": null,
+            "overflow_x": null,
+            "overflow_y": null,
+            "padding": null,
+            "right": null,
+            "top": null,
+            "visibility": null,
+            "width": null
+          }
+        },
+        "3607d7c97912499191b8b632f29bc31d": {
+          "model_module": "@jupyter-widgets/controls",
+          "model_name": "DescriptionStyleModel",
+          "model_module_version": "1.5.0",
+          "state": {
+            "_model_module": "@jupyter-widgets/controls",
+            "_model_module_version": "1.5.0",
+            "_model_name": "DescriptionStyleModel",
+            "_view_count": null,
+            "_view_module": "@jupyter-widgets/base",
+            "_view_module_version": "1.2.0",
+            "_view_name": "StyleView",
+            "description_width": ""
+          }
+        },
+        "9006110b3b8043dfbe85d1c485242834": {
+          "model_module": "@jupyter-widgets/base",
+          "model_name": "LayoutModel",
+          "model_module_version": "1.2.0",
+          "state": {
+            "_model_module": "@jupyter-widgets/base",
+            "_model_module_version": "1.2.0",
+            "_model_name": "LayoutModel",
+            "_view_count": null,
+            "_view_module": "@jupyter-widgets/base",
+            "_view_module_version": "1.2.0",
+            "_view_name": "LayoutView",
+            "align_content": null,
+            "align_items": null,
+            "align_self": null,
+            "border": null,
+            "bottom": null,
+            "display": null,
+            "flex": null,
+            "flex_flow": null,
+            "grid_area": null,
+            "grid_auto_columns": null,
+            "grid_auto_flow": null,
+            "grid_auto_rows": null,
+            "grid_column": null,
+            "grid_gap": null,
+            "grid_row": null,
+            "grid_template_areas": null,
+            "grid_template_columns": null,
+            "grid_template_rows": null,
+            "height": null,
+            "justify_content": null,
+            "justify_items": null,
+            "left": null,
+            "margin": null,
+            "max_height": null,
+            "max_width": null,
+            "min_height": null,
+            "min_width": null,
+            "object_fit": null,
+            "object_position": null,
+            "order": null,
+            "overflow": null,
+            "overflow_x": null,
+            "overflow_y": null,
+            "padding": null,
+            "right": null,
+            "top": null,
+            "visibility": null,
+            "width": "20px"
+          }
+        },
+        "4ca65f86d3a344eeb43f1e10ce2bade7": {
+          "model_module": "@jupyter-widgets/controls",
+          "model_name": "ProgressStyleModel",
+          "model_module_version": "1.5.0",
+          "state": {
+            "_model_module": "@jupyter-widgets/controls",
+            "_model_module_version": "1.5.0",
+            "_model_name": "ProgressStyleModel",
+            "_view_count": null,
+            "_view_module": "@jupyter-widgets/base",
+            "_view_module_version": "1.2.0",
+            "_view_name": "StyleView",
+            "bar_color": null,
+            "description_width": ""
+          }
+        },
+        "8fee63d65695482f9c68294816a98a6b": {
+          "model_module": "@jupyter-widgets/base",
+          "model_name": "LayoutModel",
+          "model_module_version": "1.2.0",
+          "state": {
+            "_model_module": "@jupyter-widgets/base",
+            "_model_module_version": "1.2.0",
+            "_model_name": "LayoutModel",
+            "_view_count": null,
+            "_view_module": "@jupyter-widgets/base",
+            "_view_module_version": "1.2.0",
+            "_view_name": "LayoutView",
+            "align_content": null,
+            "align_items": null,
+            "align_self": null,
+            "border": null,
+            "bottom": null,
+            "display": null,
+            "flex": null,
+            "flex_flow": null,
+            "grid_area": null,
+            "grid_auto_columns": null,
+            "grid_auto_flow": null,
+            "grid_auto_rows": null,
+            "grid_column": null,
+            "grid_gap": null,
+            "grid_row": null,
+            "grid_template_areas": null,
+            "grid_template_columns": null,
+            "grid_template_rows": null,
+            "height": null,
+            "justify_content": null,
+            "justify_items": null,
+            "left": null,
+            "margin": null,
+            "max_height": null,
+            "max_width": null,
+            "min_height": null,
+            "min_width": null,
+            "object_fit": null,
+            "object_position": null,
+            "order": null,
+            "overflow": null,
+            "overflow_x": null,
+            "overflow_y": null,
+            "padding": null,
+            "right": null,
+            "top": null,
+            "visibility": null,
+            "width": null
+          }
+        },
+        "73e3840872fe4245aa88c315fe266214": {
+          "model_module": "@jupyter-widgets/controls",
+          "model_name": "DescriptionStyleModel",
+          "model_module_version": "1.5.0",
+          "state": {
+            "_model_module": "@jupyter-widgets/controls",
+            "_model_module_version": "1.5.0",
+            "_model_name": "DescriptionStyleModel",
+            "_view_count": null,
+            "_view_module": "@jupyter-widgets/base",
+            "_view_module_version": "1.2.0",
+            "_view_name": "StyleView",
+            "description_width": ""
+          }
+        },
+        "f133d8b35d8f461d9e3b0c099d56dc98": {
+          "model_module": "@jupyter-widgets/controls",
+          "model_name": "HBoxModel",
+          "model_module_version": "1.5.0",
+          "state": {
+            "_dom_classes": [],
+            "_model_module": "@jupyter-widgets/controls",
+            "_model_module_version": "1.5.0",
+            "_model_name": "HBoxModel",
+            "_view_count": null,
+            "_view_module": "@jupyter-widgets/controls",
+            "_view_module_version": "1.5.0",
+            "_view_name": "HBoxView",
+            "box_style": "",
+            "children": [
+              "IPY_MODEL_c6c3ec7e97554e3f930cdcab2e3002fa",
+              "IPY_MODEL_73a5e9fc2808494485db6768fdb6ac6e",
+              "IPY_MODEL_d30457cbc6fa4a54902bc92640af82ce"
+            ],
+            "layout": "IPY_MODEL_a9c4e87ff31e458187e09e93b23bcaed"
+          }
+        },
+        "c6c3ec7e97554e3f930cdcab2e3002fa": {
+          "model_module": "@jupyter-widgets/controls",
+          "model_name": "HTMLModel",
+          "model_module_version": "1.5.0",
+          "state": {
+            "_dom_classes": [],
+            "_model_module": "@jupyter-widgets/controls",
+            "_model_module_version": "1.5.0",
+            "_model_name": "HTMLModel",
+            "_view_count": null,
+            "_view_module": "@jupyter-widgets/controls",
+            "_view_module_version": "1.5.0",
+            "_view_name": "HTMLView",
+            "description": "",
+            "description_tooltip": null,
+            "layout": "IPY_MODEL_0af92bfff186463ab480139f415b3f45",
+            "placeholder": "​",
+            "style": "IPY_MODEL_2974cc410d6e40d89cdb0a600943d70e",
+            "value": ".gitattributes: "
+          }
+        },
+        "73a5e9fc2808494485db6768fdb6ac6e": {
+          "model_module": "@jupyter-widgets/controls",
+          "model_name": "FloatProgressModel",
+          "model_module_version": "1.5.0",
+          "state": {
+            "_dom_classes": [],
+            "_model_module": "@jupyter-widgets/controls",
+            "_model_module_version": "1.5.0",
+            "_model_name": "FloatProgressModel",
+            "_view_count": null,
+            "_view_module": "@jupyter-widgets/controls",
+            "_view_module_version": "1.5.0",
+            "_view_name": "ProgressView",
+            "bar_style": "success",
+            "description": "",
+            "description_tooltip": null,
+            "layout": "IPY_MODEL_f48cf6761d6d493cb76c0030249baa11",
+            "max": 1,
+            "min": 0,
+            "orientation": "horizontal",
+            "style": "IPY_MODEL_3ea8f4b8b4e54b99a48d410fe9659f96",
+            "value": 1
+          }
+        },
+        "d30457cbc6fa4a54902bc92640af82ce": {
+          "model_module": "@jupyter-widgets/controls",
+          "model_name": "HTMLModel",
+          "model_module_version": "1.5.0",
+          "state": {
+            "_dom_classes": [],
+            "_model_module": "@jupyter-widgets/controls",
+            "_model_module_version": "1.5.0",
+            "_model_name": "HTMLModel",
+            "_view_count": null,
+            "_view_module": "@jupyter-widgets/controls",
+            "_view_module_version": "1.5.0",
+            "_view_name": "HTMLView",
+            "description": "",
+            "description_tooltip": null,
+            "layout": "IPY_MODEL_4a7829162a704c62b40823c359c5c86e",
+            "placeholder": "​",
+            "style": "IPY_MODEL_c23a9a4b3ab044d6af40f293d7249733",
+            "value": " 1.57k/? [00:00&lt;00:00, 203kB/s]"
+          }
+        },
+        "a9c4e87ff31e458187e09e93b23bcaed": {
+          "model_module": "@jupyter-widgets/base",
+          "model_name": "LayoutModel",
+          "model_module_version": "1.2.0",
+          "state": {
+            "_model_module": "@jupyter-widgets/base",
+            "_model_module_version": "1.2.0",
+            "_model_name": "LayoutModel",
+            "_view_count": null,
+            "_view_module": "@jupyter-widgets/base",
+            "_view_module_version": "1.2.0",
+            "_view_name": "LayoutView",
+            "align_content": null,
+            "align_items": null,
+            "align_self": null,
+            "border": null,
+            "bottom": null,
+            "display": null,
+            "flex": null,
+            "flex_flow": null,
+            "grid_area": null,
+            "grid_auto_columns": null,
+            "grid_auto_flow": null,
+            "grid_auto_rows": null,
+            "grid_column": null,
+            "grid_gap": null,
+            "grid_row": null,
+            "grid_template_areas": null,
+            "grid_template_columns": null,
+            "grid_template_rows": null,
+            "height": null,
+            "justify_content": null,
+            "justify_items": null,
+            "left": null,
+            "margin": null,
+            "max_height": null,
+            "max_width": null,
+            "min_height": null,
+            "min_width": null,
+            "object_fit": null,
+            "object_position": null,
+            "order": null,
+            "overflow": null,
+            "overflow_x": null,
+            "overflow_y": null,
+            "padding": null,
+            "right": null,
+            "top": null,
+            "visibility": null,
+            "width": null
+          }
+        },
+        "0af92bfff186463ab480139f415b3f45": {
+          "model_module": "@jupyter-widgets/base",
+          "model_name": "LayoutModel",
+          "model_module_version": "1.2.0",
+          "state": {
+            "_model_module": "@jupyter-widgets/base",
+            "_model_module_version": "1.2.0",
+            "_model_name": "LayoutModel",
+            "_view_count": null,
+            "_view_module": "@jupyter-widgets/base",
+            "_view_module_version": "1.2.0",
+            "_view_name": "LayoutView",
+            "align_content": null,
+            "align_items": null,
+            "align_self": null,
+            "border": null,
+            "bottom": null,
+            "display": null,
+            "flex": null,
+            "flex_flow": null,
+            "grid_area": null,
+            "grid_auto_columns": null,
+            "grid_auto_flow": null,
+            "grid_auto_rows": null,
+            "grid_column": null,
+            "grid_gap": null,
+            "grid_row": null,
+            "grid_template_areas": null,
+            "grid_template_columns": null,
+            "grid_template_rows": null,
+            "height": null,
+            "justify_content": null,
+            "justify_items": null,
+            "left": null,
+            "margin": null,
+            "max_height": null,
+            "max_width": null,
+            "min_height": null,
+            "min_width": null,
+            "object_fit": null,
+            "object_position": null,
+            "order": null,
+            "overflow": null,
+            "overflow_x": null,
+            "overflow_y": null,
+            "padding": null,
+            "right": null,
+            "top": null,
+            "visibility": null,
+            "width": null
+          }
+        },
+        "2974cc410d6e40d89cdb0a600943d70e": {
+          "model_module": "@jupyter-widgets/controls",
+          "model_name": "DescriptionStyleModel",
+          "model_module_version": "1.5.0",
+          "state": {
+            "_model_module": "@jupyter-widgets/controls",
+            "_model_module_version": "1.5.0",
+            "_model_name": "DescriptionStyleModel",
+            "_view_count": null,
+            "_view_module": "@jupyter-widgets/base",
+            "_view_module_version": "1.2.0",
+            "_view_name": "StyleView",
+            "description_width": ""
+          }
+        },
+        "f48cf6761d6d493cb76c0030249baa11": {
+          "model_module": "@jupyter-widgets/base",
+          "model_name": "LayoutModel",
+          "model_module_version": "1.2.0",
+          "state": {
+            "_model_module": "@jupyter-widgets/base",
+            "_model_module_version": "1.2.0",
+            "_model_name": "LayoutModel",
+            "_view_count": null,
+            "_view_module": "@jupyter-widgets/base",
+            "_view_module_version": "1.2.0",
+            "_view_name": "LayoutView",
+            "align_content": null,
+            "align_items": null,
+            "align_self": null,
+            "border": null,
+            "bottom": null,
+            "display": null,
+            "flex": null,
+            "flex_flow": null,
+            "grid_area": null,
+            "grid_auto_columns": null,
+            "grid_auto_flow": null,
+            "grid_auto_rows": null,
+            "grid_column": null,
+            "grid_gap": null,
+            "grid_row": null,
+            "grid_template_areas": null,
+            "grid_template_columns": null,
+            "grid_template_rows": null,
+            "height": null,
+            "justify_content": null,
+            "justify_items": null,
+            "left": null,
+            "margin": null,
+            "max_height": null,
+            "max_width": null,
+            "min_height": null,
+            "min_width": null,
+            "object_fit": null,
+            "object_position": null,
+            "order": null,
+            "overflow": null,
+            "overflow_x": null,
+            "overflow_y": null,
+            "padding": null,
+            "right": null,
+            "top": null,
+            "visibility": null,
+            "width": "20px"
+          }
+        },
+        "3ea8f4b8b4e54b99a48d410fe9659f96": {
+          "model_module": "@jupyter-widgets/controls",
+          "model_name": "ProgressStyleModel",
+          "model_module_version": "1.5.0",
+          "state": {
+            "_model_module": "@jupyter-widgets/controls",
+            "_model_module_version": "1.5.0",
+            "_model_name": "ProgressStyleModel",
+            "_view_count": null,
+            "_view_module": "@jupyter-widgets/base",
+            "_view_module_version": "1.2.0",
+            "_view_name": "StyleView",
+            "bar_color": null,
+            "description_width": ""
+          }
+        },
+        "4a7829162a704c62b40823c359c5c86e": {
+          "model_module": "@jupyter-widgets/base",
+          "model_name": "LayoutModel",
+          "model_module_version": "1.2.0",
+          "state": {
+            "_model_module": "@jupyter-widgets/base",
+            "_model_module_version": "1.2.0",
+            "_model_name": "LayoutModel",
+            "_view_count": null,
+            "_view_module": "@jupyter-widgets/base",
+            "_view_module_version": "1.2.0",
+            "_view_name": "LayoutView",
+            "align_content": null,
+            "align_items": null,
+            "align_self": null,
+            "border": null,
+            "bottom": null,
+            "display": null,
+            "flex": null,
+            "flex_flow": null,
+            "grid_area": null,
+            "grid_auto_columns": null,
+            "grid_auto_flow": null,
+            "grid_auto_rows": null,
+            "grid_column": null,
+            "grid_gap": null,
+            "grid_row": null,
+            "grid_template_areas": null,
+            "grid_template_columns": null,
+            "grid_template_rows": null,
+            "height": null,
+            "justify_content": null,
+            "justify_items": null,
+            "left": null,
+            "margin": null,
+            "max_height": null,
+            "max_width": null,
+            "min_height": null,
+            "min_width": null,
+            "object_fit": null,
+            "object_position": null,
+            "order": null,
+            "overflow": null,
+            "overflow_x": null,
+            "overflow_y": null,
+            "padding": null,
+            "right": null,
+            "top": null,
+            "visibility": null,
+            "width": null
+          }
+        },
+        "c23a9a4b3ab044d6af40f293d7249733": {
+          "model_module": "@jupyter-widgets/controls",
+          "model_name": "DescriptionStyleModel",
+          "model_module_version": "1.5.0",
+          "state": {
+            "_model_module": "@jupyter-widgets/controls",
+            "_model_module_version": "1.5.0",
+            "_model_name": "DescriptionStyleModel",
+            "_view_count": null,
+            "_view_module": "@jupyter-widgets/base",
+            "_view_module_version": "1.2.0",
+            "_view_name": "StyleView",
+            "description_width": ""
+          }
+        },
+        "50ac88eac535450a8f249f52092d2406": {
+          "model_module": "@jupyter-widgets/controls",
+          "model_name": "HBoxModel",
+          "model_module_version": "1.5.0",
+          "state": {
+            "_dom_classes": [],
+            "_model_module": "@jupyter-widgets/controls",
+            "_model_module_version": "1.5.0",
+            "_model_name": "HBoxModel",
+            "_view_count": null,
+            "_view_module": "@jupyter-widgets/controls",
+            "_view_module_version": "1.5.0",
+            "_view_name": "HBoxView",
+            "box_style": "",
+            "children": [
+              "IPY_MODEL_9ab10fe6f69d40de8a90d924288611bd",
+              "IPY_MODEL_94a9a23ebefa45ad9604bcf353844337",
+              "IPY_MODEL_e687b3ff73cb4b42964d46ade98a2b65"
+            ],
+            "layout": "IPY_MODEL_c705ff6baaf5438b93dbc4107b1c4305"
+          }
+        },
+        "9ab10fe6f69d40de8a90d924288611bd": {
+          "model_module": "@jupyter-widgets/controls",
+          "model_name": "HTMLModel",
+          "model_module_version": "1.5.0",
+          "state": {
+            "_dom_classes": [],
+            "_model_module": "@jupyter-widgets/controls",
+            "_model_module_version": "1.5.0",
+            "_model_name": "HTMLModel",
+            "_view_count": null,
+            "_view_module": "@jupyter-widgets/controls",
+            "_view_module_version": "1.5.0",
+            "_view_name": "HTMLView",
+            "description": "",
+            "description_tooltip": null,
+            "layout": "IPY_MODEL_306e3356465c4898a5f2b5ccb29aaa7c",
+            "placeholder": "​",
+            "style": "IPY_MODEL_9ec13363e1f046368343d27f41b08f19",
+            "value": "preprocessor_config.json: 100%"
+          }
+        },
+        "94a9a23ebefa45ad9604bcf353844337": {
+          "model_module": "@jupyter-widgets/controls",
+          "model_name": "FloatProgressModel",
+          "model_module_version": "1.5.0",
+          "state": {
+            "_dom_classes": [],
+            "_model_module": "@jupyter-widgets/controls",
+            "_model_module_version": "1.5.0",
+            "_model_name": "FloatProgressModel",
+            "_view_count": null,
+            "_view_module": "@jupyter-widgets/controls",
+            "_view_module_version": "1.5.0",
+            "_view_name": "ProgressView",
+            "bar_style": "success",
+            "description": "",
+            "description_tooltip": null,
+            "layout": "IPY_MODEL_1350cc445a004aff895cab877697cc3c",
+            "max": 360,
+            "min": 0,
+            "orientation": "horizontal",
+            "style": "IPY_MODEL_48bc89fef2724841b2f182cc6eed35e0",
+            "value": 360
+          }
+        },
+        "e687b3ff73cb4b42964d46ade98a2b65": {
+          "model_module": "@jupyter-widgets/controls",
+          "model_name": "HTMLModel",
+          "model_module_version": "1.5.0",
+          "state": {
+            "_dom_classes": [],
+            "_model_module": "@jupyter-widgets/controls",
+            "_model_module_version": "1.5.0",
+            "_model_name": "HTMLModel",
+            "_view_count": null,
+            "_view_module": "@jupyter-widgets/controls",
+            "_view_module_version": "1.5.0",
+            "_view_name": "HTMLView",
+            "description": "",
+            "description_tooltip": null,
+            "layout": "IPY_MODEL_68ffa713da0a4b01b2c42e0c8a27835e",
+            "placeholder": "​",
+            "style": "IPY_MODEL_a8e4a36558e04810b203b32cdd298ffb",
+            "value": " 360/360 [00:00&lt;00:00, 26.8kB/s]"
+          }
+        },
+        "c705ff6baaf5438b93dbc4107b1c4305": {
+          "model_module": "@jupyter-widgets/base",
+          "model_name": "LayoutModel",
+          "model_module_version": "1.2.0",
+          "state": {
+            "_model_module": "@jupyter-widgets/base",
+            "_model_module_version": "1.2.0",
+            "_model_name": "LayoutModel",
+            "_view_count": null,
+            "_view_module": "@jupyter-widgets/base",
+            "_view_module_version": "1.2.0",
+            "_view_name": "LayoutView",
+            "align_content": null,
+            "align_items": null,
+            "align_self": null,
+            "border": null,
+            "bottom": null,
+            "display": null,
+            "flex": null,
+            "flex_flow": null,
+            "grid_area": null,
+            "grid_auto_columns": null,
+            "grid_auto_flow": null,
+            "grid_auto_rows": null,
+            "grid_column": null,
+            "grid_gap": null,
+            "grid_row": null,
+            "grid_template_areas": null,
+            "grid_template_columns": null,
+            "grid_template_rows": null,
+            "height": null,
+            "justify_content": null,
+            "justify_items": null,
+            "left": null,
+            "margin": null,
+            "max_height": null,
+            "max_width": null,
+            "min_height": null,
+            "min_width": null,
+            "object_fit": null,
+            "object_position": null,
+            "order": null,
+            "overflow": null,
+            "overflow_x": null,
+            "overflow_y": null,
+            "padding": null,
+            "right": null,
+            "top": null,
+            "visibility": null,
+            "width": null
+          }
+        },
+        "306e3356465c4898a5f2b5ccb29aaa7c": {
+          "model_module": "@jupyter-widgets/base",
+          "model_name": "LayoutModel",
+          "model_module_version": "1.2.0",
+          "state": {
+            "_model_module": "@jupyter-widgets/base",
+            "_model_module_version": "1.2.0",
+            "_model_name": "LayoutModel",
+            "_view_count": null,
+            "_view_module": "@jupyter-widgets/base",
+            "_view_module_version": "1.2.0",
+            "_view_name": "LayoutView",
+            "align_content": null,
+            "align_items": null,
+            "align_self": null,
+            "border": null,
+            "bottom": null,
+            "display": null,
+            "flex": null,
+            "flex_flow": null,
+            "grid_area": null,
+            "grid_auto_columns": null,
+            "grid_auto_flow": null,
+            "grid_auto_rows": null,
+            "grid_column": null,
+            "grid_gap": null,
+            "grid_row": null,
+            "grid_template_areas": null,
+            "grid_template_columns": null,
+            "grid_template_rows": null,
+            "height": null,
+            "justify_content": null,
+            "justify_items": null,
+            "left": null,
+            "margin": null,
+            "max_height": null,
+            "max_width": null,
+            "min_height": null,
+            "min_width": null,
+            "object_fit": null,
+            "object_position": null,
+            "order": null,
+            "overflow": null,
+            "overflow_x": null,
+            "overflow_y": null,
+            "padding": null,
+            "right": null,
+            "top": null,
+            "visibility": null,
+            "width": null
+          }
+        },
+        "9ec13363e1f046368343d27f41b08f19": {
+          "model_module": "@jupyter-widgets/controls",
+          "model_name": "DescriptionStyleModel",
+          "model_module_version": "1.5.0",
+          "state": {
+            "_model_module": "@jupyter-widgets/controls",
+            "_model_module_version": "1.5.0",
+            "_model_name": "DescriptionStyleModel",
+            "_view_count": null,
+            "_view_module": "@jupyter-widgets/base",
+            "_view_module_version": "1.2.0",
+            "_view_name": "StyleView",
+            "description_width": ""
+          }
+        },
+        "1350cc445a004aff895cab877697cc3c": {
+          "model_module": "@jupyter-widgets/base",
+          "model_name": "LayoutModel",
+          "model_module_version": "1.2.0",
+          "state": {
+            "_model_module": "@jupyter-widgets/base",
+            "_model_module_version": "1.2.0",
+            "_model_name": "LayoutModel",
+            "_view_count": null,
+            "_view_module": "@jupyter-widgets/base",
+            "_view_module_version": "1.2.0",
+            "_view_name": "LayoutView",
+            "align_content": null,
+            "align_items": null,
+            "align_self": null,
+            "border": null,
+            "bottom": null,
+            "display": null,
+            "flex": null,
+            "flex_flow": null,
+            "grid_area": null,
+            "grid_auto_columns": null,
+            "grid_auto_flow": null,
+            "grid_auto_rows": null,
+            "grid_column": null,
+            "grid_gap": null,
+            "grid_row": null,
+            "grid_template_areas": null,
+            "grid_template_columns": null,
+            "grid_template_rows": null,
+            "height": null,
+            "justify_content": null,
+            "justify_items": null,
+            "left": null,
+            "margin": null,
+            "max_height": null,
+            "max_width": null,
+            "min_height": null,
+            "min_width": null,
+            "object_fit": null,
+            "object_position": null,
+            "order": null,
+            "overflow": null,
+            "overflow_x": null,
+            "overflow_y": null,
+            "padding": null,
+            "right": null,
+            "top": null,
+            "visibility": null,
+            "width": null
+          }
+        },
+        "48bc89fef2724841b2f182cc6eed35e0": {
+          "model_module": "@jupyter-widgets/controls",
+          "model_name": "ProgressStyleModel",
+          "model_module_version": "1.5.0",
+          "state": {
+            "_model_module": "@jupyter-widgets/controls",
+            "_model_module_version": "1.5.0",
+            "_model_name": "ProgressStyleModel",
+            "_view_count": null,
+            "_view_module": "@jupyter-widgets/base",
+            "_view_module_version": "1.2.0",
+            "_view_name": "StyleView",
+            "bar_color": null,
+            "description_width": ""
+          }
+        },
+        "68ffa713da0a4b01b2c42e0c8a27835e": {
+          "model_module": "@jupyter-widgets/base",
+          "model_name": "LayoutModel",
+          "model_module_version": "1.2.0",
+          "state": {
+            "_model_module": "@jupyter-widgets/base",
+            "_model_module_version": "1.2.0",
+            "_model_name": "LayoutModel",
+            "_view_count": null,
+            "_view_module": "@jupyter-widgets/base",
+            "_view_module_version": "1.2.0",
+            "_view_name": "LayoutView",
+            "align_content": null,
+            "align_items": null,
+            "align_self": null,
+            "border": null,
+            "bottom": null,
+            "display": null,
+            "flex": null,
+            "flex_flow": null,
+            "grid_area": null,
+            "grid_auto_columns": null,
+            "grid_auto_flow": null,
+            "grid_auto_rows": null,
+            "grid_column": null,
+            "grid_gap": null,
+            "grid_row": null,
+            "grid_template_areas": null,
+            "grid_template_columns": null,
+            "grid_template_rows": null,
+            "height": null,
+            "justify_content": null,
+            "justify_items": null,
+            "left": null,
+            "margin": null,
+            "max_height": null,
+            "max_width": null,
+            "min_height": null,
+            "min_width": null,
+            "object_fit": null,
+            "object_position": null,
+            "order": null,
+            "overflow": null,
+            "overflow_x": null,
+            "overflow_y": null,
+            "padding": null,
+            "right": null,
+            "top": null,
+            "visibility": null,
+            "width": null
+          }
+        },
+        "a8e4a36558e04810b203b32cdd298ffb": {
+          "model_module": "@jupyter-widgets/controls",
+          "model_name": "DescriptionStyleModel",
+          "model_module_version": "1.5.0",
+          "state": {
+            "_model_module": "@jupyter-widgets/controls",
+            "_model_module_version": "1.5.0",
+            "_model_name": "DescriptionStyleModel",
+            "_view_count": null,
+            "_view_module": "@jupyter-widgets/base",
+            "_view_module_version": "1.2.0",
+            "_view_name": "StyleView",
+            "description_width": ""
+          }
+        },
+        "5b08b3a3aa6b4c0fb19167850be8453d": {
+          "model_module": "@jupyter-widgets/controls",
+          "model_name": "HBoxModel",
+          "model_module_version": "1.5.0",
+          "state": {
+            "_dom_classes": [],
+            "_model_module": "@jupyter-widgets/controls",
+            "_model_module_version": "1.5.0",
+            "_model_name": "HBoxModel",
+            "_view_count": null,
+            "_view_module": "@jupyter-widgets/controls",
+            "_view_module_version": "1.5.0",
+            "_view_name": "HBoxView",
+            "box_style": "",
+            "children": [
+              "IPY_MODEL_884ec6a31fdf410e92c5ea89c0e1419b",
+              "IPY_MODEL_3e99d2ab170c45fe844cb81fed3ee1d7",
+              "IPY_MODEL_4e2e16fb3c5e41429a3660f65c488d8f"
+            ],
+            "layout": "IPY_MODEL_058a4595e6c042bfa0df510046f1109d"
+          }
+        },
+        "884ec6a31fdf410e92c5ea89c0e1419b": {
+          "model_module": "@jupyter-widgets/controls",
+          "model_name": "HTMLModel",
+          "model_module_version": "1.5.0",
+          "state": {
+            "_dom_classes": [],
+            "_model_module": "@jupyter-widgets/controls",
+            "_model_module_version": "1.5.0",
+            "_model_name": "HTMLModel",
+            "_view_count": null,
+            "_view_module": "@jupyter-widgets/controls",
+            "_view_module_version": "1.5.0",
+            "_view_name": "HTMLView",
+            "description": "",
+            "description_tooltip": null,
+            "layout": "IPY_MODEL_5c2b36b95d60431a8bbf553e408f4f51",
+            "placeholder": "​",
+            "style": "IPY_MODEL_a695abbe11304923bb22390b6b8d7af2",
+            "value": "README.md: "
+          }
+        },
+        "3e99d2ab170c45fe844cb81fed3ee1d7": {
+          "model_module": "@jupyter-widgets/controls",
+          "model_name": "FloatProgressModel",
+          "model_module_version": "1.5.0",
+          "state": {
+            "_dom_classes": [],
+            "_model_module": "@jupyter-widgets/controls",
+            "_model_module_version": "1.5.0",
+            "_model_name": "FloatProgressModel",
+            "_view_count": null,
+            "_view_module": "@jupyter-widgets/controls",
+            "_view_module_version": "1.5.0",
+            "_view_name": "ProgressView",
+            "bar_style": "success",
+            "description": "",
+            "description_tooltip": null,
+            "layout": "IPY_MODEL_47885c9ca7c943d18b0f6529ca6a8238",
+            "max": 1,
+            "min": 0,
+            "orientation": "horizontal",
+            "style": "IPY_MODEL_772eb2290aef43e4947878efd7794ce7",
+            "value": 1
+          }
+        },
+        "4e2e16fb3c5e41429a3660f65c488d8f": {
+          "model_module": "@jupyter-widgets/controls",
+          "model_name": "HTMLModel",
+          "model_module_version": "1.5.0",
+          "state": {
+            "_dom_classes": [],
+            "_model_module": "@jupyter-widgets/controls",
+            "_model_module_version": "1.5.0",
+            "_model_name": "HTMLModel",
+            "_view_count": null,
+            "_view_module": "@jupyter-widgets/controls",
+            "_view_module_version": "1.5.0",
+            "_view_name": "HTMLView",
+            "description": "",
+            "description_tooltip": null,
+            "layout": "IPY_MODEL_53f6ef4e80384e8aa06628a35c354e8f",
+            "placeholder": "​",
+            "style": "IPY_MODEL_83077e8e24ef484ab79eb4eefd441c80",
+            "value": " 10.2k/? [00:00&lt;00:00, 1.07MB/s]"
+          }
+        },
+        "058a4595e6c042bfa0df510046f1109d": {
+          "model_module": "@jupyter-widgets/base",
+          "model_name": "LayoutModel",
+          "model_module_version": "1.2.0",
+          "state": {
+            "_model_module": "@jupyter-widgets/base",
+            "_model_module_version": "1.2.0",
+            "_model_name": "LayoutModel",
+            "_view_count": null,
+            "_view_module": "@jupyter-widgets/base",
+            "_view_module_version": "1.2.0",
+            "_view_name": "LayoutView",
+            "align_content": null,
+            "align_items": null,
+            "align_self": null,
+            "border": null,
+            "bottom": null,
+            "display": null,
+            "flex": null,
+            "flex_flow": null,
+            "grid_area": null,
+            "grid_auto_columns": null,
+            "grid_auto_flow": null,
+            "grid_auto_rows": null,
+            "grid_column": null,
+            "grid_gap": null,
+            "grid_row": null,
+            "grid_template_areas": null,
+            "grid_template_columns": null,
+            "grid_template_rows": null,
+            "height": null,
+            "justify_content": null,
+            "justify_items": null,
+            "left": null,
+            "margin": null,
+            "max_height": null,
+            "max_width": null,
+            "min_height": null,
+            "min_width": null,
+            "object_fit": null,
+            "object_position": null,
+            "order": null,
+            "overflow": null,
+            "overflow_x": null,
+            "overflow_y": null,
+            "padding": null,
+            "right": null,
+            "top": null,
+            "visibility": null,
+            "width": null
+          }
+        },
+        "5c2b36b95d60431a8bbf553e408f4f51": {
+          "model_module": "@jupyter-widgets/base",
+          "model_name": "LayoutModel",
+          "model_module_version": "1.2.0",
+          "state": {
+            "_model_module": "@jupyter-widgets/base",
+            "_model_module_version": "1.2.0",
+            "_model_name": "LayoutModel",
+            "_view_count": null,
+            "_view_module": "@jupyter-widgets/base",
+            "_view_module_version": "1.2.0",
+            "_view_name": "LayoutView",
+            "align_content": null,
+            "align_items": null,
+            "align_self": null,
+            "border": null,
+            "bottom": null,
+            "display": null,
+            "flex": null,
+            "flex_flow": null,
+            "grid_area": null,
+            "grid_auto_columns": null,
+            "grid_auto_flow": null,
+            "grid_auto_rows": null,
+            "grid_column": null,
+            "grid_gap": null,
+            "grid_row": null,
+            "grid_template_areas": null,
+            "grid_template_columns": null,
+            "grid_template_rows": null,
+            "height": null,
+            "justify_content": null,
+            "justify_items": null,
+            "left": null,
+            "margin": null,
+            "max_height": null,
+            "max_width": null,
+            "min_height": null,
+            "min_width": null,
+            "object_fit": null,
+            "object_position": null,
+            "order": null,
+            "overflow": null,
+            "overflow_x": null,
+            "overflow_y": null,
+            "padding": null,
+            "right": null,
+            "top": null,
+            "visibility": null,
+            "width": null
+          }
+        },
+        "a695abbe11304923bb22390b6b8d7af2": {
+          "model_module": "@jupyter-widgets/controls",
+          "model_name": "DescriptionStyleModel",
+          "model_module_version": "1.5.0",
+          "state": {
+            "_model_module": "@jupyter-widgets/controls",
+            "_model_module_version": "1.5.0",
+            "_model_name": "DescriptionStyleModel",
+            "_view_count": null,
+            "_view_module": "@jupyter-widgets/base",
+            "_view_module_version": "1.2.0",
+            "_view_name": "StyleView",
+            "description_width": ""
+          }
+        },
+        "47885c9ca7c943d18b0f6529ca6a8238": {
+          "model_module": "@jupyter-widgets/base",
+          "model_name": "LayoutModel",
+          "model_module_version": "1.2.0",
+          "state": {
+            "_model_module": "@jupyter-widgets/base",
+            "_model_module_version": "1.2.0",
+            "_model_name": "LayoutModel",
+            "_view_count": null,
+            "_view_module": "@jupyter-widgets/base",
+            "_view_module_version": "1.2.0",
+            "_view_name": "LayoutView",
+            "align_content": null,
+            "align_items": null,
+            "align_self": null,
+            "border": null,
+            "bottom": null,
+            "display": null,
+            "flex": null,
+            "flex_flow": null,
+            "grid_area": null,
+            "grid_auto_columns": null,
+            "grid_auto_flow": null,
+            "grid_auto_rows": null,
+            "grid_column": null,
+            "grid_gap": null,
+            "grid_row": null,
+            "grid_template_areas": null,
+            "grid_template_columns": null,
+            "grid_template_rows": null,
+            "height": null,
+            "justify_content": null,
+            "justify_items": null,
+            "left": null,
+            "margin": null,
+            "max_height": null,
+            "max_width": null,
+            "min_height": null,
+            "min_width": null,
+            "object_fit": null,
+            "object_position": null,
+            "order": null,
+            "overflow": null,
+            "overflow_x": null,
+            "overflow_y": null,
+            "padding": null,
+            "right": null,
+            "top": null,
+            "visibility": null,
+            "width": "20px"
+          }
+        },
+        "772eb2290aef43e4947878efd7794ce7": {
+          "model_module": "@jupyter-widgets/controls",
+          "model_name": "ProgressStyleModel",
+          "model_module_version": "1.5.0",
+          "state": {
+            "_model_module": "@jupyter-widgets/controls",
+            "_model_module_version": "1.5.0",
+            "_model_name": "ProgressStyleModel",
+            "_view_count": null,
+            "_view_module": "@jupyter-widgets/base",
+            "_view_module_version": "1.2.0",
+            "_view_name": "StyleView",
+            "bar_color": null,
+            "description_width": ""
+          }
+        },
+        "53f6ef4e80384e8aa06628a35c354e8f": {
+          "model_module": "@jupyter-widgets/base",
+          "model_name": "LayoutModel",
+          "model_module_version": "1.2.0",
+          "state": {
+            "_model_module": "@jupyter-widgets/base",
+            "_model_module_version": "1.2.0",
+            "_model_name": "LayoutModel",
+            "_view_count": null,
+            "_view_module": "@jupyter-widgets/base",
+            "_view_module_version": "1.2.0",
+            "_view_name": "LayoutView",
+            "align_content": null,
+            "align_items": null,
+            "align_self": null,
+            "border": null,
+            "bottom": null,
+            "display": null,
+            "flex": null,
+            "flex_flow": null,
+            "grid_area": null,
+            "grid_auto_columns": null,
+            "grid_auto_flow": null,
+            "grid_auto_rows": null,
+            "grid_column": null,
+            "grid_gap": null,
+            "grid_row": null,
+            "grid_template_areas": null,
+            "grid_template_columns": null,
+            "grid_template_rows": null,
+            "height": null,
+            "justify_content": null,
+            "justify_items": null,
+            "left": null,
+            "margin": null,
+            "max_height": null,
+            "max_width": null,
+            "min_height": null,
+            "min_width": null,
+            "object_fit": null,
+            "object_position": null,
+            "order": null,
+            "overflow": null,
+            "overflow_x": null,
+            "overflow_y": null,
+            "padding": null,
+            "right": null,
+            "top": null,
+            "visibility": null,
+            "width": null
+          }
+        },
+        "83077e8e24ef484ab79eb4eefd441c80": {
+          "model_module": "@jupyter-widgets/controls",
+          "model_name": "DescriptionStyleModel",
+          "model_module_version": "1.5.0",
+          "state": {
+            "_model_module": "@jupyter-widgets/controls",
+            "_model_module_version": "1.5.0",
+            "_model_name": "DescriptionStyleModel",
+            "_view_count": null,
+            "_view_module": "@jupyter-widgets/base",
+            "_view_module_version": "1.2.0",
+            "_view_name": "StyleView",
+            "description_width": ""
+          }
+        },
+        "9c57910a71314b5ab996439e5130adfe": {
+          "model_module": "@jupyter-widgets/controls",
+          "model_name": "VBoxModel",
+          "model_module_version": "1.5.0",
+          "state": {
+            "_dom_classes": [],
+            "_model_module": "@jupyter-widgets/controls",
+            "_model_module_version": "1.5.0",
+            "_model_name": "VBoxModel",
+            "_view_count": null,
+            "_view_module": "@jupyter-widgets/controls",
+            "_view_module_version": "1.5.0",
+            "_view_name": "VBoxView",
+            "box_style": "",
+            "children": [],
+            "layout": "IPY_MODEL_8f96189e4dd146679c62ae79e1ecc4b1"
+          }
+        },
+        "caf8f6f8920d4f01aa2af4f9e6fcb3dc": {
+          "model_module": "@jupyter-widgets/controls",
+          "model_name": "HTMLModel",
+          "model_module_version": "1.5.0",
+          "state": {
+            "_dom_classes": [],
+            "_model_module": "@jupyter-widgets/controls",
+            "_model_module_version": "1.5.0",
+            "_model_name": "HTMLModel",
+            "_view_count": null,
+            "_view_module": "@jupyter-widgets/controls",
+            "_view_module_version": "1.5.0",
+            "_view_name": "HTMLView",
+            "description": "",
+            "description_tooltip": null,
+            "layout": "IPY_MODEL_687266971acc4ab1b03813bc8a3b8e76",
+            "placeholder": "​",
+            "style": "IPY_MODEL_4bde1aea8d194644b4e9021f09503800",
+            "value": "<center> <img\nsrc=https://huggingface.co/front/assets/huggingface_logo-noborder.svg\nalt='Hugging Face'> <br> Copy a token from <a\nhref=\"https://huggingface.co/settings/tokens\" target=\"_blank\">your Hugging Face\ntokens page</a> and paste it below. <br> Immediately click login after copying\nyour token or it might be stored in plain text in this notebook file. </center>"
+          }
+        },
+        "afaace7433ee4538844cd73480589dda": {
+          "model_module": "@jupyter-widgets/controls",
+          "model_name": "PasswordModel",
+          "model_module_version": "1.5.0",
+          "state": {
+            "_dom_classes": [],
+            "_model_module": "@jupyter-widgets/controls",
+            "_model_module_version": "1.5.0",
+            "_model_name": "PasswordModel",
+            "_view_count": null,
+            "_view_module": "@jupyter-widgets/controls",
+            "_view_module_version": "1.5.0",
+            "_view_name": "PasswordView",
+            "continuous_update": true,
+            "description": "Token:",
+            "description_tooltip": null,
+            "disabled": false,
+            "layout": "IPY_MODEL_fa49258b8fe3441a82c22e9b60a955df",
+            "placeholder": "​",
+            "style": "IPY_MODEL_40db57ec16eb4e4ba4cd506abaf4069b",
+            "value": ""
+          }
+        },
+        "70fadafd4db04a0783e329362ba8b87c": {
+          "model_module": "@jupyter-widgets/controls",
+          "model_name": "CheckboxModel",
+          "model_module_version": "1.5.0",
+          "state": {
+            "_dom_classes": [],
+            "_model_module": "@jupyter-widgets/controls",
+            "_model_module_version": "1.5.0",
+            "_model_name": "CheckboxModel",
+            "_view_count": null,
+            "_view_module": "@jupyter-widgets/controls",
+            "_view_module_version": "1.5.0",
+            "_view_name": "CheckboxView",
+            "description": "Add token as git credential?",
+            "description_tooltip": null,
+            "disabled": false,
+            "indent": true,
+            "layout": "IPY_MODEL_b17a44ac600746f6a1825cbb0cc063be",
+            "style": "IPY_MODEL_683c557013424a18a85422835b75a8e3",
+            "value": true
+          }
+        },
+        "dfcc460d6f424736be2fb25530b09185": {
+          "model_module": "@jupyter-widgets/controls",
+          "model_name": "ButtonModel",
+          "model_module_version": "1.5.0",
+          "state": {
+            "_dom_classes": [],
+            "_model_module": "@jupyter-widgets/controls",
+            "_model_module_version": "1.5.0",
+            "_model_name": "ButtonModel",
+            "_view_count": null,
+            "_view_module": "@jupyter-widgets/controls",
+            "_view_module_version": "1.5.0",
+            "_view_name": "ButtonView",
+            "button_style": "",
+            "description": "Login",
+            "disabled": false,
+            "icon": "",
+            "layout": "IPY_MODEL_2e5bc5e6f4ef48b0b00424049cec8a09",
+            "style": "IPY_MODEL_b13735cb5c4249a08d8c7cfa654ba106",
+            "tooltip": ""
+          }
+        },
+        "c004c599ecc943e18ee873d55ee630ea": {
+          "model_module": "@jupyter-widgets/controls",
+          "model_name": "HTMLModel",
+          "model_module_version": "1.5.0",
+          "state": {
+            "_dom_classes": [],
+            "_model_module": "@jupyter-widgets/controls",
+            "_model_module_version": "1.5.0",
+            "_model_name": "HTMLModel",
+            "_view_count": null,
+            "_view_module": "@jupyter-widgets/controls",
+            "_view_module_version": "1.5.0",
+            "_view_name": "HTMLView",
+            "description": "",
+            "description_tooltip": null,
+            "layout": "IPY_MODEL_161a12ab57aa41638a846a2238bf9642",
+            "placeholder": "​",
+            "style": "IPY_MODEL_0332ed76bfde46c49c9879f36e75f6f3",
+            "value": "\n<b>Pro Tip:</b> If you don't already have one, you can create a dedicated\n'notebooks' token with 'write' access, that you can then easily reuse for all\nnotebooks. </center>"
+          }
+        },
+        "8f96189e4dd146679c62ae79e1ecc4b1": {
+          "model_module": "@jupyter-widgets/base",
+          "model_name": "LayoutModel",
+          "model_module_version": "1.2.0",
+          "state": {
+            "_model_module": "@jupyter-widgets/base",
+            "_model_module_version": "1.2.0",
+            "_model_name": "LayoutModel",
+            "_view_count": null,
+            "_view_module": "@jupyter-widgets/base",
+            "_view_module_version": "1.2.0",
+            "_view_name": "LayoutView",
+            "align_content": null,
+            "align_items": "center",
+            "align_self": null,
+            "border": null,
+            "bottom": null,
+            "display": "flex",
+            "flex": null,
+            "flex_flow": "column",
+            "grid_area": null,
+            "grid_auto_columns": null,
+            "grid_auto_flow": null,
+            "grid_auto_rows": null,
+            "grid_column": null,
+            "grid_gap": null,
+            "grid_row": null,
+            "grid_template_areas": null,
+            "grid_template_columns": null,
+            "grid_template_rows": null,
+            "height": null,
+            "justify_content": null,
+            "justify_items": null,
+            "left": null,
+            "margin": null,
+            "max_height": null,
+            "max_width": null,
+            "min_height": null,
+            "min_width": null,
+            "object_fit": null,
+            "object_position": null,
+            "order": null,
+            "overflow": null,
+            "overflow_x": null,
+            "overflow_y": null,
+            "padding": null,
+            "right": null,
+            "top": null,
+            "visibility": null,
+            "width": "50%"
+          }
+        },
+        "687266971acc4ab1b03813bc8a3b8e76": {
+          "model_module": "@jupyter-widgets/base",
+          "model_name": "LayoutModel",
+          "model_module_version": "1.2.0",
+          "state": {
+            "_model_module": "@jupyter-widgets/base",
+            "_model_module_version": "1.2.0",
+            "_model_name": "LayoutModel",
+            "_view_count": null,
+            "_view_module": "@jupyter-widgets/base",
+            "_view_module_version": "1.2.0",
+            "_view_name": "LayoutView",
+            "align_content": null,
+            "align_items": null,
+            "align_self": null,
+            "border": null,
+            "bottom": null,
+            "display": null,
+            "flex": null,
+            "flex_flow": null,
+            "grid_area": null,
+            "grid_auto_columns": null,
+            "grid_auto_flow": null,
+            "grid_auto_rows": null,
+            "grid_column": null,
+            "grid_gap": null,
+            "grid_row": null,
+            "grid_template_areas": null,
+            "grid_template_columns": null,
+            "grid_template_rows": null,
+            "height": null,
+            "justify_content": null,
+            "justify_items": null,
+            "left": null,
+            "margin": null,
+            "max_height": null,
+            "max_width": null,
+            "min_height": null,
+            "min_width": null,
+            "object_fit": null,
+            "object_position": null,
+            "order": null,
+            "overflow": null,
+            "overflow_x": null,
+            "overflow_y": null,
+            "padding": null,
+            "right": null,
+            "top": null,
+            "visibility": null,
+            "width": null
+          }
+        },
+        "4bde1aea8d194644b4e9021f09503800": {
+          "model_module": "@jupyter-widgets/controls",
+          "model_name": "DescriptionStyleModel",
+          "model_module_version": "1.5.0",
+          "state": {
+            "_model_module": "@jupyter-widgets/controls",
+            "_model_module_version": "1.5.0",
+            "_model_name": "DescriptionStyleModel",
+            "_view_count": null,
+            "_view_module": "@jupyter-widgets/base",
+            "_view_module_version": "1.2.0",
+            "_view_name": "StyleView",
+            "description_width": ""
+          }
+        },
+        "fa49258b8fe3441a82c22e9b60a955df": {
+          "model_module": "@jupyter-widgets/base",
+          "model_name": "LayoutModel",
+          "model_module_version": "1.2.0",
+          "state": {
+            "_model_module": "@jupyter-widgets/base",
+            "_model_module_version": "1.2.0",
+            "_model_name": "LayoutModel",
+            "_view_count": null,
+            "_view_module": "@jupyter-widgets/base",
+            "_view_module_version": "1.2.0",
+            "_view_name": "LayoutView",
+            "align_content": null,
+            "align_items": null,
+            "align_self": null,
+            "border": null,
+            "bottom": null,
+            "display": null,
+            "flex": null,
+            "flex_flow": null,
+            "grid_area": null,
+            "grid_auto_columns": null,
+            "grid_auto_flow": null,
+            "grid_auto_rows": null,
+            "grid_column": null,
+            "grid_gap": null,
+            "grid_row": null,
+            "grid_template_areas": null,
+            "grid_template_columns": null,
+            "grid_template_rows": null,
+            "height": null,
+            "justify_content": null,
+            "justify_items": null,
+            "left": null,
+            "margin": null,
+            "max_height": null,
+            "max_width": null,
+            "min_height": null,
+            "min_width": null,
+            "object_fit": null,
+            "object_position": null,
+            "order": null,
+            "overflow": null,
+            "overflow_x": null,
+            "overflow_y": null,
+            "padding": null,
+            "right": null,
+            "top": null,
+            "visibility": null,
+            "width": null
+          }
+        },
+        "40db57ec16eb4e4ba4cd506abaf4069b": {
+          "model_module": "@jupyter-widgets/controls",
+          "model_name": "DescriptionStyleModel",
+          "model_module_version": "1.5.0",
+          "state": {
+            "_model_module": "@jupyter-widgets/controls",
+            "_model_module_version": "1.5.0",
+            "_model_name": "DescriptionStyleModel",
+            "_view_count": null,
+            "_view_module": "@jupyter-widgets/base",
+            "_view_module_version": "1.2.0",
+            "_view_name": "StyleView",
+            "description_width": ""
+          }
+        },
+        "b17a44ac600746f6a1825cbb0cc063be": {
+          "model_module": "@jupyter-widgets/base",
+          "model_name": "LayoutModel",
+          "model_module_version": "1.2.0",
+          "state": {
+            "_model_module": "@jupyter-widgets/base",
+            "_model_module_version": "1.2.0",
+            "_model_name": "LayoutModel",
+            "_view_count": null,
+            "_view_module": "@jupyter-widgets/base",
+            "_view_module_version": "1.2.0",
+            "_view_name": "LayoutView",
+            "align_content": null,
+            "align_items": null,
+            "align_self": null,
+            "border": null,
+            "bottom": null,
+            "display": null,
+            "flex": null,
+            "flex_flow": null,
+            "grid_area": null,
+            "grid_auto_columns": null,
+            "grid_auto_flow": null,
+            "grid_auto_rows": null,
+            "grid_column": null,
+            "grid_gap": null,
+            "grid_row": null,
+            "grid_template_areas": null,
+            "grid_template_columns": null,
+            "grid_template_rows": null,
+            "height": null,
+            "justify_content": null,
+            "justify_items": null,
+            "left": null,
+            "margin": null,
+            "max_height": null,
+            "max_width": null,
+            "min_height": null,
+            "min_width": null,
+            "object_fit": null,
+            "object_position": null,
+            "order": null,
+            "overflow": null,
+            "overflow_x": null,
+            "overflow_y": null,
+            "padding": null,
+            "right": null,
+            "top": null,
+            "visibility": null,
+            "width": null
+          }
+        },
+        "683c557013424a18a85422835b75a8e3": {
+          "model_module": "@jupyter-widgets/controls",
+          "model_name": "DescriptionStyleModel",
+          "model_module_version": "1.5.0",
+          "state": {
+            "_model_module": "@jupyter-widgets/controls",
+            "_model_module_version": "1.5.0",
+            "_model_name": "DescriptionStyleModel",
+            "_view_count": null,
+            "_view_module": "@jupyter-widgets/base",
+            "_view_module_version": "1.2.0",
+            "_view_name": "StyleView",
+            "description_width": ""
+          }
+        },
+        "2e5bc5e6f4ef48b0b00424049cec8a09": {
+          "model_module": "@jupyter-widgets/base",
+          "model_name": "LayoutModel",
+          "model_module_version": "1.2.0",
+          "state": {
+            "_model_module": "@jupyter-widgets/base",
+            "_model_module_version": "1.2.0",
+            "_model_name": "LayoutModel",
+            "_view_count": null,
+            "_view_module": "@jupyter-widgets/base",
+            "_view_module_version": "1.2.0",
+            "_view_name": "LayoutView",
+            "align_content": null,
+            "align_items": null,
+            "align_self": null,
+            "border": null,
+            "bottom": null,
+            "display": null,
+            "flex": null,
+            "flex_flow": null,
+            "grid_area": null,
+            "grid_auto_columns": null,
+            "grid_auto_flow": null,
+            "grid_auto_rows": null,
+            "grid_column": null,
+            "grid_gap": null,
+            "grid_row": null,
+            "grid_template_areas": null,
+            "grid_template_columns": null,
+            "grid_template_rows": null,
+            "height": null,
+            "justify_content": null,
+            "justify_items": null,
+            "left": null,
+            "margin": null,
+            "max_height": null,
+            "max_width": null,
+            "min_height": null,
+            "min_width": null,
+            "object_fit": null,
+            "object_position": null,
+            "order": null,
+            "overflow": null,
+            "overflow_x": null,
+            "overflow_y": null,
+            "padding": null,
+            "right": null,
+            "top": null,
+            "visibility": null,
+            "width": null
+          }
+        },
+        "b13735cb5c4249a08d8c7cfa654ba106": {
+          "model_module": "@jupyter-widgets/controls",
+          "model_name": "ButtonStyleModel",
+          "model_module_version": "1.5.0",
+          "state": {
+            "_model_module": "@jupyter-widgets/controls",
+            "_model_module_version": "1.5.0",
+            "_model_name": "ButtonStyleModel",
+            "_view_count": null,
+            "_view_module": "@jupyter-widgets/base",
+            "_view_module_version": "1.2.0",
+            "_view_name": "StyleView",
+            "button_color": null,
+            "font_weight": ""
+          }
+        },
+        "161a12ab57aa41638a846a2238bf9642": {
+          "model_module": "@jupyter-widgets/base",
+          "model_name": "LayoutModel",
+          "model_module_version": "1.2.0",
+          "state": {
+            "_model_module": "@jupyter-widgets/base",
+            "_model_module_version": "1.2.0",
+            "_model_name": "LayoutModel",
+            "_view_count": null,
+            "_view_module": "@jupyter-widgets/base",
+            "_view_module_version": "1.2.0",
+            "_view_name": "LayoutView",
+            "align_content": null,
+            "align_items": null,
+            "align_self": null,
+            "border": null,
+            "bottom": null,
+            "display": null,
+            "flex": null,
+            "flex_flow": null,
+            "grid_area": null,
+            "grid_auto_columns": null,
+            "grid_auto_flow": null,
+            "grid_auto_rows": null,
+            "grid_column": null,
+            "grid_gap": null,
+            "grid_row": null,
+            "grid_template_areas": null,
+            "grid_template_columns": null,
+            "grid_template_rows": null,
+            "height": null,
+            "justify_content": null,
+            "justify_items": null,
+            "left": null,
+            "margin": null,
+            "max_height": null,
+            "max_width": null,
+            "min_height": null,
+            "min_width": null,
+            "object_fit": null,
+            "object_position": null,
+            "order": null,
+            "overflow": null,
+            "overflow_x": null,
+            "overflow_y": null,
+            "padding": null,
+            "right": null,
+            "top": null,
+            "visibility": null,
+            "width": null
+          }
+        },
+        "0332ed76bfde46c49c9879f36e75f6f3": {
+          "model_module": "@jupyter-widgets/controls",
+          "model_name": "DescriptionStyleModel",
+          "model_module_version": "1.5.0",
+          "state": {
+            "_model_module": "@jupyter-widgets/controls",
+            "_model_module_version": "1.5.0",
+            "_model_name": "DescriptionStyleModel",
+            "_view_count": null,
+            "_view_module": "@jupyter-widgets/base",
+            "_view_module_version": "1.2.0",
+            "_view_name": "StyleView",
+            "description_width": ""
+          }
+        },
+        "2d2751bc81ca4bd5bef927b23a99ee93": {
+          "model_module": "@jupyter-widgets/controls",
+          "model_name": "LabelModel",
+          "model_module_version": "1.5.0",
+          "state": {
+            "_dom_classes": [],
+            "_model_module": "@jupyter-widgets/controls",
+            "_model_module_version": "1.5.0",
+            "_model_name": "LabelModel",
+            "_view_count": null,
+            "_view_module": "@jupyter-widgets/controls",
+            "_view_module_version": "1.5.0",
+            "_view_name": "LabelView",
+            "description": "",
+            "description_tooltip": null,
+            "layout": "IPY_MODEL_8deb0245c1164c0192ac324a38f32971",
+            "placeholder": "​",
+            "style": "IPY_MODEL_054055b8c233424d82c435f0d453fa56",
+            "value": "Connecting..."
+          }
+        },
+        "8deb0245c1164c0192ac324a38f32971": {
+          "model_module": "@jupyter-widgets/base",
+          "model_name": "LayoutModel",
+          "model_module_version": "1.2.0",
+          "state": {
+            "_model_module": "@jupyter-widgets/base",
+            "_model_module_version": "1.2.0",
+            "_model_name": "LayoutModel",
+            "_view_count": null,
+            "_view_module": "@jupyter-widgets/base",
+            "_view_module_version": "1.2.0",
+            "_view_name": "LayoutView",
+            "align_content": null,
+            "align_items": null,
+            "align_self": null,
+            "border": null,
+            "bottom": null,
+            "display": null,
+            "flex": null,
+            "flex_flow": null,
+            "grid_area": null,
+            "grid_auto_columns": null,
+            "grid_auto_flow": null,
+            "grid_auto_rows": null,
+            "grid_column": null,
+            "grid_gap": null,
+            "grid_row": null,
+            "grid_template_areas": null,
+            "grid_template_columns": null,
+            "grid_template_rows": null,
+            "height": null,
+            "justify_content": null,
+            "justify_items": null,
+            "left": null,
+            "margin": null,
+            "max_height": null,
+            "max_width": null,
+            "min_height": null,
+            "min_width": null,
+            "object_fit": null,
+            "object_position": null,
+            "order": null,
+            "overflow": null,
+            "overflow_x": null,
+            "overflow_y": null,
+            "padding": null,
+            "right": null,
+            "top": null,
+            "visibility": null,
+            "width": null
+          }
+        },
+        "054055b8c233424d82c435f0d453fa56": {
+          "model_module": "@jupyter-widgets/controls",
+          "model_name": "DescriptionStyleModel",
+          "model_module_version": "1.5.0",
+          "state": {
+            "_model_module": "@jupyter-widgets/controls",
+            "_model_module_version": "1.5.0",
+            "_model_name": "DescriptionStyleModel",
+            "_view_count": null,
+            "_view_module": "@jupyter-widgets/base",
+            "_view_module_version": "1.2.0",
+            "_view_name": "StyleView",
+            "description_width": ""
+          }
+        },
+        "a6612ce289c246668325ec1c50b01a3e": {
+          "model_module": "@jupyter-widgets/controls",
+          "model_name": "HBoxModel",
+          "model_module_version": "1.5.0",
+          "state": {
+            "_dom_classes": [],
+            "_model_module": "@jupyter-widgets/controls",
+            "_model_module_version": "1.5.0",
+            "_model_name": "HBoxModel",
+            "_view_count": null,
+            "_view_module": "@jupyter-widgets/controls",
+            "_view_module_version": "1.5.0",
+            "_view_name": "HBoxView",
+            "box_style": "",
+            "children": [
+              "IPY_MODEL_c85a7873e70f4345a071cbe453bbe801",
+              "IPY_MODEL_045a67c7b0cf467b8066370dd9e7ffef",
+              "IPY_MODEL_8c84ea605447464f84e6b51f0790461b"
+            ],
+            "layout": "IPY_MODEL_9486fe93c26c4ab18b26c6c06d87c9f0"
+          }
+        },
+        "c85a7873e70f4345a071cbe453bbe801": {
+          "model_module": "@jupyter-widgets/controls",
+          "model_name": "HTMLModel",
+          "model_module_version": "1.5.0",
+          "state": {
+            "_dom_classes": [],
+            "_model_module": "@jupyter-widgets/controls",
+            "_model_module_version": "1.5.0",
+            "_model_name": "HTMLModel",
+            "_view_count": null,
+            "_view_module": "@jupyter-widgets/controls",
+            "_view_module_version": "1.5.0",
+            "_view_name": "HTMLView",
+            "description": "",
+            "description_tooltip": null,
+            "layout": "IPY_MODEL_405497428efc4015932fc2e76ceb110f",
+            "placeholder": "​",
+            "style": "IPY_MODEL_a8d7ef0c5f18419983e1c3077deb4154",
+            "value": "Fetching 6 files: 100%"
+          }
+        },
+        "045a67c7b0cf467b8066370dd9e7ffef": {
+          "model_module": "@jupyter-widgets/controls",
+          "model_name": "FloatProgressModel",
+          "model_module_version": "1.5.0",
+          "state": {
+            "_dom_classes": [],
+            "_model_module": "@jupyter-widgets/controls",
+            "_model_module_version": "1.5.0",
+            "_model_name": "FloatProgressModel",
+            "_view_count": null,
+            "_view_module": "@jupyter-widgets/controls",
+            "_view_module_version": "1.5.0",
+            "_view_name": "ProgressView",
+            "bar_style": "success",
+            "description": "",
+            "description_tooltip": null,
+            "layout": "IPY_MODEL_04a4242afe6c4fb19aed5282d9110df2",
+            "max": 6,
+            "min": 0,
+            "orientation": "horizontal",
+            "style": "IPY_MODEL_27adab0a48c24c3ba388c7ed0cbc8073",
+            "value": 6
+          }
+        },
+        "8c84ea605447464f84e6b51f0790461b": {
+          "model_module": "@jupyter-widgets/controls",
+          "model_name": "HTMLModel",
+          "model_module_version": "1.5.0",
+          "state": {
+            "_dom_classes": [],
+            "_model_module": "@jupyter-widgets/controls",
+            "_model_module_version": "1.5.0",
+            "_model_name": "HTMLModel",
+            "_view_count": null,
+            "_view_module": "@jupyter-widgets/controls",
+            "_view_module_version": "1.5.0",
+            "_view_name": "HTMLView",
+            "description": "",
+            "description_tooltip": null,
+            "layout": "IPY_MODEL_8987b61805774e3fbc660b1ddf477fff",
+            "placeholder": "​",
+            "style": "IPY_MODEL_9f543c4a97314ebd836f0f8ce3f525cb",
+            "value": " 6/6 [00:00&lt;00:00, 391.95it/s]"
+          }
+        },
+        "9486fe93c26c4ab18b26c6c06d87c9f0": {
+          "model_module": "@jupyter-widgets/base",
+          "model_name": "LayoutModel",
+          "model_module_version": "1.2.0",
+          "state": {
+            "_model_module": "@jupyter-widgets/base",
+            "_model_module_version": "1.2.0",
+            "_model_name": "LayoutModel",
+            "_view_count": null,
+            "_view_module": "@jupyter-widgets/base",
+            "_view_module_version": "1.2.0",
+            "_view_name": "LayoutView",
+            "align_content": null,
+            "align_items": null,
+            "align_self": null,
+            "border": null,
+            "bottom": null,
+            "display": null,
+            "flex": null,
+            "flex_flow": null,
+            "grid_area": null,
+            "grid_auto_columns": null,
+            "grid_auto_flow": null,
+            "grid_auto_rows": null,
+            "grid_column": null,
+            "grid_gap": null,
+            "grid_row": null,
+            "grid_template_areas": null,
+            "grid_template_columns": null,
+            "grid_template_rows": null,
+            "height": null,
+            "justify_content": null,
+            "justify_items": null,
+            "left": null,
+            "margin": null,
+            "max_height": null,
+            "max_width": null,
+            "min_height": null,
+            "min_width": null,
+            "object_fit": null,
+            "object_position": null,
+            "order": null,
+            "overflow": null,
+            "overflow_x": null,
+            "overflow_y": null,
+            "padding": null,
+            "right": null,
+            "top": null,
+            "visibility": null,
+            "width": null
+          }
+        },
+        "405497428efc4015932fc2e76ceb110f": {
+          "model_module": "@jupyter-widgets/base",
+          "model_name": "LayoutModel",
+          "model_module_version": "1.2.0",
+          "state": {
+            "_model_module": "@jupyter-widgets/base",
+            "_model_module_version": "1.2.0",
+            "_model_name": "LayoutModel",
+            "_view_count": null,
+            "_view_module": "@jupyter-widgets/base",
+            "_view_module_version": "1.2.0",
+            "_view_name": "LayoutView",
+            "align_content": null,
+            "align_items": null,
+            "align_self": null,
+            "border": null,
+            "bottom": null,
+            "display": null,
+            "flex": null,
+            "flex_flow": null,
+            "grid_area": null,
+            "grid_auto_columns": null,
+            "grid_auto_flow": null,
+            "grid_auto_rows": null,
+            "grid_column": null,
+            "grid_gap": null,
+            "grid_row": null,
+            "grid_template_areas": null,
+            "grid_template_columns": null,
+            "grid_template_rows": null,
+            "height": null,
+            "justify_content": null,
+            "justify_items": null,
+            "left": null,
+            "margin": null,
+            "max_height": null,
+            "max_width": null,
+            "min_height": null,
+            "min_width": null,
+            "object_fit": null,
+            "object_position": null,
+            "order": null,
+            "overflow": null,
+            "overflow_x": null,
+            "overflow_y": null,
+            "padding": null,
+            "right": null,
+            "top": null,
+            "visibility": null,
+            "width": null
+          }
+        },
+        "a8d7ef0c5f18419983e1c3077deb4154": {
+          "model_module": "@jupyter-widgets/controls",
+          "model_name": "DescriptionStyleModel",
+          "model_module_version": "1.5.0",
+          "state": {
+            "_model_module": "@jupyter-widgets/controls",
+            "_model_module_version": "1.5.0",
+            "_model_name": "DescriptionStyleModel",
+            "_view_count": null,
+            "_view_module": "@jupyter-widgets/base",
+            "_view_module_version": "1.2.0",
+            "_view_name": "StyleView",
+            "description_width": ""
+          }
+        },
+        "04a4242afe6c4fb19aed5282d9110df2": {
+          "model_module": "@jupyter-widgets/base",
+          "model_name": "LayoutModel",
+          "model_module_version": "1.2.0",
+          "state": {
+            "_model_module": "@jupyter-widgets/base",
+            "_model_module_version": "1.2.0",
+            "_model_name": "LayoutModel",
+            "_view_count": null,
+            "_view_module": "@jupyter-widgets/base",
+            "_view_module_version": "1.2.0",
+            "_view_name": "LayoutView",
+            "align_content": null,
+            "align_items": null,
+            "align_self": null,
+            "border": null,
+            "bottom": null,
+            "display": null,
+            "flex": null,
+            "flex_flow": null,
+            "grid_area": null,
+            "grid_auto_columns": null,
+            "grid_auto_flow": null,
+            "grid_auto_rows": null,
+            "grid_column": null,
+            "grid_gap": null,
+            "grid_row": null,
+            "grid_template_areas": null,
+            "grid_template_columns": null,
+            "grid_template_rows": null,
+            "height": null,
+            "justify_content": null,
+            "justify_items": null,
+            "left": null,
+            "margin": null,
+            "max_height": null,
+            "max_width": null,
+            "min_height": null,
+            "min_width": null,
+            "object_fit": null,
+            "object_position": null,
+            "order": null,
+            "overflow": null,
+            "overflow_x": null,
+            "overflow_y": null,
+            "padding": null,
+            "right": null,
+            "top": null,
+            "visibility": null,
+            "width": null
+          }
+        },
+        "27adab0a48c24c3ba388c7ed0cbc8073": {
+          "model_module": "@jupyter-widgets/controls",
+          "model_name": "ProgressStyleModel",
+          "model_module_version": "1.5.0",
+          "state": {
+            "_model_module": "@jupyter-widgets/controls",
+            "_model_module_version": "1.5.0",
+            "_model_name": "ProgressStyleModel",
+            "_view_count": null,
+            "_view_module": "@jupyter-widgets/base",
+            "_view_module_version": "1.2.0",
+            "_view_name": "StyleView",
+            "bar_color": null,
+            "description_width": ""
+          }
+        },
+        "8987b61805774e3fbc660b1ddf477fff": {
+          "model_module": "@jupyter-widgets/base",
+          "model_name": "LayoutModel",
+          "model_module_version": "1.2.0",
+          "state": {
+            "_model_module": "@jupyter-widgets/base",
+            "_model_module_version": "1.2.0",
+            "_model_name": "LayoutModel",
+            "_view_count": null,
+            "_view_module": "@jupyter-widgets/base",
+            "_view_module_version": "1.2.0",
+            "_view_name": "LayoutView",
+            "align_content": null,
+            "align_items": null,
+            "align_self": null,
+            "border": null,
+            "bottom": null,
+            "display": null,
+            "flex": null,
+            "flex_flow": null,
+            "grid_area": null,
+            "grid_auto_columns": null,
+            "grid_auto_flow": null,
+            "grid_auto_rows": null,
+            "grid_column": null,
+            "grid_gap": null,
+            "grid_row": null,
+            "grid_template_areas": null,
+            "grid_template_columns": null,
+            "grid_template_rows": null,
+            "height": null,
+            "justify_content": null,
+            "justify_items": null,
+            "left": null,
+            "margin": null,
+            "max_height": null,
+            "max_width": null,
+            "min_height": null,
+            "min_width": null,
+            "object_fit": null,
+            "object_position": null,
+            "order": null,
+            "overflow": null,
+            "overflow_x": null,
+            "overflow_y": null,
+            "padding": null,
+            "right": null,
+            "top": null,
+            "visibility": null,
+            "width": null
+          }
+        },
+        "9f543c4a97314ebd836f0f8ce3f525cb": {
+          "model_module": "@jupyter-widgets/controls",
+          "model_name": "DescriptionStyleModel",
+          "model_module_version": "1.5.0",
+          "state": {
+            "_model_module": "@jupyter-widgets/controls",
+            "_model_module_version": "1.5.0",
+            "_model_name": "DescriptionStyleModel",
+            "_view_count": null,
+            "_view_module": "@jupyter-widgets/base",
+            "_view_module_version": "1.2.0",
+            "_view_name": "StyleView",
+            "description_width": ""
+          }
+        }
+      }
     }
   },
   "nbformat": 4,
   "nbformat_minor": 5
-}
+}
\ No newline at end of file
diff --git a/docs/vibevoice-realtime-0.5b.md b/docs/vibevoice-realtime-0.5b.md
index dfb2f25..a590819 100644
--- a/docs/vibevoice-realtime-0.5b.md
+++ b/docs/vibevoice-realtime-0.5b.md
@@ -121,11 +121,29 @@ Tip: Just try it on [Colab](https://colab.research.google.com/github/microsoft/V
 python demo/realtime_model_inference_from_file.py --model_path microsoft/VibeVoice-Realtime-0.5B --txt_path demo/text_examples/1p_vibevoice.txt --speaker_name Carter
 ```
 
-### [Optional] More experimental voices 
-Download additional experimental multi-lingual speakers before launching demo or inference from files.
+### Usage 3: List available voices
+Use the voice listing utility to discover and browse the available voice presets:
+
 ```bash
-bash demo/download_experimental_voices.sh
+# List all voices in table format (default)
+python demo/list_voices.py
+
+# List only English voices
+python demo/list_voices.py --lang en
+
+# Show statistics about available voices
+python demo/list_voices.py --stats
+
+# Output as JSON for programmatic use
+python demo/list_voices.py --format json
+
+# Simple list of voice names only
+python demo/list_voices.py --format simple
 ```
+
+For each voice preset, the utility reports the speaker name, language, gender, and file size.
+
+
 ## Risks and limitations
 
 While efforts have been made to optimize it through various techniques, it may still produce outputs that are unexpected, biased, or inaccurate. VibeVoice inherits any biases, errors, or omissions produced by its base model (specifically, Qwen2.5 0.5b in this release).