R-Kentaren
/

haha

Model card Files Files and versions

xet

Community

R-Kentaren committed on 16 days ago

Commit

8ec5670

verified ·

1 Parent(s): 55acefc

Delete colab.ipynb

Browse files

Files changed (1) hide show

colab.ipynb +0 -147

colab.ipynb DELETED Viewed

@@ -1,147 +0,0 @@
-{
-  "cells": [
-    {
-      "cell_type": "markdown",
-      "metadata": {},
-      "source": [
-        "# Audio to Animalese Language Conversion (Colab)\n",
-        "\n",
-        "This Colab notebook lets you convert any audio file (spoken English, for example) into Animalese — the iconic gibberish speech from Animal Crossing games!\n",
-        "\n",
-        "## Features\n",
-        "- Upload any audio file (wav/mp3/m4a, etc.)\n",
-        "- Transcribe to text (using `openai-whisper`)\n",
-        "- Convert text to Animalese audio (one short synthesized beep per rough syllable, with varying pitch, then sped up)\n",
-        "- Download the final Animalese audio\n",
-        "\n",
-        "---"
-      ]
-    },
-    {
-      "cell_type": "code",
-      "metadata": {},
-      "source": [
-        "#@title 1. Install dependencies\n",
-        "!pip install gTTS pydub librosa soundfile openai-whisper --quiet\n",
-        "!apt-get install -y ffmpeg\n",
-        "\n",
-        "import os\n",
-        "from gtts import gTTS\n",
-        "from pydub import AudioSegment\n",
-        "import librosa\n",
-        "import soundfile as sf\n",
-        "import tempfile\n",
-        "import torch\n",
-        "import whisper"
-      ],
-      "execution_count": null,
-      "outputs": []
-    },
-    {
-      "cell_type": "code",
-      "metadata": {},
-      "source": [
-        "#@title 2. Upload your audio file\n",
-        "from google.colab import files\n",
-        "\n",
-        "# Opens Colab's upload dialog; the keys of the result are the uploaded filenames.\n",
-        "uploaded = files.upload()\n",
-        "if not uploaded:\n",
-        "    # An empty result (e.g. the dialog was cancelled) would otherwise surface\n",
-        "    # as a bare IndexError on the lookup below.\n",
-        "    raise RuntimeError('No file was uploaded. Re-run this cell and choose an audio file.')\n",
-        "\n",
-        "# Only the first uploaded file is used by the following cells.\n",
-        "input_audio_path = next(iter(uploaded))\n",
-        "print('Audio uploaded:', input_audio_path)"
-      ],
-      "execution_count": null,
-      "outputs": []
-    },
-    {
-      "cell_type": "code",
-      "metadata": {},
-      "source": [
-        "#@title 3. Transcribe audio to text (English)\n",
-        "model = whisper.load_model('base')\n",
-        "result = model.transcribe(input_audio_path)\n",
-        "transcription = result['text']\n",
-        "print('Transcription:', transcription)"
-      ],
-      "execution_count": null,
-      "outputs": []
-    },
-    {
-      "cell_type": "markdown",
-      "metadata": {},
-      "source": [
-        "## Animalese Synthesizer Function\n",
-        "This function splits text into rough syllable-like chunks and generates a short beep for each one, cycling through a few pitches, to mimic Animalese."
-      ]
-    },
-    {
-      "cell_type": "code",
-      "metadata": {},
-      "source": [
-        "#@title 4. Animalese Synthesizer\n",
-        "import numpy as np\n",
-        "\n",
-        "def text_to_animalese(text, out_path='animalese.wav', base_pitch=220, speed=1.3):\n",
-        "    \"\"\"Render text as a string of short beeps and save it as a WAV file.\n",
-        "\n",
-        "    The text is lower-cased and cut into rough chunks (runs of vowels and runs\n",
-        "    of other word characters). Each chunk becomes one 80 ms sine beep whose\n",
-        "    pitch cycles through five steps of 40 Hz starting at base_pitch. The beeps\n",
-        "    are joined, time-stretched by speed and written to out_path at 22050 Hz.\n",
-        "\n",
-        "    Args:\n",
-        "        text: Text to voice; only word characters produce sound.\n",
-        "        out_path: Destination path of the audio file.\n",
-        "        base_pitch: Frequency in Hz of the lowest beep.\n",
-        "        speed: Time-stretch rate; values above 1 shorten the audio.\n",
-        "\n",
-        "    Raises:\n",
-        "        ValueError: If text contains no word characters, so there is nothing\n",
-        "            to synthesize.\n",
-        "    \"\"\"\n",
-        "    import re\n",
-        "\n",
-        "    sr = 22050  # one sample rate for both synthesis and the written file\n",
-        "\n",
-        "    # Generate a single \"beep\" (vowel-like tone) as 16-bit samples\n",
-        "    def beep(pitch=220, dur_ms=80):\n",
-        "        t = np.linspace(0, dur_ms/1000, int(sr * dur_ms/1000), False)\n",
-        "        tone = np.sin(pitch*2*np.pi*t)\n",
-        "        tone *= np.hanning(len(t))  # fade in/out to avoid clicks between beeps\n",
-        "        return np.int16(tone * 32767)\n",
-        "\n",
-        "    # Split text into syllable-like chunks (very rough, English only).\n",
-        "    # The pattern only matches word characters, so no chunk is ever blank.\n",
-        "    syllables = re.findall(r'[aeiouy]+|[^aeiouy\\W]+', text.lower())\n",
-        "    if not syllables:\n",
-        "        # Stretching an empty signal fails inside librosa with an opaque error.\n",
-        "        raise ValueError('text contains no characters to convert to Animalese')\n",
-        "\n",
-        "    # One beep per chunk; the pitch steps up by 40 Hz and wraps every 5 chunks.\n",
-        "    beeps = [beep(pitch=base_pitch + 40 * (i % 5)) for i in range(len(syllables))]\n",
-        "    audio = np.concatenate(beeps)  # single concatenation instead of one per chunk\n",
-        "\n",
-        "    # Speed up. rate must be passed by keyword: it is keyword-only in\n",
-        "    # librosa >= 0.10, and the keyword form also works on older releases.\n",
-        "    audio_fast = librosa.effects.time_stretch(audio.astype(np.float32)/32768.0, rate=speed)\n",
-        "    sf.write(out_path, audio_fast, sr)\n",
-        "    print(f'Animalese audio saved to {out_path}')\n",
-        "\n",
-        "animalese_out = 'animalese.wav'\n",
-        "text_to_animalese(transcription, animalese_out)"
-      ],
-      "execution_count": null,
-      "outputs": []
-    },
-    {
-      "cell_type": "code",
-      "metadata": {},
-      "source": [
-        "#@title 5. Listen and Download Animalese Audio\n",
-        "import IPython.display as ipd\n",
-        "ipd.display(ipd.Audio(animalese_out))\n",
-        "files.download(animalese_out)"
-      ],
-      "execution_count": null,
-      "outputs": []
-    }
-  ],
-  "metadata": {
-    "colab": {
-      "collapsed_sections": [],
-      "name": "Audio to Animalese Colab"
-    },
-    "kernelspec": {
-      "display_name": "Python 3",
-      "language": "python",
-      "name": "python3"
-    },
-    "language_info": {
-      "name": "python"
-    }
-  },
-  "nbformat": 4,
-  "nbformat_minor": 0
-}