{ "cells": [ { "cell_type": "code", "execution_count": 1, "id": "9d8dbc75-dacc-457f-890c-c3d70f1e24ff", "metadata": { "tags": [] }, "outputs": [], "source": [ "import os\n", "from pathlib import Path\n", "\n", "from lhotse import CutSet\n", "from lhotse.cut import Cut, MonoCut\n", "from lhotse.recipes import (\n", " download_voxceleb1,\n", " download_voxceleb2,\n", " hifitts,\n", " libritts,\n", " prepare_voxceleb,\n", ")\n", "from lhotse.dataset import (\n", " SimpleCutSampler,\n", " UnsupervisedDataset\n", ")\n", "import pandas as pd" ] }, { "cell_type": "code", "execution_count": 2, "id": "181a454e-1e74-40fd-8d5b-765b65bf6111", "metadata": { "tags": [] }, "outputs": [], "source": [ "# Dataset root path\n", "root_dir = Path(\"datasets_cache\")\n", "\n", "# datasets paths\n", "hifitts_path = root_dir / \"hifitts\"\n", "libritts_path = root_dir / \"libritts\"\n", "librittsr_path = root_dir / \"librittsr\"\n", "\n", "num_jobs = os.cpu_count() - 3" ] }, { "cell_type": "code", "execution_count": 3, "id": "7e6c3a68-b4e9-46ea-89b2-4aeed61f4a64", "metadata": { "tags": [] }, "outputs": [ { "name": "stderr", "output_type": "stream", "text": [ "Downloading LibriTTS parts: 0%| | 0/1 [00:00