fix formatting in whisper notebook (#2281)

eaidova · web-flow · commit d0ed4fe83377 · 2024-08-12T11:20:10.000+04:00
diff --git a/notebooks/whisper-subtitles-generation/whisper-subtitles-generation.ipynb b/notebooks/whisper-subtitles-generation/whisper-subtitles-generation.ipynb
@@ -461,9 +461,7 @@
    "source": [
     "inputs, duration = get_audio(output_file)\n",
     "\n",
-    "transcription = pipe(\n",
-    "    inputs, generate_kwargs={\"task\": task.value}, return_timestamps=True\n",
-    ")[\"chunks\"]"
+    "transcription = pipe(inputs, generate_kwargs={\"task\": task.value}, return_timestamps=True)[\"chunks\"]"
    ]
   },
   {
@@ -491,9 +489,7 @@
     "    seconds = milliseconds // 1_000\n",
     "    milliseconds -= seconds * 1_000\n",
     "\n",
-    "    return (\n",
-    "        f\"{hours}:\" if hours > 0 else \"00:\"\n",
-    "    ) + f\"{minutes:02d}:{seconds:02d},{milliseconds:03d}\"\n",
+    "    return (f\"{hours}:\" if hours > 0 else \"00:\") + f\"{minutes:02d}:{seconds:02d},{milliseconds:03d}\"\n",
     "\n",
     "\n",
     "def prepare_srt(transcription, filter_duration=None):\n",
@@ -506,10 +502,7 @@
     "        if segment[\"timestamp\"][1] is None:\n",
     "            segment[\"timestamp\"] = (segment[\"timestamp\"][0], filter_duration)\n",
     "\n",
-    "        if filter_duration is not None and (\n",
-    "            segment[\"timestamp\"][0] >= math.floor(filter_duration)\n",
-    "            or segment[\"timestamp\"][1] > math.ceil(filter_duration) + 1\n",
-    "        ):\n",
+    "        if filter_duration is not None and (segment[\"timestamp\"][0] >= math.floor(filter_duration) or segment[\"timestamp\"][1] > math.ceil(filter_duration) + 1):\n",
     "            break\n",
     "        segment_lines.append(str(idx + 1) + \"\\n\")\n",
     "        time_start = format_timestamp(segment[\"timestamp\"][0])\n",
@@ -1257,9 +1250,7 @@
     "        feature_extractor=processor.feature_extractor,\n",
     "    )\n",
     "    inputs, duration = get_audio(output_file)\n",
-    "    transcription = int8_pipe(\n",
-    "        inputs, generate_kwargs={\"task\": task.value}, return_timestamps=True\n",
-    "    )[\"chunks\"]\n",
+    "    transcription = int8_pipe(inputs, generate_kwargs={\"task\": task.value}, return_timestamps=True)[\"chunks\"]\n",
     "    srt_lines = prepare_srt(transcription, filter_duration=duration)\n",
     "    print(\"\".join(srt_lines))\n",
     "    widgets.Video.from_file(output_file, loop=False, width=800, height=800)"
@@ -1429,9 +1420,7 @@
     "        ydl.download(link.value)\n",
     "    inputs, duration = get_audio(output_file)\n",
     "    m_pipe = int8_pipe if use_int8 else pipe\n",
-    "    transcription = m_pipe(\n",
-    "        inputs, generate_kwargs={\"task\": task.lower()}, return_timestamps=True\n",
-    "    )[\"chunks\"]\n",
+    "    transcription = m_pipe(inputs, generate_kwargs={\"task\": task.lower()}, return_timestamps=True)[\"chunks\"]\n",
     "    srt_lines = prepare_srt(transcription, duration)\n",
     "    with output_file.with_suffix(\".srt\").open(\"w\") as f:\n",
     "        f.writelines(srt_lines)\n",