freelawproject · mlissner · Jun 27, 2024 · Jun 26, 2024 · Jun 26, 2024 · Jun 26, 2024
diff --git a/doctor/forms.py b/doctor/forms.py
@@ -44,7 +44,7 @@ class AudioForm(BaseAudioFile):
     audio_data = forms.JSONField(label="audio-data", required=False)
 
     def clean(self):
-        self.cleaned_data["fp"] = f"/tmp/audio_{uuid.uuid4().hex}.mp3"
+        self.cleaned_data["fp"] = f"/tmp/audio_{uuid.uuid4().hex}"
         if self.cleaned_data.get("file", None):
             filename = self.cleaned_data["file"].name
             self.cleaned_data["extension"] = filename.split(".")[-1]

diff --git a/doctor/tasks.py b/doctor/tasks.py
@@ -479,6 +479,47 @@ def convert_to_mp3(output_path: AnyStr, media: Any) -> None:
     return output_path
 
 
+def convert_to_ogg(output_path: AnyStr, media: Any) -> AnyStr:
+    """Convert audio data to an Ogg container with Opus-encoded audio (.ogg)
+
+    This function pipes the contents of `media` to ffmpeg over stdin and
+    writes the result to `output_path` with the following specifications:
+
+    * Single audio channel (`-ac 1`)
+    * 8 kbit/s audio bitrate (`-b:a 8k`)
+    * Optimized for voice over IP applications (`-application voip`)
+
+    :param output_path: Filepath that ffmpeg writes the converted audio to
+    :param media: File-like object whose `read()` returns the source audio
+    :return: The `output_path` it was given
+    """
+    av_command = [
+        "ffmpeg",
+        "-i",
+        "/dev/stdin",
+        "-vn",
+        "-map_metadata",
+        "-1",
+        "-ac",
+        "1",
+        "-c:a",
+        "libopus",
+        "-b:a",
+        "8k",
+        "-application",
+        "voip",
+        "-f",
+        "ogg",
+        output_path,
+    ]
+
+    ffmpeg_cmd = subprocess.Popen(
+        av_command, stdin=subprocess.PIPE, stdout=subprocess.PIPE, shell=False
+    )
+    ffmpeg_cmd.communicate(media.read())
+    return output_path
+
+
 def set_mp3_meta_data(
     audio_data: Dict, mp3_path: AnyStr
 ) -> eyed3.core.AudioFile:

diff --git a/doctor/urls.py b/doctor/urls.py
@@ -1,4 +1,4 @@
-from django.urls import path
+from django.urls import path, re_path
 
 from . import views
 
@@ -23,7 +23,12 @@
         views.make_png_thumbnails_from_range,
         name="thumbnails",
     ),
-    path("convert/audio/mp3/", views.convert_audio, name="convert-audio"),
+    # Anchored with ^...$ so only this exact path matches, not a substring.
+    re_path(
+        r"^convert/audio/(?P<output_format>mp3|ogg)/$",
+        views.convert_audio,
+        name="convert-audio",
+    ),
     path("utils/page-count/pdf/", views.page_count, name="page_count"),
     path("utils/mime-type/", views.extract_mime_type, name="mime_type"),
     path(

diff --git a/doctor/views.py b/doctor/views.py
@@ -34,6 +34,7 @@
 from doctor.tasks import (
     convert_tiff_to_pdf_bytes,
     convert_to_mp3,
+    convert_to_ogg,
     download_images,
     extract_from_doc,
     extract_from_docx,
@@ -367,8 +368,11 @@ def fetch_audio_duration(request) -> HttpResponse:
         return HttpResponse(str(e))
 
 
-def convert_audio(request) -> Union[FileResponse, HttpResponse]:
-    """Convert audio file to MP3 and update metadata on mp3.
+def convert_audio(
+    request, output_format: str
+) -> Union[FileResponse, HttpResponse]:
+    """Converts an uploaded audio file to the specified output format and,
+    for mp3 output only, sets its metadata from the query parameters.
 
     :return: Converted audio
     """
@@ -378,8 +382,14 @@ def convert_audio(request) -> Union[FileResponse, HttpResponse]:
     filepath = form.cleaned_data["fp"]
     media_file = form.cleaned_data["file"]
     audio_data = {k: v[0] for k, v in dict(request.GET).items()}
-    convert_to_mp3(filepath, media_file)
-    set_mp3_meta_data(audio_data, filepath)
+    match output_format:
+        case "mp3":
+            convert_to_mp3(filepath, media_file)
+            set_mp3_meta_data(audio_data, filepath)
+        case "ogg":  # converted only; no metadata is written for ogg
+            convert_to_ogg(filepath, media_file)
+        case _:  # defensive: the URL pattern only admits mp3 and ogg
+            raise NotImplementedError(f"Unsupported format: {output_format}")
     response = FileResponse(open(filepath, "rb"))
     cleanup_form(form)
     return response