moises-ai
diff --git a/maestro_worker_python/convert_files.py b/maestro_worker_python/convert_files.py
Lines changed: 75 additions & 16 deletions
diff --git a/tests/silent with space.ogg b/tests/silent with space.ogg
4.02 KB
diff --git a/tests/silent with space.wav b/tests/silent with space.wav
174 KB
diff --git a/tests/test_convert_files.py b/tests/test_convert_files.py
Lines changed: 119 additions & 36 deletions
@@ -1,14 +1,14 @@
 from __future__ import annotations
 
-import tempfile
+import concurrent.futures
 import logging
 import subprocess
-import concurrent.futures
-
+import tempfile
+from contextlib import contextmanager
 from dataclasses import dataclass
 from typing import List
+
 from .response import ValidationError
-from contextlib import contextmanager
 
 logger = logging.getLogger(__name__)
 
@@ -32,11 +32,17 @@ def convert_files(convert_files: List[FileToConvert]):
     futures = []
     with concurrent.futures.ThreadPoolExecutor() as executor:
         for convert_file in convert_files:
-            target_function = _convert_to_m4a if convert_file.file_format == "m4a" else _convert_to_wav
+            target_function = (
+                _convert_to_m4a
+                if convert_file.file_format == "m4a"
+                else _convert_to_wav
+            )
             futures.append(
                 executor.submit(
-                    target_function, convert_file.input_file_path, convert_file.output_file_path,
-                    convert_file.max_duration
+                    target_function,
+                    convert_file.input_file_path,
+                    convert_file.output_file_path,
+                    convert_file.max_duration,
                 )
             )
 
@@ -55,10 +61,17 @@ def convert_files_manager(*convert_files: FileToConvert) -> None | str | list[st
             for convert_file in convert_files:
                 file_format = ".m4a" if convert_file.file_format == "m4a" else ".wav"
                 filename = tempfile.NamedTemporaryFile(suffix=file_format)
-                target_function = _convert_to_m4a if convert_file.file_format == "m4a" else _convert_to_wav
+                target_function = (
+                    _convert_to_m4a
+                    if convert_file.file_format == "m4a"
+                    else _convert_to_wav
+                )
                 thread_list.append(
                     executor.submit(
-                        target_function, convert_file.input_file_path, filename.name, convert_file.max_duration
+                        target_function,
+                        convert_file.input_file_path,
+                        filename.name,
+                        convert_file.max_duration,
                     )
                 )
                 list_objects.append(filename)
@@ -77,27 +90,68 @@ def convert_files_manager(*convert_files: FileToConvert) -> None | str | list[st
 
 
 def _convert_to_wav(input_file_path, output_file_path, max_duration):
-    _run_subprocess(f"ffmpeg -y -hide_banner -loglevel error -t {max_duration} -i {input_file_path} -ar 44100 {output_file_path}")
+    """Run ffmpeg to write ``input_file_path`` to ``output_file_path`` at 44100 Hz.
+
+    ``-t max_duration`` is placed before ``-i``, i.e. as an input option.
+    The command is built as an argument list (one element per ffmpeg
+    argument) and handed to ``_run_subprocess``; paths are stringified so
+    ``pathlib.Path`` values are accepted.
+    """
+    global_flags = ["-y", "-hide_banner", "-loglevel", "error"]
+    input_flags = ["-t", str(max_duration), "-i", str(input_file_path)]
+    output_flags = ["-ar", "44100", str(output_file_path)]
+    _run_subprocess(["ffmpeg", *global_flags, *input_flags, *output_flags])
 
 
 def _convert_to_m4a(input_file_path, output_file_path, max_duration):
-    _run_subprocess(f"ffmpeg -y -hide_banner -loglevel error -t {max_duration} -i {input_file_path} -c:a aac -b:a 192k -ar 44100 -movflags +faststart {output_file_path}")
+    """Run ffmpeg to encode ``input_file_path`` as AAC into ``output_file_path``.
+
+    Audio is encoded with ``-c:a aac -b:a 192k -ar 44100`` and the output is
+    written with ``-movflags +faststart``. ``-t max_duration`` is placed
+    before ``-i``, i.e. as an input option. The command is built as an
+    argument list (one element per ffmpeg argument) and handed to
+    ``_run_subprocess``.
+    """
+    global_flags = ["-y", "-hide_banner", "-loglevel", "error"]
+    input_flags = ["-t", str(max_duration), "-i", str(input_file_path)]
+    audio_flags = ["-c:a", "aac", "-b:a", "192k", "-ar", "44100"]
+    output_flags = ["-movflags", "+faststart", str(output_file_path)]
+    _run_subprocess(
+        ["ffmpeg", *global_flags, *input_flags, *audio_flags, *output_flags]
+    )
 
 
 def _run_subprocess(command):
     try:
-        process = subprocess.run(command, shell=True, capture_output=True, check=True)
+        process = subprocess.run(command, shell=False, capture_output=True, check=True)
     except subprocess.CalledProcessError as exc:
         invalid_file_errors = [
             "Invalid data found when processing input",
             "Output file #0 does not contain any stream",
             "Output file does not contain any stream",
-            "Invalid argument"
+            "Invalid argument",
         ]
         if any(error in exc.stderr.decode() for error in invalid_file_errors):
             logger.warning(
-               "Could not convert because the file is invalid",
-                extra={"props": {"stderr": exc.stderr.decode(), "stdout": exc.stdout.decode()}}
+                "Could not convert because the file is invalid",
+                extra={
+                    "props": {
+                        "stderr": exc.stderr.decode(),
+                        "stdout": exc.stdout.decode(),
+                    }
+                },
             )
             raise ValidationError(
                 f"Could not convert because the file is invalid, ffmpeg stderr: {exc.stderr.decode()}"
@@ -110,6 +164,11 @@ def _run_subprocess(command):
         if process.stderr:
             logger.warning(
                 "Non-falal error during conversion",
-                extra={"props": {"stderr": process.stderr.decode(), "stdout": process.stdout.decode()}}
+                extra={
+                    "props": {
+                        "stderr": process.stderr.decode(),
+                        "stdout": process.stdout.decode(),
+                    }
+                },
             )
         logger.info(f"Conversion output: {process.stdout.decode()}")
@@ -1,11 +1,17 @@
-import os
-import pytest
 import hashlib
+import os
 import subprocess
 from pathlib import Path
-from maestro_worker_python.convert_files import convert_files_manager, convert_files, FileToConvert, FileConversionError
-from maestro_worker_python.response import ValidationError
 
+import pytest
+
+from maestro_worker_python.convert_files import (
+    FileConversionError,
+    FileToConvert,
+    convert_files,
+    convert_files_manager,
+)
+from maestro_worker_python.response import ValidationError
 
 TEST_PATH = Path(__file__).resolve().parent
 
@@ -28,72 +34,126 @@ def corrupt_audio_file(tmp_path_factory):
 def test_should_re_raise_exceptions_in_thread(invalid_audio_file, file_format):
-    with pytest.raises(FileConversionError) as exc:
-        convert_files(
-            [FileToConvert(
-                input_file_path=TEST_PATH / "foobar.mp3",
-                output_file_path=f"{invalid_audio_file}.wav",
-                file_format=file_format,
-            )]
-        )
+    """A failure inside a conversion worker must reach the caller.
+
+    ``convert_files`` is expected to raise ``FileConversionError`` for this
+    input.
+    """
+    # NOTE(review): "foobar.mp3" is presumably absent from the tests
+    # directory, which is what makes ffmpeg fail here - confirm.
+    missing_input = FileToConvert(
+        input_file_path=TEST_PATH / "foobar.mp3",
+        output_file_path=f"{invalid_audio_file}.wav",
+        file_format=file_format,
+    )
+    # Only the call expected to raise sits inside the raises block, and the
+    # exception info is not bound because nothing inspects it.
+    with pytest.raises(FileConversionError):
+        convert_files([missing_input])
 
 
 @pytest.mark.parametrize("file_format", ["m4a", "wav"])
-def test_should_raise_validation_error_if_audio_file_is_invalid(invalid_audio_file, file_format):
-    with pytest.raises(ValidationError) as exc:
-        convert_files(
-            [FileToConvert(
-                input_file_path=invalid_audio_file,
-                output_file_path=f"{invalid_audio_file}.wav",
-                file_format=file_format,
-            )]
-        )
-
-    assert "Invalid data" in str(exc.value)
+def test_should_raise_validation_error_if_audio_file_is_invalid(
+    invalid_audio_file, file_format
+):
+    """Converting the ``invalid_audio_file`` fixture raises ``ValidationError``.
+
+    The error text must contain "Invalid data" for both target formats.
+    """
+    bad_input = FileToConvert(
+        input_file_path=invalid_audio_file,
+        output_file_path=f"{invalid_audio_file}.wav",
+        file_format=file_format,
+    )
+
+    with pytest.raises(ValidationError) as raised:
+        convert_files([bad_input])
+
+    assert "Invalid data" in str(raised.value)
 
 
 @pytest.mark.parametrize("file_format", ["m4a", "wav"])
-def test_should_raise_validation_error_if_audio_file_is_corrupt(corrupt_audio_file, file_format):
-    with pytest.raises(ValidationError) as exc:
-        convert_files(
-            [FileToConvert(
-                input_file_path=corrupt_audio_file,
-                output_file_path=f"{corrupt_audio_file}.wav",
-                file_format=file_format
-            )]
-        )
-
-    assert "Invalid argument" in str(exc.value)
+def test_should_raise_validation_error_if_audio_file_is_corrupt(
+    corrupt_audio_file, file_format
+):
+    """Converting the ``corrupt_audio_file`` fixture raises ``ValidationError``.
+
+    The error text must contain "Invalid argument" for both target formats.
+    """
+    corrupt_input = FileToConvert(
+        input_file_path=corrupt_audio_file,
+        output_file_path=f"{corrupt_audio_file}.wav",
+        file_format=file_format,
+    )
+
+    with pytest.raises(ValidationError) as raised:
+        convert_files([corrupt_input])
+
+    assert "Invalid argument" in str(raised.value)
 
 
 @pytest.mark.parametrize("file_format", ["m4a", "wav"])
 def test_should_raise_validation_error_if_source_has_no_audio(file_format, caplog):
-    input_file_path, output_file_path = TEST_PATH / "video-no-audio.mp4", TEST_PATH / "output.wav"
-    with pytest.raises(ValidationError) as exc:
-        convert_files(
-            [FileToConvert(
-                input_file_path=input_file_path,
-                output_file_path=output_file_path,
-                file_format=file_format,
-            )]
-        )
-
-    assert "does not contain any strea" in str(exc.value)
+    """Converting "video-no-audio.mp4" raises ``ValidationError``.
+
+    The asserted substring is contained in both "does not contain any
+    stream" messages that ``_run_subprocess`` treats as invalid-file errors.
+    """
+    video_only_input = FileToConvert(
+        input_file_path=TEST_PATH / "video-no-audio.mp4",
+        output_file_path=TEST_PATH / "output.wav",
+        file_format=file_format,
+    )
+
+    with pytest.raises(ValidationError) as raised:
+        convert_files([video_only_input])
+
+    assert "does not contain any strea" in str(raised.value)
 
 
-def test_should_convert_valid_audio_file():
-    input_file_path, output_file_path = TEST_PATH / "silent.ogg", TEST_PATH / "silent.wav"
-    convert_files(
-        [FileToConvert(
-            input_file_path=input_file_path,
-            output_file_path=output_file_path,
-            file_format="wav",
-        )]
-    )
-    assert _get_hash(input_file_path) == _get_hash(output_file_path)
-    Path(output_file_path).unlink(missing_ok=True)
+@pytest.mark.parametrize(
+    "input_name, output_name, file_format",
+    [
+        ("silent.ogg", "converted.wav", "wav"),
+        ("silent with space.ogg", "converted.wav", "wav"),
+    ],
+)
+def test_should_convert_valid_wav_audio_file(
+    tmp_path, input_name, output_name, file_format
+):
+    """Convert a valid input to WAV and compare ffmpeg hashes of both files.
+
+    The second case uses an input whose file name contains a space.
+    """
+    input_file_path = TEST_PATH / input_name
+    # Write into pytest's per-test temporary directory: nothing is left in
+    # the tests directory when an assertion fails, and the parametrized
+    # cases no longer share one output path.
+    output_file_path = tmp_path / output_name
+    convert_files(
+        [
+            FileToConvert(
+                input_file_path=input_file_path,
+                output_file_path=output_file_path,
+                file_format=file_format,
+            )
+        ]
+    )
+    assert _get_hash(input_file_path) == _get_hash(output_file_path)
 
 
+@pytest.mark.parametrize(
+    "input_name, output_name, file_format",
+    [
+        ("silent.ogg", "converted.m4a", "m4a"),
+        ("silent with space.wav", "converted.m4a", "m4a"),
+    ],
+)
+def test_should_convert_valid_m4a_audio_file(
+    tmp_path, input_name, output_name, file_format
+):
+    """Convert a valid input to M4A and check that a non-empty file is written.
+
+    The second case uses an input whose file name contains a space.
+    """
+    input_file_path = TEST_PATH / input_name
+    # Write into pytest's per-test temporary directory so no manual cleanup
+    # is needed and the parametrized cases do not share one output path.
+    output_file_path = tmp_path / output_name
+    convert_files(
+        [
+            FileToConvert(
+                input_file_path=input_file_path,
+                output_file_path=output_file_path,
+                file_format=file_format,
+            )
+        ]
+    )
+    # Without this the test would only prove that convert_files did not raise.
+    assert output_file_path.stat().st_size > 0
+
+
 def test_should_convert_multiple_valid_audio_files_and_delete_after_context():
-    input_file_path, output_file_path = TEST_PATH / "silent.ogg", TEST_PATH / "silent.wav"
+    input_file_path, output_file_path = (
+        TEST_PATH / "silent.ogg",
+        TEST_PATH / "silent.wav",
+    )
     converted_files_list = []
     with convert_files_manager(
         FileToConvert(
@@ -115,6 +175,29 @@ def test_should_convert_multiple_valid_audio_files_and_delete_after_context():
 def _get_hash(file_name):
+    """Return the digest ffmpeg's ``hash`` output format prints for ``file_name``.
+
+    ffmpeg is invoked with an argument list and ``shell=False``, so a file
+    name containing spaces is passed as a single argument.
+
+    Raises:
+        subprocess.CalledProcessError: if ffmpeg exits with a non-zero status.
+    """
     process = subprocess.run(
-        f"ffmpeg -loglevel error -i {file_name} -map 0 -f hash -",
-        shell=True, capture_output=True, check=True,
+        [
+            "ffmpeg",
+            "-loglevel",
+            "error",
+            "-i",
+            str(file_name),
+            "-map",
+            "0",
+            "-f",
+            "hash",
+            "-",
+        ],
+        shell=False,
+        capture_output=True,
+        check=True,
     )
+    # stdout is split on "="; the part after the first "=" is the digest.
     return process.stdout.split(b"=")[1].strip()