[sound] Plugin refactor.

- Added `input_format`/`output_format` options to both input and output audio streams. - Replaced the previous (confusing) occurrences of `ffmpeg_format` and `format`. - Added custom `dtype` option for `sound.play`. - Added `join` flag (default: false) to `sound.play` to wait for the playback to finish.
2023-10-31 01:41:13 +01:00 · 2023-10-31 01:41:13 +01:00 · f960ec4bf4
commit f960ec4bf4
parent d5514d7f27
8 changed files with 115 additions and 58 deletions
--- a/platypush/plugins/sound/init.py
+++ b/platypush/plugins/sound/init.py
@ -86,8 +86,11 @@ class SoundPlugin(RunnablePlugin):
        sample_rate: Optional[int] = None,
        channels: int = 2,
        volume: float = 100,
        dtype: Optional[str] = None,
        format: Optional[str] = None,  # pylint: disable=redefined-builtin
        stream_name: Optional[str] = None,
        stream_index: Optional[int] = None,
        join: bool = False,
    ):
        """
        Plays an audio file/URL (any audio format supported by ffmpeg works) or
@ -159,6 +162,12 @@ class SoundPlugin(RunnablePlugin):
        :param channels: Number of audio channels. Default: number of channels
            in the audio file in file mode, 1 if in synth mode
        :param volume: Playback volume, between 0 and 100. Default: 100.
        :param dtype: Data type for the audio samples, if playing raw PCM audio
            frames. Supported types: 'float64', 'float32', 'int32', 'int16',
            'int8', 'uint8'.
        :param format: Output audio format, if you want to convert the audio to
            another format before playing it. The list of available formats can
            be retrieved through the ``ffmpeg -formats`` command. Default: None
        :param stream_index: If specified, play to an already active stream
            index (you can get them through :meth:`.query_streams`). Default:
            creates a new audio stream through PortAudio.
@ -167,6 +176,8 @@ class SoundPlugin(RunnablePlugin):
            name will be created. If not set, and ``stream_index`` is not set
            either, then a new stream will be created on the next available
            index and named ``platypush-stream-<index>``.
        :param join: If True, then the method will block until the playback is
            completed. Default: False.
        """
        dev = self._manager.get_device(device=device, type=StreamType.OUTPUT)
@ -193,7 +204,13 @@ class SoundPlugin(RunnablePlugin):
            stream_index,
        )
-        self._manager.create_player(
+        player_kwargs = {}
        if dtype:
            player_kwargs['dtype'] = dtype
        if format:
            player_kwargs['format'] = format
        player = self._manager.create_player(
            device=dev.index,
            infile=resource,
            sound=sound,
@ -203,7 +220,12 @@ class SoundPlugin(RunnablePlugin):
            channels=channels,
            volume=volume,
            stream_name=stream_name,
-        ).start()
+            **player_kwargs,
        )
        player.start()
        if join:
            player.join()
    @action
    def stream_recording(self, *args, **kwargs):
@ -255,7 +277,7 @@ class SoundPlugin(RunnablePlugin):
        :param sample_rate: Recording sample rate (default: device default rate)
        :param dtype: Data type for the audio samples. Supported types:
            'float64', 'float32', 'int32', 'int16', 'int8', 'uint8'. Default:
-            float32
+            int16.
        :param blocksize: Audio block size (default: configured
            `input_blocksize` or 2048)
        :param play_audio: If True, then the recorded audio will be played in
--- a/platypush/plugins/sound/_converters/_base.py
+++ b/platypush/plugins/sound/_converters/_base.py
@ -7,8 +7,9 @@ from threading import Event, RLock, Thread
 from typing import Any, Callable, Coroutine, Iterable, Optional
 from platypush.context import get_or_create_event_loop
 from platypush.utils import is_debug_enabled
-_dtype_to_ffmpeg_format = {
+dtype_to_ffmpeg_format = {
    'int8': 's8',
    'uint8': 'u8',
    'int16': 's16le',
@ -46,7 +47,8 @@ class AudioConverter(Thread, ABC):
        volume: float,
        dtype: str,
        chunk_size: int,
-        format: Optional[str] = None,  # pylint: disable=redefined-builtin
+        input_format: Optional[str] = None,  # pylint: disable=redefined-builtin
        output_format: Optional[str] = None,  # pylint: disable=redefined-builtin
        on_exit: Optional[Callable[[], Any]] = None,
        **kwargs,
    ):
@ -58,24 +60,20 @@ class AudioConverter(Thread, ABC):
        :param dtype: The (numpy) data type of the raw input/output audio.
        :param chunk_size: Number of bytes that will be read at once from the
            ffmpeg process.
-        :param format: Input/output audio format.
+        :param input_format: Input audio format.
        :param output_format: Output audio format.
        :param on_exit: Function to call when the ffmpeg process exits.
        """
        super().__init__(*args, **kwargs)
        ffmpeg_format = _dtype_to_ffmpeg_format.get(dtype)
        assert ffmpeg_format, (
            f'Unsupported data type: {dtype}. Supported data types: '
            f'{list(_dtype_to_ffmpeg_format.keys())}'
        )
        self._ffmpeg_bin = ffmpeg_bin
        self._ffmpeg_format = ffmpeg_format
        self._ffmpeg_task: Optional[Coroutine] = None
        self._sample_rate = sample_rate
        self._channels = channels
        self._chunk_size = chunk_size
-        self._format = format
+        self._input_format = input_format
        self._output_format = output_format
        self._dtype = dtype
        self._closed = False
        self._out_queue = Queue()
        self.ffmpeg = None
@ -120,7 +118,8 @@ class AudioConverter(Thread, ABC):
        """
        Set of arguments common to all ffmpeg converter instances.
        """
-        return ('-hide_banner', '-loglevel', 'warning', '-y')
+        log_level = 'debug' if is_debug_enabled() else 'warning'
        return ('-hide_banner', '-loglevel', log_level, '-y')
    @property
    @abstractmethod
@ -150,20 +149,6 @@ class AudioConverter(Thread, ABC):
            return args + ('-channel_layout', 'stereo')
        return args
    @property
    def _raw_ffmpeg_args(self) -> Iterable[str]:
        """
        Ffmpeg arguments for raw audio input/output given the current
        configuration.
        """
        return (
            '-f',
            self._ffmpeg_format,
            '-ar',
            str(self._sample_rate),
            *self._channel_layout_args,
        )
    @property
    def _audio_volume_args(self) -> Iterable[str]:
        """
@ -197,23 +182,6 @@ class AudioConverter(Thread, ABC):
        """
        return PIPE
    @property
    def _compressed_ffmpeg_args(self) -> Iterable[str]:
        """
        Ffmpeg arguments for the compressed audio given the current
        configuration.
        """
        if not self._format:
            return ()
        ffmpeg_args = self._format_to_ffmpeg_args.get(self._format)
        assert ffmpeg_args, (
            f'Unsupported output format: {self._format}. Supported formats: '
            f'{list(self._format_to_ffmpeg_args.keys())}'
        )
        return ffmpeg_args
    async def _audio_proxy(self, timeout: Optional[float] = None):
        """
        Proxy the converted audio stream to the output queue for downstream
@ -236,11 +204,6 @@ class AudioConverter(Thread, ABC):
        self.logger.info('Running ffmpeg: %s', ' '.join(ffmpeg_args))
        try:
            await asyncio.wait_for(self.ffmpeg.wait(), 0.1)
        except asyncio.TimeoutError:
            pass
        while (
            self._loop
            and self.ffmpeg
@ -298,6 +261,9 @@ class AudioConverter(Thread, ABC):
            self._loop.run_until_complete(self._ffmpeg_task)
        except RuntimeError as e:
            self.logger.warning(e)
        except Exception as e:
            self.logger.warning('Audio converter error: %s', e)
            self.logger.exception(e)
        finally:
            self.stop()
--- a/platypush/plugins/sound/_converters/_from_raw.py
+++ b/platypush/plugins/sound/_converters/_from_raw.py
@ -1,6 +1,6 @@
 from typing import Iterable
-from ._base import AudioConverter
+from ._base import AudioConverter, dtype_to_ffmpeg_format
 class RawInputAudioConverter(AudioConverter):
@ -8,13 +8,42 @@ class RawInputAudioConverter(AudioConverter):
    Converts raw audio input to a compressed media format.
    """
    def __init__(self, *args, **kwargs):
        super().__init__(*args, **kwargs)
        if self._dtype and not self._input_format:
            ffmpeg_format = dtype_to_ffmpeg_format.get(self._dtype)
            assert ffmpeg_format, (
                f'Unsupported data type: {self._dtype}. Supported data types: '
                f'{list(dtype_to_ffmpeg_format.keys())}'
            )
            self._input_format = ffmpeg_format
    @property
    def _input_format_args(self) -> Iterable[str]:
-        return self._raw_ffmpeg_args
+        args = (
            '-ar',
            str(self._sample_rate),
            *self._channel_layout_args,
        )
        if self._input_format:
            args = ('-f', self._input_format) + args
        return args
    @property
    def _output_format_args(self) -> Iterable[str]:
-        return self._compressed_ffmpeg_args
+        if not self._output_format:
            return ()
        ffmpeg_args = self._format_to_ffmpeg_args.get(self._output_format)
        assert ffmpeg_args, (
            f'Unsupported output format: {self._output_format}. Supported formats: '
            f'{list(self._format_to_ffmpeg_args.keys())}'
        )
        return ffmpeg_args
 # vim:sw=4:ts=4:et:
--- a/platypush/plugins/sound/_converters/_to_raw.py
+++ b/platypush/plugins/sound/_converters/_to_raw.py
@ -1,6 +1,6 @@
 from typing import Iterable
-from ._base import AudioConverter
+from ._base import AudioConverter, dtype_to_ffmpeg_format
 class RawOutputAudioConverter(AudioConverter):
@ -8,13 +8,40 @@ class RawOutputAudioConverter(AudioConverter):
    Converts input audio to raw audio output.
    """
    def __init__(self, *args, **kwargs):
        super().__init__(*args, **kwargs)
        if self._dtype and not self._output_format:
            ffmpeg_format = dtype_to_ffmpeg_format.get(self._dtype)
            assert ffmpeg_format, (
                f'Unsupported data type: {self._dtype}. Supported data types: '
                f'{list(dtype_to_ffmpeg_format.keys())}'
            )
            self._output_format = ffmpeg_format
    @property
    def _input_format_args(self) -> Iterable[str]:
-        return self._compressed_ffmpeg_args
+        if not self._input_format:
            return ()
        ffmpeg_args = self._format_to_ffmpeg_args.get(self._input_format)
        if not ffmpeg_args:
            return ('-f', self._input_format)
        return ffmpeg_args
    @property
    def _output_format_args(self) -> Iterable[str]:
-        return self._raw_ffmpeg_args
+        args = (
            '-ar',
            str(self._sample_rate),
            *self._channel_layout_args,
        )
        if self._output_format:
            args = ('-f', self._output_format) + args
        return args
 class RawOutputAudioFromFileConverter(RawOutputAudioConverter):
--- a/platypush/plugins/sound/_manager/_main.py
+++ b/platypush/plugins/sound/_manager/_main.py
@ -61,6 +61,7 @@ class AudioManager:
        duration: Optional[float] = None,
        sample_rate: Optional[int] = None,
        dtype: str = 'int16',
        format: Optional[str] = None,  # pylint: disable=redefined-builtin
        blocksize: Optional[int] = None,
        latency: Union[float, str] = 'high',
        stream_name: Optional[str] = None,
@ -77,6 +78,7 @@ class AudioManager:
        :param duration: Duration of the stream in seconds.
        :param sample_rate: Sample rate of the stream.
        :param dtype: Data type of the stream.
        :param format: Output format of the stream.
        :param blocksize: Block size of the stream.
        :param latency: Latency of the stream.
        :param stream_name: Name of the stream.
@ -93,6 +95,7 @@ class AudioManager:
            blocksize=blocksize or self.output_blocksize,
            latency=latency,
            channels=channels,
            output_format=format,
            queue_size=self.queue_size,
            should_stop=self._should_stop,
        )
--- a/platypush/plugins/sound/_streams/_base.py
+++ b/platypush/plugins/sound/_streams/_base.py
@ -43,6 +43,8 @@ class AudioThread(Thread, ABC):
        infile: Optional[str] = None,
        outfile: Optional[str] = None,
        duration: Optional[float] = None,
        input_format: Optional[str] = None,
        output_format: Optional[str] = None,
        latency: Union[float, str] = 'high',
        redis_queue: Optional[str] = None,
        should_stop: Optional[Event] = None,
@ -66,6 +68,8 @@ class AudioThread(Thread, ABC):
            stream.
        :param outfile: Path to the output file.
        :param duration: Duration of the audio stream.
        :param input_format: Input format override.
        :param output_format: Output format override.
        :param latency: Latency to use.
        :param redis_queue: Redis queue to use.
        :param should_stop: Synchronize with upstream stop events.
@ -83,6 +87,8 @@ class AudioThread(Thread, ABC):
        self.volume = volume
        self.sample_rate = sample_rate
        self.dtype = dtype
        self.input_format = input_format
        self.output_format = output_format
        self.stream = stream
        self.duration = duration
        self.blocksize = blocksize * channels
@ -349,6 +355,9 @@ class AudioThread(Thread, ABC):
            self.logger.warning(
                'Audio callback timeout for %s', self.__class__.__name__
            )
        except Exception as e:
            self.logger.warning('Unhandled sound on %s', self.__class__.__name__)
            self.logger.exception(e)
        finally:
            self.notify_stop()
--- a/platypush/plugins/sound/_streams/_player/_resource.py
+++ b/platypush/plugins/sound/_streams/_player/_resource.py
@ -20,6 +20,7 @@ class AudioResourcePlayer(AudioPlayer):
    def _converter_args(self) -> dict:
        return {
            'infile': self.infile,
            'output_format': self.output_format,
            **super()._converter_args,
        }
--- a/platypush/plugins/sound/_streams/_recorder.py
+++ b/platypush/plugins/sound/_streams/_recorder.py
@ -81,7 +81,7 @@ class AudioRecorder(AudioThread):
    @property
    def _converter_args(self) -> dict:
        return {
-            'format': self.output_format,
+            'output_format': self.output_format,
            **super()._converter_args,
        }