simple_ffmpeg_batch_io.AudioIO API documentation

AudioIO(*, logLevel=16, debugMode=False) View Source

222    def __init__(self, *, logLevel = 16, debugMode = False):
223        """
224        Create a VideoIO object giving ffmpeg/ffrobe loglevel and defining debug mode
225
226        Parameters
227        ----------
228        log_level: int (default 16)
229            Log level to pass to the underlying ffmpeg/ffprobe command.
230
231        debugMode: bool (default (False)
232            Show debug info. while processing video
233        """
234
235        self.mode = PipeMode.UNK_MODE
236        self.logLevel = logLevel
237        self.debugMode = debugMode
238
239        # Call init() method
240        self.init()

Create an AudioIO object, setting the ffmpeg/ffprobe log level and the debug mode.

Parameters

logLevel: int (default 16) Log level to pass to the underlying ffmpeg/ffprobe command.

debugMode: bool (default False) Show debug info while processing audio.

@classmethod

def reader(cls, filename, **kwargs): View Source

50    @classmethod
51    def reader(cls, filename, **kwargs):
52        """
53        Create and open an AudioIO object in reader mode
54
55        See ``AudioIO.open`` for the full list of accepted parameters.
56        """
57        reader = cls()
58        reader.open(filename, **kwargs)
59        return reader

Create and open an AudioIO object in reader mode

See AudioIO.open for the full list of accepted parameters.

@classmethod

def writer(cls, filename, sample_rate, channels, **kwargs): View Source

61    @classmethod
62    def writer(cls, filename, sample_rate, channels, **kwargs):
63        """
64        Create and open an AudioIO object in writer mode
65
66        See ``AudioIO.create`` for the full list of accepted parameters.
67        """
68        writer = cls()
69        writer.create(filename, sample_rate, channels, **kwargs)
70        return writer

Create and open an AudioIO object in writer mode

See AudioIO.create for the full list of accepted parameters.

@staticmethod

def get_time_in_sec(filename, *, debug=False, logLevel=16): View Source

 88    @staticmethod
 89    def get_time_in_sec(filename, *, debug=False, logLevel=16):
 90        """
 91        Static method to get length of an audio file (or video file containing audio) in seconds including milliseconds as decimal part (3 decimals).
 92
 93        Parameters
 94        ----------
 95        filename : str or path. 
 96            Raw audio waveform as a 1D array.
 97
 98        debug : bool (default False).
 99            Show debug info.
100
101        log_level: int (default 16).
102            Log level to pass to the underlying ffmpeg/ffprobe command.
103        
104        Returns
105        ----------
106        float
107            Length in seconds of video file (including milliseconds as decimal part with 3 decimals)
108        """
109        
110        cmd = [AudioIO.paramProgram, # ffprobe
111                    '-hide_banner',
112                    '-loglevel', str(logLevel),
113                    '-show_entries', 'format=duration',
114                    '-of', 'default=noprint_wrappers=1:nokey=1',
115                    filename
116                    ]
117
118        if debug == True:
119            print(' '.join(cmd))
120
121        # call ffprobe and get params in one single line
122        lpipe = sp.Popen(cmd, stdout=sp.PIPE, stdin=sp.PIPE) # stdin=sp.PIPE to prevent manipulation of shell echo mode by ffmpeg
123        output = lpipe.stdout.readlines()
124        lpipe.terminate()
125        # transform Bytes output to one single string
126        output = ''.join( [element.decode('utf-8') for element in output])
127
128        try:
129            return float(output)
130        except (ValueError, TypeError):
131            return None

Static method to get length of an audio file (or video file containing audio) in seconds including milliseconds as decimal part (3 decimals).

Parameters

filename : str or path. Path to the audio file (or video file containing audio) to inspect.

debug : bool (default False). Show debug info.

logLevel: int (default 16). Log level to pass to the underlying ffmpeg/ffprobe command.

Returns

float or None. Length in seconds of the file (including milliseconds as decimal part with 3 decimals). None if the ffprobe output cannot be parsed as a number.

@staticmethod

def get_params(filename, *, debug=False, logLevel=16): View Source

133    @staticmethod
134    def get_params(filename, *, debug=False, logLevel=16):
135        """
136        Static method to get params (channels,sample_rate) of a (video containing) audio file in seconds.
137
138        Parameters
139        ----------
140        filename : str or path.
141            Raw audio waveform as a 1D array.
142
143        debug : bool (default (False).
144            Show debug info.
145
146        log_level: int (default 16).
147            Log level to pass to the underlying ffmpeg/ffprobe command.
148
149        Returns
150        ----------
151        tuple
152            Tuple containing (channels,sample_rate) of the file
153        """
154        cmd = [AudioIO.paramProgram, # ffprobe
155                    '-hide_banner',
156                    '-loglevel', str(logLevel),
157                    '-show_entries', 'stream=channels,sample_rate',
158                    filename
159                    ]
160
161        if debug == True:
162            print(' '.join(cmd))
163
164        # call ffprobe and get params in one single line
165        lpipe = sp.Popen(cmd, stdout=sp.PIPE, stdin=sp.PIPE) # stdin=sp.PIPE to prevent manipulation of shell echo mode by ffmpeg
166        output = lpipe.stdout.readlines()
167        lpipe.terminate()
168        # transform Bytes output to one single string
169        output = ''.join( [element.decode('utf-8') for element in output])
170
171        pattern_sample_rate = r'sample_rate=(\d+)'
172        pattern_channels = r'channels=(\d+)'
173
174        # Search for values in the ffprobe output
175        match_sample_rate = re.search(pattern_sample_rate, output, flags=re.MULTILINE)
176        match_channels = re.search(pattern_channels, output, flags=re.MULTILINE)
177
178        # Extraction des valeurs
179        if match_sample_rate:
180            sample_rate = int(match_sample_rate.group(1))
181        else:
182            raise AudioIO.AudioIOException("Unable to get audio sample_rate of '" + str(filename) + "'")
183
184        if match_channels:
185            channels = int(match_channels.group(1))
186        else:
187            raise AudioIO.AudioIOException("Unable to get audio channels of '" + str(filename) + "'")
188
189        return (channels,sample_rate)
190
191        # Attributes
192        mode: PipeMode
193        """ Pipemode of the current object (default PipeMode.UNK_MODE)"""
194
195        loglevel: int
196        """ loglevel of the underlying ffmpeg backend for this object (default 16)"""
197
198        debugModel: bool
199        """ debutMode flag for this object (print debut info, default False)"""
200
201        channels: int
202        """ Number of channels of images (default -1) """
203
204        sample_rate: int
205        """ sample_rate of images (default -1) """
206
207        plannar: bool
208        """ Read/write data as plannar, i.e. not interleaved (default True) """
209
210        pipe: sp.Popen
211        """ pipe object to ffmpeg/ffprobe (default None)"""
212
213        frame_size: int
214        """ Weight in bytes of one image (default -1)"""
215
216        filename: str
217        """ Filename of the file (default None)"""
218
219        frame_counter: FrameCounter
220        """ `Framecounter` object to count ellapsed time (default None)"""

Static method to get the parameters (channels, sample_rate) of an audio file (or a video file containing audio).

Parameters

filename : str or path. Path to the audio file (or video file containing audio) to inspect.

debug : bool (default False). Show debug info.

logLevel: int (default 16). Log level to pass to the underlying ffmpeg/ffprobe command.

Returns

tuple Tuple containing (channels,sample_rate) of the file

mode

logLevel

debugMode

def init(self): View Source

242    def init(self):
243        """
244        Init or reinit a VideoIO object.
245        """
246        self.channels  = -1
247        self.sample_rate = -1
248        self.plannar = True
249        self.pipe = None
250        self.frame_size = -1
251        self.filename = None
252        self.frame_counter = None

Init or reinit an AudioIO object.

def get_elapsed_time_as_str(self) -> str: View Source

272    def get_elapsed_time_as_str(self) -> str:
273        """
274        Method to get elapsed time (float value represented) as str.
275
276        Returns
277        ----------
278        str or None
279            Elapsed time (float value) as str, "15.500" for instance for 15 secondes and 500 milliseconds
280            None if no frame counter are available.
281        """
282        if self.frame_counter is None:
283            return None
284        return self.frame_counter.get_elapsed_time_as_str()

Method to get elapsed time (float value represented) as str.

Returns

str or None. Elapsed time (float value) as str, "15.500" for instance for 15 seconds and 500 milliseconds. None if no frame counter is available.

def get_formated_elapsed_time_as_str(self, show_ms=True) -> str: View Source

286    def get_formated_elapsed_time_as_str(self,show_ms=True) -> str:
287        """
288        Method to get elapsed time (hour format) as str.
289
290        Returns
291        ----------
292        str or None
293            Elapsed time (float value) as str, "00:00:15.500" for instance for 15 secondes and 500 milliseconds
294            None if no frame counter are available.
295        """
296        if self.frame_counter is None:
297            return None
298        return self.frame_counter.get_formated_elapsed_time_as_str()

Method to get elapsed time (hour format) as str.

Returns

str or None. Elapsed time in hour format as str, "00:00:15.500" for instance for 15 seconds and 500 milliseconds. None if no frame counter is available.

def get_elapsed_time(self) -> float: View Source

300    def get_elapsed_time(self) -> float:
301        """
302        Method to get elapsed time as float value rounded to 3 decimals.
303
304        Returns
305        ----------
306        float or None
307            Elapsed time (float value) as str, 15.500 for instance for 15 secondes and 500 milliseconds
308            None if no frame counter are available.
309        """
310        if self.frame_counter is None:
311            return None
312        return self.frame_counter.get_elapsed_time()

Method to get elapsed time as float value rounded to 3 decimals.

Returns

float or None. Elapsed time as a float value, 15.500 for instance for 15 seconds and 500 milliseconds. None if no frame counter is available.

def is_opened(self) -> bool: View Source

314    def is_opened(self) -> bool:
315        """
316        Method to get status of the underlying pipe to ffmpeg.
317
318        Returns
319        ----------
320        bool
321            True if pipe is opened (reading or writing mode), False if not.
322        """
323        # is the pip opened?
324        if self.pipe is not None and self.pipe.poll() is None:
325            return True
326
327        return False

Method to get status of the underlying pipe to ffmpeg.

Returns

bool True if pipe is opened (reading or writing mode), False if not.

def close(self): View Source

329    def close(self):
330        """
331        Method to close current pipe to ffmpeg (if any). Ffmpeg/ffprobe  will be terminated. Object can be reused using open or create methods.
332        """
333        if self.pipe is not None:
334            if self.mode == PipeMode.WRITE_MODE:
335                # killing will make ffmpeg not finish properly the job, close the pipe
336                # to let it know that no more data are comming
337                self.pipe.stdin.close()
338            else: # self.mode == PipeMode.READ_MODE
339                # in read mode, no need to be nice, send SIGTERM on Linux,/Kill it on windows
340                self.pipe.kill()
341
342            # wait for subprocess to end
343            self.pipe.wait()
344
345        # reinit object for later use
346        self.init()

Method to close current pipe to ffmpeg (if any). Ffmpeg/ffprobe will be terminated. Object can be reused using open or create methods.

def create( self, filename, sample_rate, channels, *, writeOverExistingFile=False, outputEncoding=<AudioFormat.PCM32LE: 'pcm_f32le'>, encodingParams=None, plannar=True): View Source

348    def create( self, filename, sample_rate, channels, *, writeOverExistingFile = False,
349                outputEncoding = AudioFormat.PCM32LE, encodingParams = None, plannar = True ):
350        """
351        Method to create a audio file using parametrized access through ffmpeg. Importante note: calling create
352        on a AudioIO will close any former open video.
353
354        Parameters
355        ----------
356        filename: str or path
357            filename of path to the file (mp4, avi, ...)
358
359        sample_rate: int
360            If defined as a positive value, sample_rates of the output file will be set to this value.
361
362        channels: int
363            If defined as a positive value, number of channels of output file will be set to this value.
364
365        fps:
366            If defined as a positive value, fps of input video will be set to this value.
367
368        outputEncoding: AudioFormat optional (default AudioFormat.PCM32LE)
369            Define audio format for samples. Possible value is AudioFormat.PCM32LE.
370
371        encodingParams: str optional (default None)
372            Parameter to pass to ffmpeg to encode video like audio filters.
373
374        plannar : bool optionnal (default True)
375            Input data to write are grouped by channel if True, interleaved instead.
376
377        Returns
378        ----------
379        bool
380            Was the creation successfull
381        """
382
383        # Close if already opened
384        self.close()
385
386        # Set geometry/fps of the video stream from params
387        self.sample_rate = int(sample_rate)
388        self.channels = int(channels)
389        self.plannar = plannar
390
391        # Check params
392        if self.sample_rate <= 0 or self.channels <= 0:
393            raise self.AudioIOException("Bad parameters: sample_rate={}, channels={}".format(self.sample_rate,self.channels))
394
395        # To write audio, we do not need to know in advance frame size, we will write x values of n bytes
396        self.frame_size = None
397
398        # Video params are set, open the video
399        cmd = [self.audioProgram] # ffmpeg
400
401        if writeOverExistingFile == True:
402            cmd.extend(['-y'])
403
404        cmd.extend(['-hide_banner',
405            '-nostats',
406            '-loglevel', str(self.logLevel),
407            '-f', 'f32le', '-acodec', outputEncoding.value, # input expected coding
408            '-ar', f"{self.sample_rate}",
409            '-ac', f"{self.channels}",
410            '-i', '-'])
411
412        if encodingParams is not None:
413            cmd.extend(encodingParams.split())
414
415        # remove video
416        cmd.extend( ['-vn', filename ] )
417
418        if self.debugMode == True:
419            print( ' '.join(cmd), file=sys.stderr )
420
421        # store filename and set mode
422        self.filename = filename
423        self.mode = PipeMode.WRITE_MODE
424
425        # call ffmpeg in write mode
426        try:
427            self.pipe = sp.Popen(cmd, stdin=sp.PIPE)
428            self.frame_counter = FrameCounter(self.sample_rate)
429        except Exception as e:
430            # if pipe failed, reinit object and raise exception
431            self.init()
432            raise
433
434        return True

Method to create an audio file using parametrized access through ffmpeg. Important note: calling create on an AudioIO will close any previously opened file.

Parameters

filename: str or path. Filename or path to the output file (mp4, avi, ...)

sample_rate: int Sample rate of the output file. Must be a positive value, otherwise an AudioIOException is raised.

channels: int Number of channels of the output file. Must be a positive value, otherwise an AudioIOException is raised.

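writeOverExistingFile: bool optional (default False) If True, the '-y' option is passed to ffmpeg so that an existing output file is overwritten. (Note: create has no fps parameter.)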

outputEncoding: AudioFormat optional (default AudioFormat.PCM32LE) Define audio format for samples. Possible value is AudioFormat.PCM32LE.

encodingParams: str optional (default None) Extra parameters to pass to ffmpeg for encoding, such as audio filters. The string is split on whitespace into separate arguments.

plannar : bool optional (default True) Input data to write are grouped by channel if True, interleaved otherwise.

Returns

bool True if the creation was successful (an exception is raised otherwise).

def open( self, filename, *, sample_rate=-1, channels=-1, inputEncoding=<AudioFormat.PCM32LE: 'pcm_f32le'>, decodingParams=None, frame_size=1.0, plannar=True, start_time=0.0): View Source

436    def open( self, filename, *, sample_rate = -1, channels = -1, inputEncoding = AudioFormat.PCM32LE,
437                    decodingParams = None, frame_size = 1.0, plannar = True, start_time = 0.0 ):
438        """
439        Method to read (video file containing) audio using parametrized access through ffmpeg. Importante note: calling open
440        on a AudioIO will close any former open file.
441
442        Parameters
443        ----------
444        filename: str or path
445            filename of path to the file (mp4, avi, ...)
446
447        sample_rate: int optional (default -1)
448            If defined as a positive value, sample rate of the input audio will be converted to this value.
449
450        channels: int optional (default -1)
451            If defined as a positive value, number of channels of the input audio will converted to this value.
452
453        inputEncoding: AudioFormat optional (default AudioFormat.PCM32LE)
454            Define audio format for samples. Possible value is AudioFormat.PCM32LE.
455
456        decodingParams: str optional (default None)
457            Parameter to pass to ffmpeg to decode video like audio filters.
458
459        plannar: bool optionnal (default True)
460            Group audio samples per channel if True. Else, samples are interleaved.
461
462        frame_size: int or float (default 1.0)
463            If frame_size is an int, it is the number of expected samples in each frame, for instance 8000 for 8000 samples.
464            if frame_size is a float, it is considered as a time in seconds for each audio frame, for instance 1.0 for 1 second, 0.010 for 10 ms.
465            Number of samples in this case is computed using frame_size and sample_rate as int(frame_size * sample_rate)
466
467        start_time: float optional (default 0.0)
468            Define the reading start time. If not set, reading at beginning of the file.
469
470        Returns
471        ----------
472        bool
473            Was the opening successfull
474        """
475
476        # Close if already opened
477        self.close()
478
479        # Force conversion of parameters
480        channels = int(channels)
481        sample_rate = float(sample_rate)
482
483        self.plannar = plannar
484
485        # get parameters from file if needed:
486        if sample_rate <= 0 or channels <= 0:
487            self.channels, self.sample_rate = self.getAudioParams(filename)
488
489        # check if parameters ask to overide video parameters
490        if channels > 0:
491            self.channels = channels
492        if sample_rate > 0:
493            self.sample_rate = sample_rate
494
495        # check parameters
496
497        if isinstance(frame_size,float):
498            # time in seconds
499            self.frame_size = int(frame_size*self.sample_rate)
500        elif isinstance(frame_size,int):
501            # number of samples
502            self.frame_size = frame_size
503        else:
504            # to do
505            pass
506
507        # Video params are set, open the video
508        cmd = [self.audioProgram, # ffmpeg
509                    '-hide_banner',
510                    '-nostats',
511                    '-loglevel', str(self.logLevel)]
512
513        if decodingParams is not None:
514            cmd.extend([decodingParams.split()])
515
516        if start_time < 0.0:
517            pass
518        elif start_time > 0.0:
519            cmd.extend(["-ss", f"{start_time}"])            
520
521        cmd.extend( ['-i', filename,
522                     '-f', 'f32le', '-acodec', inputEncoding.value, # input expected coding
523                     '-ar', f"{self.sample_rate}",
524                     '-ac', f"{self.channels}",
525                     '-' # output to stdout
526                    ]
527                )
528
529        if self.debugMode == True:
530            print( ' '.join(cmd) )
531
532        # store filename and set mode to READ_MODE
533        self.filename = filename
534        self.mode = PipeMode.READ_MODE
535
536        # call ffmpeg in read mode
537        try:
538            self.pipe = sp.Popen(cmd, stdout=sp.PIPE, stdin=sp.PIPE) # stdin=sp.PIPE to prevent manipulation of shell echo mode by ffmpeg/ffprobe
539            self.frame_counter = FrameCounter(self.sample_rate)
540            if start_time > 0.0:
541                self.frame_counter += start_time # adding with float means adding time
542        except Exception as e:
543            # if pipe failed, reinit object and raise exception
544            self.init()
545            raise
546
547        return True

Method to read an audio file (or a video file containing audio) using parametrized access through ffmpeg. Important note: calling open on an AudioIO will close any previously opened file.

Parameters

filename: str or path. Filename or path to the input file (mp4, avi, ...)

sample_rate: int optional (default -1) If defined as a positive value, sample rate of the input audio will be converted to this value.

channels: int optional (default -1) If defined as a positive value, the number of channels of the input audio will be converted to this value.

inputEncoding: AudioFormat optional (default AudioFormat.PCM32LE) Define audio format for samples. Possible value is AudioFormat.PCM32LE.

decodingParams: str optional (default None) Extra parameters to pass to ffmpeg for decoding, such as audio filters.

plannar: bool optional (default True) Group audio samples per channel if True. Otherwise, samples are interleaved.

frame_size: int or float (default 1.0) If frame_size is an int, it is the number of expected samples in each frame, for instance 8000 for 8000 samples. if frame_size is a float, it is considered as a time in seconds for each audio frame, for instance 1.0 for 1 second, 0.010 for 10 ms. Number of samples in this case is computed using frame_size and sample_rate as int(frame_size * sample_rate)

start_time: float optional (default 0.0) Define the reading start time in seconds. If not set, reading starts at the beginning of the file.

Returns

bool True if the opening was successful (an exception is raised otherwise).

def read_frame(self, with_timestamps=False): View Source

549    def read_frame(self, with_timestamps = False):
550        """
551        Read next frame from the audio file
552
553        Parameters
554        ----------
555        with_timestamps: bool optional (default False)
556            If set to True, the method returns a ``FrameContainer`` with the audio and an array containing the associated timestamp(s)
557
558        Returns
559        ----------
560        nparray or FrameContainer
561            A frame of shape (self.channels,self.frame_size) as defined in the reader/open call if self.plannar is True. A frame
562            of shape (self.channels*self.frame_size) with interleaved data if self.plannar is False.
563            if with_timestamps is True, the return object is a FrameContainer with the audio data in ``FrameContainer.data`` and
564            the associated timestamp in ``FrameContainer.timestamps`` as an array (one element).
565        """
566
567        if self.pipe is None:
568            raise self.AudioIOException("No pipe opened to {}. Call open(...) before reading a frame.".format(self.audioProgram))
569        # - pipe is in write mode
570        if self.mode != PipeMode.READ_MODE:
571            raise self.AudioIOException("Pipe to {} for '{}' not opened in read mode.".format(self.audioProgram, self.filename))
572
573        if with_timestamps:
574            # get elapsed time in video, it is time of next frame(s)
575            current_elapsed_time = self.get_elapsed_time()
576
577        # read rgb image from pipe
578        toread = self.frame_size*4
579        buffer = self.pipe.stdout.read(toread)
580        if len(buffer) != toread:
581            # not considered as an error, no more frame, no exception
582            return None
583
584        # get numpy UINT8 array from buffer
585        audio = np.frombuffer(buffer, dtype = np.float32).reshape(self.frame_size, self.channels)
586
587        # make it plannar (or not)
588        if self.plannar:
589            #transpose it
590            audio = audio.T
591
592        # increase frame_counter
593        self.frame_counter.frame_count += (self.frame_size * self.channels)
594
595        # say to gc that this buffer is no longer needed
596        del buffer
597
598        if with_timestamps:
599            return FrameContainer(1, audio, self.frame_size/self.sample_rate, current_elapsed_time)
600        
601        return audio

Parameters

with_timestamps: bool optional (default False) If set to True, the method returns a FrameContainer with the audio and an array containing the associated timestamp(s)

Returns

nparray or FrameContainer A frame of shape (self.channels,self.frame_size) as defined in the reader/open call if self.plannar is True. A frame of shape (self.channels*self.frame_size) with interleaved data if self.plannar is False. if with_timestamps is True, the return object is a FrameContainer with the audio data in FrameContainer.data and the associated timestamp in FrameContainer.timestamps as an array (one element).

def read_batch(self, numberOfFrames, with_timestamps=False): View Source

603    def read_batch(self, numberOfFrames, with_timestamps = False):
604        """
605        Read next batch of audio from the file
606
607        Parameters
608        ----------
609        number_of_frames: int
610            Number of desired images within the batch. The last batch from the file may have less images.
611            
612        with_timestamps: bool optional (default False)
613            If set to True, the method returns a FrameContainer with the batch and the an array containing the associated timestamps to frames
614
615        Returns
616        ----------
617        nparray or FrameContainer
618            A batch of shape (n, self.channels,self.frame_size) as defined in the reader/open call if self.plannar is True. A batch
619            of shape (n, self.channels*self.frame_size) with interleaved data if self.plannar is False.
620            if with_timestamps is True, the return object is a FrameContainer with the audio batch in ``FrameContainer.data`` and
621            the associated timestamp in ``FrameContainer.timestamps`` as an array (one element for each audio frame).
622        """
623
624        if self.pipe is None:
625            raise self.AudioIOException("No pipe opened to {}. Call open(...) before reading frames.".format(self.audioProgram))
626        # - pipe is in write mode
627        if self.mode != PipeMode.READ_MODE:
628            raise self.AudioIOException("Pipe to {} for '{}' not opened in read mode.".format(self.audioProgram, self.filename))
629
630        if with_timestamps:
631            # get elapsed time in video, it is time of next frame(s)
632            current_elapsed_time = self.get_elapsed_time()
633
634        # try to read complete batch
635        toread = self.frame_size*4*self.channels*numberOfFrames
636        buffer = self.pipe.stdout.read(toread)
637
638        # check if we have at least 1 Frame
639        if len(buffer) < toread:
640            # not considered as an error, no more frame, no exception
641            return None
642
643        # compute actual number of Frames
644        actualNbFrames = len(buffer)//(self.frame_size*4*self.channels)
645
646        # get and reshape batch from buffer
647        batch = np.frombuffer(buffer, dtype = np.float32).reshape((actualNbFrames, self.frame_size, self.channels,))
648
649        if self.plannar:
650            batch = batch.transpose(0, 2, 1)
651
652        # increase frame_counter
653        self.frame_counter.frame_count += (actualNbFrames * self.frame_size * self.channels)
654        
655        # say to gc that this buffer is no longer needed
656        del buffer
657
658        if with_timestamps:
659            return FrameContainer( actualNbFrames, batch, self.frame_size/self.sample_rate, current_elapsed_time)
660        
661        return batch

Parameters

numberOfFrames: int Number of desired audio frames within the batch. The last batch from the file may have fewer frames.

with_timestamps: bool optional (default False) If set to True, the method returns a FrameContainer with the batch and an array containing the timestamps associated with the frames

Returns

nparray or FrameContainer A batch of shape (n, self.channels,self.frame_size) as defined in the reader/open call if self.plannar is True. A batch of shape (n, self.channels*self.frame_size) with interleaved data if self.plannar is False. if with_timestamps is True, the return object is a FrameContainer with the audio batch in FrameContainer.data and the associated timestamp in FrameContainer.timestamps as an array (one element for each audio frame).

def write_frame(self, audio) -> bool: View Source

663    def write_frame(self, audio) -> bool:
664        """
665        Write an audio frame to the file
666
667        Parameters
668        ----------
669        audio: nparray
670            The audio frame to write to the video file of shape (self.channels,nb_samples_per_channel) if plannar is True else (self.channels*nb_samples_per_channel).
671
672        Returns
673        ----------
674        bool
675            Writing was successful or not.
676        """
677        # Check params
678        # - pipe exists
679        if self.pipe is None:
680            raise self.AudioIOException("No pipe opened to {}. Call create(...) before writing frames.".format(self.audioProgram))
681        # - pipe is in write mode
682        if self.mode != PipeMode.WRITE_MODE:
683            raise self.AudioIOException("Pipe to {} for '{}' not opened in write mode.".format(self.audioProgram, self.filename))
684        # - shape of image is fine, thus we have pixels for a full compatible frame
685        if audio.shape[0] != self.channels:
686            raise self.AudioIOException("Wong audio shape: {} expected ({},{}).".format(audio.shape,self.channels,self.frame_size))
687        # - type of data is Float32
688        if audio.dtype != np.float32:
689            raise self.AudioIOException("Wong audio type: {} expected np.float32.".format(audio.dtype))
690
691        # array must have a shape (channels, samples), reshape it it to (samples, channels) if plannar
692        if not self.plannar:
693            audio = audio.reshape(-1)
694
695        # print( audio.shape )
696
697        # garantee to have a C continuous array
698        if not audio.flags['C_CONTIGUOUS']:
699            a = np.ascontiguousarray(a) 
700
701        # write frame
702        buffer = audio.tobytes()
703        if self.pipe.stdin.write( buffer ) < len(buffer):
704            print( f"Error writing frame to {self.filename}" )
705            return False
706
707        # increase frame_counter
708        self.frame_counter.frame_count += (self.frame_size * self.channels)
709
710        # say to gc that this buffer is no longer needed 
711        del buffer
712
713        return True

Write an audio frame to the file

Parameters

audio: nparray The audio frame to write to the audio file, of shape (self.channels,nb_samples_per_channel) if plannar is True else (self.channels*nb_samples_per_channel).

Returns

bool Writing was successful or not.

def write_batch(self, batch): View Source

715    def write_batch(self, batch):
716        """
717        Write a batch of audio frame to the file
718
719        Parameters
720        ----------
721        batch: nparray
722            The batch of audio frames to write to the video file of shape (n,self.channels,nb_samples_per_channel) if plannar is True else (n,self.channels*nb_samples_per_channel) of interleaved audio data.
723
724        Returns
725        ----------
726        bool
727            Writing was successful or not.
728        """
729        # Check params
730        # - pipe exists
731        if self.pipe is None:
732            raise self.AudioIOException("No pipe opened to {}. Call create(...) before writing frames.".format(self.audioProgram))
733        # - pipe is in write mode
734        if self.mode != PipeMode.WRITE_MODE:
735            raise self.AudioIOException("Pipe to {} for '{}' not opened in write mode.".format(self.audioProgram, self.filename))
736        # batch is 3D (n, channels, nb samples)
737        if batch.ndim !=3:
738            raise self.AudioIOException("Wrong batch shape: {} expected 3 dimensions (n, n_channels, n_samples_per_channel).".format(batch.shape))
739        # - shape of images in batch is fine
740        if batch.shape[2] != self.channels:
741            raise self.AudioIOException("Wrong audio channels in batch: {} expected {} {}.".format(batch.shape[2], self.channels, batch.shape))
742
743        # array must have a shape (n * n_channels * n_samples_per_channel) before writing them to pipe
744        # reshape it it to (n * n_channels * n_samples_per_channel) if plannar is False
745        if not self.plannar:
746            # goes from (n, n_channels, n_samples_per_channel) to (n * n_channels * n_samples_per_channel)
747            batch = batch.transpose(0, 2, 1) # first go to (n, n_samples_per_channel, n_channels)
748            batch = batch.reshape(-1) # then to 1D array (n * n_channels * n_samples_per_channel)
749
750        # garantee to have a C continuous array
751        if not batch.flags['C_CONTIGUOUS']:
752            batch = np.ascontiguousarray(batch)
753
754        # write frame
755        buffer = batch.tobytes()
756        if self.pipe.stdin.write( buffer ) < len(buffer):
757            # say to gc that this buffer is no longer needed
758            del buffer
759            raise self.AudioIOException("Error writing batch to '{}'.".format(self.filename))
760
761        # increase frame_counter
762        self.frame_counter.frame_count += int(batch.shape[0]/self.channels) # int conversion is mandatory to avoid confusion with time as float
763              
764        # say to gc that this buffer is no longer needed
765        del buffer
766
767        return True

Write a batch of audio frames to the file

Parameters

batch: nparray The batch of audio frames to write to the video file of shape (n,self.channels,nb_samples_per_channel) if plannar is True else (n,self.channels*nb_samples_per_channel) of interleaved audio data.

Returns

bool Writing was successful or not.

def iter_frames(self, with_timestamps=False): View Source

769    def iter_frames(self, with_timestamps = False):
770        """
771        Method to iterate on audio frames using AudioIO obj.
772        for audio_frame in obj.iter_frames():
773            ....
774
775        Parameters
776        ----------
777        with_timestamps: bool optional (default False)
778            If set to True, the method returns a FrameContainer object with the batch and an array containing the associated timestamps to frames
779
780        Returns
781        ----------
782        nparray or FrameContainer
783            A batch of images of shape ()
784        """
785
786        try:
787            if self.mode == PipeMode.READ_MODE:
788                while self.isOpened():
789                    frame = self.readFrame(with_timestamps)
790                    if frame is not None:
791                        yield frame
792        finally:
793            self.close()

Iterate over the audio frames of the file using an AudioIO object, e.g. for audio_frame in obj.iter_frames(): ....

Parameters

with_timestamps: bool optional (default False) If set to True, the method yields a FrameContainer object with the audio frame and an array containing the associated timestamp

Returns

nparray or FrameContainer Each iteration yields one audio frame as returned by readFrame: an nparray, or a FrameContainer when with_timestamps is True.

def iter_batches(self, batch_size: int, with_timestamps=False): View Source

795    def iter_batches(self, batch_size : int, with_timestamps = False ):
796        """
797        Method to iterate on batch ofaudio  frames using VideoIO obj.
798        for audio_batch in obj.iter_batches():
799            ....
800
801        Parameters
802        ----------
803        with_timestamps: bool optional (default False)
804            If set to True, the method returns a FrameContainer with the batch and the an array containing the associated timestamps to frames
805        """
806        try:
807            if self.mode == PipeMode.READ_MODE:
808                while self.isOpened():
809                    batch = self.readBatch(batch_size, with_timestamps)
810                    if batch is not None:
811                        yield batch
812        finally:
813            self.close()

Iterate over batches of audio frames using an AudioIO object, e.g. for audio_batch in obj.iter_batches(batch_size): ....

Parameters

batch_size: int Number of audio frames requested for each batch; it is passed to readBatch.

with_timestamps: bool optional (default False) If set to True, the method yields a FrameContainer with the batch and an array containing the timestamps associated with the frames

@staticmethod

def getAudioTimeInSec(filename, *, debug=False, logLevel=16): View Source

 88    @staticmethod
 89    def get_time_in_sec(filename, *, debug=False, logLevel=16):
 90        """
 91        Static method to get length of an audio file (or video file containing audio) in seconds including milliseconds as decimal part (3 decimals).
 92
 93        Parameters
 94        ----------
 95        filename : str or path. 
 96            Raw audio waveform as a 1D array.
 97
 98        debug : bool (default False).
 99            Show debug info.
100
101        log_level: int (default 16).
102            Log level to pass to the underlying ffmpeg/ffprobe command.
103        
104        Returns
105        ----------
106        float
107            Length in seconds of video file (including milliseconds as decimal part with 3 decimals)
108        """
109        
110        cmd = [AudioIO.paramProgram, # ffprobe
111                    '-hide_banner',
112                    '-loglevel', str(logLevel),
113                    '-show_entries', 'format=duration',
114                    '-of', 'default=noprint_wrappers=1:nokey=1',
115                    filename
116                    ]
117
118        if debug == True:
119            print(' '.join(cmd))
120
121        # call ffprobe and get params in one single line
122        lpipe = sp.Popen(cmd, stdout=sp.PIPE, stdin=sp.PIPE) # stdin=sp.PIPE to prevent manipulation of shell echo mode by ffmpeg
123        output = lpipe.stdout.readlines()
124        lpipe.terminate()
125        # transform Bytes output to one single string
126        output = ''.join( [element.decode('utf-8') for element in output])
127
128        try:
129            return float(output)
130        except (ValueError, TypeError):
131            return None

Static method to get length of an audio file (or video file containing audio) in seconds including milliseconds as decimal part (3 decimals).

Parameters

filename : str or path. Path of the audio file (or video file containing audio) to probe with ffprobe.

debug : bool (default False). Show debug info.

logLevel: int (default 16). Log level to pass to the underlying ffmpeg/ffprobe command.

Returns

float Length in seconds of the file (including milliseconds as decimal part with 3 decimals), or None if the ffprobe output cannot be converted to a number.

@staticmethod

def getAudioParams(filename, *, debug=False, logLevel=16): View Source

133    @staticmethod
134    def get_params(filename, *, debug=False, logLevel=16):
135        """
136        Static method to get params (channels,sample_rate) of a (video containing) audio file in seconds.
137
138        Parameters
139        ----------
140        filename : str or path.
141            Raw audio waveform as a 1D array.
142
143        debug : bool (default (False).
144            Show debug info.
145
146        log_level: int (default 16).
147            Log level to pass to the underlying ffmpeg/ffprobe command.
148
149        Returns
150        ----------
151        tuple
152            Tuple containing (channels,sample_rate) of the file
153        """
154        cmd = [AudioIO.paramProgram, # ffprobe
155                    '-hide_banner',
156                    '-loglevel', str(logLevel),
157                    '-show_entries', 'stream=channels,sample_rate',
158                    filename
159                    ]
160
161        if debug == True:
162            print(' '.join(cmd))
163
164        # call ffprobe and get params in one single line
165        lpipe = sp.Popen(cmd, stdout=sp.PIPE, stdin=sp.PIPE) # stdin=sp.PIPE to prevent manipulation of shell echo mode by ffmpeg
166        output = lpipe.stdout.readlines()
167        lpipe.terminate()
168        # transform Bytes output to one single string
169        output = ''.join( [element.decode('utf-8') for element in output])
170
171        pattern_sample_rate = r'sample_rate=(\d+)'
172        pattern_channels = r'channels=(\d+)'
173
174        # Search for values in the ffprobe output
175        match_sample_rate = re.search(pattern_sample_rate, output, flags=re.MULTILINE)
176        match_channels = re.search(pattern_channels, output, flags=re.MULTILINE)
177
178        # Extraction des valeurs
179        if match_sample_rate:
180            sample_rate = int(match_sample_rate.group(1))
181        else:
182            raise AudioIO.AudioIOException("Unable to get audio sample_rate of '" + str(filename) + "'")
183
184        if match_channels:
185            channels = int(match_channels.group(1))
186        else:
187            raise AudioIO.AudioIOException("Unable to get audio channels of '" + str(filename) + "'")
188
189        return (channels,sample_rate)
190
191        # Attributes
192        mode: PipeMode
193        """ Pipemode of the current object (default PipeMode.UNK_MODE)"""
194
195        loglevel: int
196        """ loglevel of the underlying ffmpeg backend for this object (default 16)"""
197
198        debugModel: bool
199        """ debutMode flag for this object (print debut info, default False)"""
200
201        channels: int
202        """ Number of channels of images (default -1) """
203
204        sample_rate: int
205        """ sample_rate of images (default -1) """
206
207        plannar: bool
208        """ Read/write data as plannar, i.e. not interleaved (default True) """
209
210        pipe: sp.Popen
211        """ pipe object to ffmpeg/ffprobe (default None)"""
212
213        frame_size: int
214        """ Weight in bytes of one image (default -1)"""
215
216        filename: str
217        """ Filename of the file (default None)"""
218
219        frame_counter: FrameCounter
220        """ `Framecounter` object to count ellapsed time (default None)"""

Static method to get the params (channels, sample_rate) of an audio file (or of a video file containing audio).

Parameters

filename : str or path. Path of the audio file (or video file containing audio) to probe with ffprobe.

debug : bool (default False). Show debug info.

logLevel: int (default 16). Log level to pass to the underlying ffmpeg/ffprobe command.

Returns

tuple Tuple containing (channels,sample_rate) of the file

@staticmethod

def get_audio_time_in_sec(filename, *, debug=False, logLevel=16): View Source

 88    @staticmethod
 89    def get_time_in_sec(filename, *, debug=False, logLevel=16):
 90        """
 91        Static method to get length of an audio file (or video file containing audio) in seconds including milliseconds as decimal part (3 decimals).
 92
 93        Parameters
 94        ----------
 95        filename : str or path. 
 96            Raw audio waveform as a 1D array.
 97
 98        debug : bool (default False).
 99            Show debug info.
100
101        log_level: int (default 16).
102            Log level to pass to the underlying ffmpeg/ffprobe command.
103        
104        Returns
105        ----------
106        float
107            Length in seconds of video file (including milliseconds as decimal part with 3 decimals)
108        """
109        
110        cmd = [AudioIO.paramProgram, # ffprobe
111                    '-hide_banner',
112                    '-loglevel', str(logLevel),
113                    '-show_entries', 'format=duration',
114                    '-of', 'default=noprint_wrappers=1:nokey=1',
115                    filename
116                    ]
117
118        if debug == True:
119            print(' '.join(cmd))
120
121        # call ffprobe and get params in one single line
122        lpipe = sp.Popen(cmd, stdout=sp.PIPE, stdin=sp.PIPE) # stdin=sp.PIPE to prevent manipulation of shell echo mode by ffmpeg
123        output = lpipe.stdout.readlines()
124        lpipe.terminate()
125        # transform Bytes output to one single string
126        output = ''.join( [element.decode('utf-8') for element in output])
127
128        try:
129            return float(output)
130        except (ValueError, TypeError):
131            return None

Static method to get length of an audio file (or video file containing audio) in seconds including milliseconds as decimal part (3 decimals).

Parameters

filename : str or path. Path of the audio file (or video file containing audio) to probe with ffprobe.

debug : bool (default False). Show debug info.

logLevel: int (default 16). Log level to pass to the underlying ffmpeg/ffprobe command.

Returns

float Length in seconds of the file (including milliseconds as decimal part with 3 decimals), or None if the ffprobe output cannot be converted to a number.

@staticmethod

def get_audio_params(filename, *, debug=False, logLevel=16): View Source

133    @staticmethod
134    def get_params(filename, *, debug=False, logLevel=16):
135        """
136        Static method to get params (channels,sample_rate) of a (video containing) audio file in seconds.
137
138        Parameters
139        ----------
140        filename : str or path.
141            Raw audio waveform as a 1D array.
142
143        debug : bool (default (False).
144            Show debug info.
145
146        log_level: int (default 16).
147            Log level to pass to the underlying ffmpeg/ffprobe command.
148
149        Returns
150        ----------
151        tuple
152            Tuple containing (channels,sample_rate) of the file
153        """
154        cmd = [AudioIO.paramProgram, # ffprobe
155                    '-hide_banner',
156                    '-loglevel', str(logLevel),
157                    '-show_entries', 'stream=channels,sample_rate',
158                    filename
159                    ]
160
161        if debug == True:
162            print(' '.join(cmd))
163
164        # call ffprobe and get params in one single line
165        lpipe = sp.Popen(cmd, stdout=sp.PIPE, stdin=sp.PIPE) # stdin=sp.PIPE to prevent manipulation of shell echo mode by ffmpeg
166        output = lpipe.stdout.readlines()
167        lpipe.terminate()
168        # transform Bytes output to one single string
169        output = ''.join( [element.decode('utf-8') for element in output])
170
171        pattern_sample_rate = r'sample_rate=(\d+)'
172        pattern_channels = r'channels=(\d+)'
173
174        # Search for values in the ffprobe output
175        match_sample_rate = re.search(pattern_sample_rate, output, flags=re.MULTILINE)
176        match_channels = re.search(pattern_channels, output, flags=re.MULTILINE)
177
178        # Extraction des valeurs
179        if match_sample_rate:
180            sample_rate = int(match_sample_rate.group(1))
181        else:
182            raise AudioIO.AudioIOException("Unable to get audio sample_rate of '" + str(filename) + "'")
183
184        if match_channels:
185            channels = int(match_channels.group(1))
186        else:
187            raise AudioIO.AudioIOException("Unable to get audio channels of '" + str(filename) + "'")
188
189        return (channels,sample_rate)
190
191        # Attributes
192        mode: PipeMode
193        """ Pipemode of the current object (default PipeMode.UNK_MODE)"""
194
195        loglevel: int
196        """ loglevel of the underlying ffmpeg backend for this object (default 16)"""
197
198        debugModel: bool
199        """ debutMode flag for this object (print debut info, default False)"""
200
201        channels: int
202        """ Number of channels of images (default -1) """
203
204        sample_rate: int
205        """ sample_rate of images (default -1) """
206
207        plannar: bool
208        """ Read/write data as plannar, i.e. not interleaved (default True) """
209
210        pipe: sp.Popen
211        """ pipe object to ffmpeg/ffprobe (default None)"""
212
213        frame_size: int
214        """ Weight in bytes of one image (default -1)"""
215
216        filename: str
217        """ Filename of the file (default None)"""
218
219        frame_counter: FrameCounter
220        """ `Framecounter` object to count ellapsed time (default None)"""

Static method to get the params (channels, sample_rate) of an audio file (or of a video file containing audio).

Parameters

filename : str or path. Path of the audio file (or video file containing audio) to probe with ffprobe.

debug : bool (default False). Show debug info.

logLevel: int (default 16). Log level to pass to the underlying ffmpeg/ffprobe command.

Returns

tuple Tuple containing (channels,sample_rate) of the file

def isOpened(self) -> bool: View Source

314    def is_opened(self) -> bool:
315        """
316        Method to get status of the underlying pipe to ffmpeg.
317
318        Returns
319        ----------
320        bool
321            True if pipe is opened (reading or writing mode), False if not.
322        """
323        # is the pip opened?
324        if self.pipe is not None and self.pipe.poll() is None:
325            return True
326
327        return False

Method to get status of the underlying pipe to ffmpeg.

Returns

bool True if pipe is opened (reading or writing mode), False if not.

def readFrame(self, with_timestamps=False): View Source

549    def read_frame(self, with_timestamps = False):
550        """
551        Read next frame from the audio file
552
553        Parameters
554        ----------
555        with_timestamps: bool optional (default False)
556            If set to True, the method returns a ``FrameContainer`` with the audio and an array containing the associated timestamp(s)
557
558        Returns
559        ----------
560        nparray or FrameContainer
561            A frame of shape (self.channels,self.frame_size) as defined in the reader/open call if self.plannar is True. A frame
562            of shape (self.channels*self.frame_size) with interleaved data if self.plannar is False.
563            if with_timestamps is True, the return object is a FrameContainer with the audio data in ``FrameContainer.data`` and
564            the associated timestamp in ``FrameContainer.timestamps`` as an array (one element).
565        """
566
567        if self.pipe is None:
568            raise self.AudioIOException("No pipe opened to {}. Call open(...) before reading a frame.".format(self.audioProgram))
569        # - pipe is in write mode
570        if self.mode != PipeMode.READ_MODE:
571            raise self.AudioIOException("Pipe to {} for '{}' not opened in read mode.".format(self.audioProgram, self.filename))
572
573        if with_timestamps:
574            # get elapsed time in video, it is time of next frame(s)
575            current_elapsed_time = self.get_elapsed_time()
576
577        # read rgb image from pipe
578        toread = self.frame_size*4
579        buffer = self.pipe.stdout.read(toread)
580        if len(buffer) != toread:
581            # not considered as an error, no more frame, no exception
582            return None
583
584        # get numpy UINT8 array from buffer
585        audio = np.frombuffer(buffer, dtype = np.float32).reshape(self.frame_size, self.channels)
586
587        # make it plannar (or not)
588        if self.plannar:
589            #transpose it
590            audio = audio.T
591
592        # increase frame_counter
593        self.frame_counter.frame_count += (self.frame_size * self.channels)
594
595        # say to gc that this buffer is no longer needed
596        del buffer
597
598        if with_timestamps:
599            return FrameContainer(1, audio, self.frame_size/self.sample_rate, current_elapsed_time)
600        
601        return audio

Parameters

with_timestamps: bool optional (default False) If set to True, the method returns a FrameContainer with the audio and an array containing the associated timestamp(s)

Returns

nparray or FrameContainer A frame of shape (self.channels,self.frame_size) as defined in the reader/open call if self.plannar is True. A frame of shape (self.channels*self.frame_size) with interleaved data if self.plannar is False. if with_timestamps is True, the return object is a FrameContainer with the audio data in FrameContainer.data and the associated timestamp in FrameContainer.timestamps as an array (one element).

def readBatch(self, numberOfFrames, with_timestamps=False): View Source

603    def read_batch(self, numberOfFrames, with_timestamps = False):
604        """
605        Read next batch of audio from the file
606
607        Parameters
608        ----------
609        number_of_frames: int
610            Number of desired images within the batch. The last batch from the file may have less images.
611            
612        with_timestamps: bool optional (default False)
613            If set to True, the method returns a FrameContainer with the batch and the an array containing the associated timestamps to frames
614
615        Returns
616        ----------
617        nparray or FrameContainer
618            A batch of shape (n, self.channels,self.frame_size) as defined in the reader/open call if self.plannar is True. A batch
619            of shape (n, self.channels*self.frame_size) with interleaved data if self.plannar is False.
620            if with_timestamps is True, the return object is a FrameContainer with the audio batch in ``FrameContainer.data`` and
621            the associated timestamp in ``FrameContainer.timestamps`` as an array (one element for each audio frame).
622        """
623
624        if self.pipe is None:
625            raise self.AudioIOException("No pipe opened to {}. Call open(...) before reading frames.".format(self.audioProgram))
626        # - pipe is in write mode
627        if self.mode != PipeMode.READ_MODE:
628            raise self.AudioIOException("Pipe to {} for '{}' not opened in read mode.".format(self.audioProgram, self.filename))
629
630        if with_timestamps:
631            # get elapsed time in video, it is time of next frame(s)
632            current_elapsed_time = self.get_elapsed_time()
633
634        # try to read complete batch
635        toread = self.frame_size*4*self.channels*numberOfFrames
636        buffer = self.pipe.stdout.read(toread)
637
638        # check if we have at least 1 Frame
639        if len(buffer) < toread:
640            # not considered as an error, no more frame, no exception
641            return None
642
643        # compute actual number of Frames
644        actualNbFrames = len(buffer)//(self.frame_size*4*self.channels)
645
646        # get and reshape batch from buffer
647        batch = np.frombuffer(buffer, dtype = np.float32).reshape((actualNbFrames, self.frame_size, self.channels,))
648
649        if self.plannar:
650            batch = batch.transpose(0, 2, 1)
651
652        # increase frame_counter
653        self.frame_counter.frame_count += (actualNbFrames * self.frame_size * self.channels)
654        
655        # say to gc that this buffer is no longer needed
656        del buffer
657
658        if with_timestamps:
659            return FrameContainer( actualNbFrames, batch, self.frame_size/self.sample_rate, current_elapsed_time)
660        
661        return batch

Parameters

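numberOfFrames: int Number of desired audio frames within the batch. The last batch from the file is meant to be allowed to hold fewer frames; note, however, that the implementation listed above returns None whenever fewer bytes than a full batch are read.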

with_timestamps: bool optional (default False) If set to True, the method returns a FrameContainer with the batch and an array containing the timestamps associated with the frames

Returns

nparray or FrameContainer A batch of shape (n, self.channels,self.frame_size) as defined in the reader/open call if self.plannar is True. A batch of shape (n, self.channels*self.frame_size) with interleaved data if self.plannar is False. if with_timestamps is True, the return object is a FrameContainer with the audio batch in FrameContainer.data and the associated timestamp in FrameContainer.timestamps as an array (one element for each audio frame).

def writeFrame(self, audio) -> bool: View Source

663    def write_frame(self, audio) -> bool:
664        """
665        Write an audio frame to the file
666
667        Parameters
668        ----------
669        audio: nparray
670            The audio frame to write to the video file of shape (self.channels,nb_samples_per_channel) if plannar is True else (self.channels*nb_samples_per_channel).
671
672        Returns
673        ----------
674        bool
675            Writing was successful or not.
676        """
677        # Check params
678        # - pipe exists
679        if self.pipe is None:
680            raise self.AudioIOException("No pipe opened to {}. Call create(...) before writing frames.".format(self.audioProgram))
681        # - pipe is in write mode
682        if self.mode != PipeMode.WRITE_MODE:
683            raise self.AudioIOException("Pipe to {} for '{}' not opened in write mode.".format(self.audioProgram, self.filename))
684        # - shape of image is fine, thus we have pixels for a full compatible frame
685        if audio.shape[0] != self.channels:
686            raise self.AudioIOException("Wong audio shape: {} expected ({},{}).".format(audio.shape,self.channels,self.frame_size))
687        # - type of data is Float32
688        if audio.dtype != np.float32:
689            raise self.AudioIOException("Wong audio type: {} expected np.float32.".format(audio.dtype))
690
691        # array must have a shape (channels, samples), reshape it it to (samples, channels) if plannar
692        if not self.plannar:
693            audio = audio.reshape(-1)
694
695        # print( audio.shape )
696
697        # garantee to have a C continuous array
698        if not audio.flags['C_CONTIGUOUS']:
699            a = np.ascontiguousarray(a) 
700
701        # write frame
702        buffer = audio.tobytes()
703        if self.pipe.stdin.write( buffer ) < len(buffer):
704            print( f"Error writing frame to {self.filename}" )
705            return False
706
707        # increase frame_counter
708        self.frame_counter.frame_count += (self.frame_size * self.channels)
709
710        # say to gc that this buffer is no longer needed 
711        del buffer
712
713        return True

Write an audio frame to the file

Parameters

audio: nparray The audio frame to write to the video file of shape (self.channels,nb_samples_per_channel) if plannar is True else (self.channels*nb_samples_per_channel).

Returns

bool Writing was successful or not.

def writeBatch(self, batch): View Source

715    def write_batch(self, batch):
716        """
717        Write a batch of audio frame to the file
718
719        Parameters
720        ----------
721        batch: nparray
722            The batch of audio frames to write to the video file of shape (n,self.channels,nb_samples_per_channel) if plannar is True else (n,self.channels*nb_samples_per_channel) of interleaved audio data.
723
724        Returns
725        ----------
726        bool
727            Writing was successful or not.
728        """
729        # Check params
730        # - pipe exists
731        if self.pipe is None:
732            raise self.AudioIOException("No pipe opened to {}. Call create(...) before writing frames.".format(self.audioProgram))
733        # - pipe is in write mode
734        if self.mode != PipeMode.WRITE_MODE:
735            raise self.AudioIOException("Pipe to {} for '{}' not opened in write mode.".format(self.audioProgram, self.filename))
736        # batch is 3D (n, channels, nb samples)
737        if batch.ndim !=3:
738            raise self.AudioIOException("Wrong batch shape: {} expected 3 dimensions (n, n_channels, n_samples_per_channel).".format(batch.shape))
739        # - shape of images in batch is fine
740        if batch.shape[2] != self.channels:
741            raise self.AudioIOException("Wrong audio channels in batch: {} expected {} {}.".format(batch.shape[2], self.channels, batch.shape))
742
743        # array must have a shape (n * n_channels * n_samples_per_channel) before writing them to pipe
744        # reshape it it to (n * n_channels * n_samples_per_channel) if plannar is False
745        if not self.plannar:
746            # goes from (n, n_channels, n_samples_per_channel) to (n * n_channels * n_samples_per_channel)
747            batch = batch.transpose(0, 2, 1) # first go to (n, n_samples_per_channel, n_channels)
748            batch = batch.reshape(-1) # then to 1D array (n * n_channels * n_samples_per_channel)
749
750        # garantee to have a C continuous array
751        if not batch.flags['C_CONTIGUOUS']:
752            batch = np.ascontiguousarray(batch)
753
754        # write frame
755        buffer = batch.tobytes()
756        if self.pipe.stdin.write( buffer ) < len(buffer):
757            # say to gc that this buffer is no longer needed
758            del buffer
759            raise self.AudioIOException("Error writing batch to '{}'.".format(self.filename))
760
761        # increase frame_counter
762        self.frame_counter.frame_count += int(batch.shape[0]/self.channels) # int conversion is mandatory to avoid confusion with time as float
763              
764        # say to gc that this buffer is no longer needed
765        del buffer
766
767        return True

Write a batch of audio frames to the file

Parameters

batch: nparray The batch of audio frames to write to the video file of shape (n,self.channels,nb_samples_per_channel) if plannar is True else (n,self.channels*nb_samples_per_channel) of interleaved audio data.

Returns

bool Writing was successful or not.

audioProgram = '/usr/local/lib/python3.12/site-packages/static_ffmpeg/bin/linux/ffmpeg'

paramProgram = '/usr/local/lib/python3.12/site-packages/static_ffmpeg/bin/linux/ffprobe'

simple_ffmpeg_batch_io.AudioIO

Authors

Parameters

Parameters

Returns

Parameters

Returns

Returns

Returns

Returns

Returns

Parameters

Returns

Parameters

Returns

Parameters

Returns

Parameters

Returns

Parameters

Returns

Parameters

Returns

Parameters

Returns

Parameters

Parameters

Returns

Parameters

Returns

Parameters

Returns

Parameters

Returns

Returns

Parameters

Returns

Parameters

Returns

Parameters

Returns

Parameters

Returns