# scripts/py/rnnoise_dump_extractor.py

#  SPDX-FileCopyrightText:  Copyright 2021, 2023 Arm Limited and/or its affiliates <open-source-office@arm.com>
#  SPDX-License-Identifier: Apache-2.0
#
#  Licensed under the Apache License, Version 2.0 (the "License");
#  you may not use this file except in compliance with the License.
#  You may obtain a copy of the License at
#
#      http://www.apache.org/licenses/LICENSE-2.0
#
#  Unless required by applicable law or agreed to in writing, software
#  distributed under the License is distributed on an "AS IS" BASIS,
#  WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
#  See the License for the specific language governing permissions and
#  limitations under the License.
"""
This script can be used with the noise reduction use case to save
the dumped noise reduced audio to a wav file.

Example use:
python rnnoise_dump_extractor.py --dump_file output.bin --output_dir ./denoised_wavs/
"""

import argparse
import struct
import typing
from os import path

import numpy as np
import soundfile as sf


def extract(
        dump_file: typing.IO,
        output_dir: str,
        export_npy: bool
):
    """
    Extract audio files from an RNNoise output dump.

    The dump is read as a sequence of records, each laid out as:
      - 4-byte signed int: length of the file name (-1 marks the end of the dump)
      - the file name itself (ASCII)
      - 4-byte unsigned int: length of the audio clip in bytes
      - the audio clip, written out as mono 16-bit PCM at 48 kHz

    Integers are decoded with the native byte order of the host running
    this script.

    @param dump_file:   Binary file object, opened for reading, holding the dump
    @param output_dir:  Output directory
    @param export_npy:  Whether to also export the audio as .npy
    """
    while True:
        header = dump_file.read(4)

        # A dump that ends on a record boundary without the -1 terminator
        # (e.g. an interrupted capture) is treated as complete, rather than
        # failing with struct.error after every clip has already been written.
        if not header:
            return

        filename_length = struct.unpack("i", header)[0]

        if filename_length == -1:
            return

        filename = struct \
            .unpack(f"{filename_length}s", dump_file.read(filename_length))[0] \
            .decode('ascii')

        audio_clip_length = struct.unpack("I", dump_file.read(4))[0]
        output_file_name = path.join(output_dir, f"denoised_{filename}")
        audio_clip = dump_file.read(audio_clip_length)

        with sf.SoundFile(output_file_name, 'w', channels=1, samplerate=48000, subtype="PCM_16",
                          endian="LITTLE") as wav_file:
            wav_file.buffer_write(audio_clip, dtype='int16')
            print(f"{output_file_name} written to disk")

        if export_npy:
            output_file_name += ".npy"
            # Reinterpret the raw bytes as native int16 samples directly;
            # avoids building an intermediate tuple of Python ints.
            npdata = np.frombuffer(audio_clip, dtype=np.int16)
            np.save(output_file_name, npdata)
            print(f"{output_file_name} written to disk")


def main(args):
    """
    Extract the audio clips described by the parsed command line arguments.

    @param args:    Parsed args; its dump_file, output_dir and export_npy
                    attributes are forwarded to extract()
    """
    extract(
        dump_file=args.dump_file,
        output_dir=args.output_dir,
        export_npy=args.export_npy,
    )


# Command line interface definition. Building the parser has no side effects,
# so it stays at module level where other code can reuse it.
parser = argparse.ArgumentParser()

parser.add_argument(
    "--dump_file",
    type=argparse.FileType('rb'),
    help="Dump file with audio files to extract.",
    required=True
)

parser.add_argument(
    "--output_dir",
    help="Output directory, Warning: Duplicated file names will be overwritten.",
    required=True
)

parser.add_argument(
    "--export_npy",
    help="Export the audio buffer in NumPy format",
    action="store_true"
)

if __name__ == "__main__":
    # Parse only when run as a script: parsing at import time would consume
    # the importing program's sys.argv and exit on the missing required args.
    parsed_args = parser.parse_args()
    main(parsed_args)