summaryrefslogtreecommitdiff
path: root/scripts/py/rnnoise_dump_extractor.py
blob: 715b9229e2caa447f55a0ea05b8f0f2a9e21ea15 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
#  SPDX-FileCopyrightText: Copyright 2021 Arm Limited and/or its affiliates <open-source-office@arm.com>
#  SPDX-License-Identifier: Apache-2.0
#
#  Licensed under the Apache License, Version 2.0 (the "License");
#  you may not use this file except in compliance with the License.
#  You may obtain a copy of the License at
#
#      http://www.apache.org/licenses/LICENSE-2.0
#
#  Unless required by applicable law or agreed to in writing, software
#  distributed under the License is distributed on an "AS IS" BASIS,
#  WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
#  See the License for the specific language governing permissions and
#  limitations under the License.
"""
This script can be used with the noise reduction use case to save
the dumped noise reduced audio to a wav file.

Example use:
python rnnoise_dump_extractor.py --dump_file output.bin --output_dir ./denoised_wavs/
"""

import soundfile as sf
import numpy as np

import argparse
from os import path
import struct


def extract(fp, output_dir, export_npy):
    while True:
        filename_length = struct.unpack("i", fp.read(4))[0]

        if filename_length == -1:
            return

        filename = struct.unpack("{}s".format(filename_length), fp.read(filename_length))[0].decode('ascii')
        audio_clip_length = struct.unpack("I", fp.read(4))[0]
        output_file_name = path.join(output_dir, "denoised_{}".format(filename))
        audio_clip = fp.read(audio_clip_length)
        
        with sf.SoundFile(output_file_name, 'w', channels=1, samplerate=48000, subtype="PCM_16", endian="LITTLE") as wav_file:
            wav_file.buffer_write(audio_clip, dtype='int16')
            print("{} written to disk".format(output_file_name))

        if export_npy:
            output_file_name += ".npy"
            pack_format = "{}h".format(int(audio_clip_length/2))
            npdata = np.array(struct.unpack(pack_format, audio_clip)).astype(np.int16)
            np.save(output_file_name, npdata)
            print("{} written to disk".format(output_file_name))


def main(args):
    extract(args.dump_file, args.output_dir, args.export_npy)


parser = argparse.ArgumentParser()
parser.add_argument("--dump_file", type=argparse.FileType('rb'), help="Dump file with audio files to extract.", required=True)
parser.add_argument("--output_dir", help="Output directory, Warning: Duplicated file names will be overwritten.", required=True)
parser.add_argument("--export_npy", help="Export the audio buffer in NumPy format", action="store_true")
args = parser.parse_args()

if __name__ == "__main__":
    main(args)