diff options
author | alexander <alexander.efremov@arm.com> | 2021-03-26 21:42:19 +0000 |
---|---|---|
committer | Kshitij Sisodia <kshitij.sisodia@arm.com> | 2021-03-29 16:29:55 +0100 |
commit | 3c79893217bc632c9b0efa815091bef3c779490c (patch) | |
tree | ad06b444557eb8124652b45621d736fa1b92f65d /scripts/py/gen_audio.py | |
parent | 6ad6d55715928de72979b04194da1bdf04a4c51b (diff) | |
download | ml-embedded-evaluation-kit-3c79893217bc632c9b0efa815091bef3c779490c.tar.gz |
Opensource ML embedded evaluation kit21.03
Change-Id: I12e807f19f5cacad7cef82572b6dd48252fd61fd
Diffstat (limited to 'scripts/py/gen_audio.py')
-rw-r--r-- | scripts/py/gen_audio.py | 48 |
1 files changed, 48 insertions, 0 deletions
#!env/bin/python3

#  Copyright (c) 2021 Arm Limited. All rights reserved.
#  SPDX-License-Identifier: Apache-2.0
#
#  Licensed under the Apache License, Version 2.0 (the "License");
#  you may not use this file except in compliance with the License.
#  You may obtain a copy of the License at
#
#      http://www.apache.org/licenses/LICENSE-2.0
#
#  Unless required by applicable law or agreed to in writing, software
#  distributed under the License is distributed on an "AS IS" BASIS,
#  WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
#  See the License for the specific language governing permissions and
#  limitations under the License.
"""
Utility script to convert an audio clip into eval platform desired spec.
"""
import soundfile as sf

from argparse import ArgumentParser, ArgumentTypeError
from os import path

from gen_utils import AudioUtils

# Accepted spellings for the boolean command-line values (compared
# case-insensitively). The empty string is kept as "false" because, with the
# previous `type=bool`, it was the only value that evaluated to False.
_TRUE_STRINGS = frozenset(("true", "t", "yes", "y", "1"))
_FALSE_STRINGS = frozenset(("false", "f", "no", "n", "0", ""))


def _str_to_bool(value):
    """Convert a command-line string into a bool.

    `type=bool` must not be used with argparse: it calls `bool()` on the raw
    string, so any non-empty value (including "False" and "0") becomes True.

    Args:
        value: The raw option value (a bool is passed through unchanged).

    Returns:
        True or False according to the recognised spellings.

    Raises:
        ArgumentTypeError: If the value is not a recognised boolean spelling;
            argparse reports this as a usage error.
    """
    if isinstance(value, bool):
        return value

    normalised = value.strip().lower()
    if normalised in _TRUE_STRINGS:
        return True
    if normalised in _FALSE_STRINGS:
        return False
    raise ArgumentTypeError(f"expected a boolean value, got {value!r}")


parser = ArgumentParser()
parser.add_argument("--audio_path", help="Audio file path", required=True)
parser.add_argument("--output_dir", help="Output directory", required=True)
parser.add_argument("--sampling_rate", type=int, help="target sampling rate.", default=16000)
parser.add_argument("--mono", type=_str_to_bool, help="convert signal to mono.", default=True)
parser.add_argument("--offset", type=float, help="start reading after this time (in seconds).", default=0)
parser.add_argument("--duration", type=float, help="only load up to this much audio (in seconds).", default=0)
parser.add_argument("--res_type", type=AudioUtils.res_data_type, help=f"Resample type: {AudioUtils.res_type_list()}.",
                    default='kaiser_best')
parser.add_argument("--min_samples", type=int, help="Minimum sample number.", default=16000)
parser.add_argument("-v", "--verbosity", action="store_true")
# NOTE(review): arguments are parsed at import time, as in the original; this
# is kept so the module-level `args` name remains available unchanged.
args = parser.parse_args()


def main(args):
    """Load one audio clip with the requested settings and write it out.

    The clip is read through `AudioUtils.load_resample_audio_clip` using the
    sampling rate, mono flag, offset, duration, resample type and minimum
    sample count taken from `args`. The returned data is then written with
    `soundfile.write` into `args.output_dir`, reusing the base name of the
    input file.

    Args:
        args: Parsed command-line namespace produced by `parser`.
    """
    audio_data, samplerate = AudioUtils.load_resample_audio_clip(args.audio_path,
                                                                args.sampling_rate,
                                                                args.mono, args.offset,
                                                                args.duration, args.res_type,
                                                                args.min_samples)

    # The output keeps the input's file name, so the extension (and with it
    # the format soundfile infers) follows the source clip.
    output_path = path.join(args.output_dir, path.basename(args.audio_path))
    sf.write(output_path, audio_data, samplerate)


if __name__ == '__main__':
    main(args)