blob: 9e6ff1f9f706bb69715f00fc7679828c5e4ca189 [file] [log] [blame]
# SPDX-FileCopyrightText: Copyright 2021, 2023 Arm Limited and/or its affiliates <open-source-office@arm.com>
# SPDX-License-Identifier: Apache-2.0
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
"""
This script can be used with the noise reduction use case to save
the dumped noise reduced audio to a wav file.
Example use:
python rnnoise_dump_extractor.py --dump_file output.bin --output_dir ./denoised_wavs/
"""
import argparse
import struct
import typing
from os import path
import numpy as np
import soundfile as sf
def extract(
dump_file: typing.IO,
output_dir: str,
export_npy: bool
):
"""
Extract audio file from RNNoise output dump
@param dump_file: Audio dump file location
@param output_dir: Output direction
@param export_npy: Whether to export the audio as .npy
"""
while True:
filename_length = struct.unpack("i", dump_file.read(4))[0]
if filename_length == -1:
return
filename = struct \
.unpack(f"{filename_length}s", dump_file.read(filename_length))[0] \
.decode('ascii')
audio_clip_length = struct.unpack("I", dump_file.read(4))[0]
output_file_name = path.join(output_dir, f"denoised_{filename}")
audio_clip = dump_file.read(audio_clip_length)
with sf.SoundFile(output_file_name, 'w', channels=1, samplerate=48000, subtype="PCM_16",
endian="LITTLE") as wav_file:
wav_file.buffer_write(audio_clip, dtype='int16')
print(f"{output_file_name} written to disk")
if export_npy:
output_file_name += ".npy"
pack_format = f"{int(audio_clip_length / 2)}h"
npdata = np.array(struct.unpack(pack_format, audio_clip)).astype(np.int16)
np.save(output_file_name, npdata)
print(f"{output_file_name} written to disk")
def main(args):
"""
Run RNNoise audio dump extraction
@param args: Parsed args
"""
extract(args.dump_file, args.output_dir, args.export_npy)
parser = argparse.ArgumentParser()
parser.add_argument(
"--dump_file",
type=argparse.FileType('rb'),
help="Dump file with audio files to extract.",
required=True
)
parser.add_argument(
"--output_dir",
help="Output directory, Warning: Duplicated file names will be overwritten.",
required=True
)
parser.add_argument(
"--export_npy",
help="Export the audio buffer in NumPy format",
action="store_true"
)
parsed_args = parser.parse_args()
if __name__ == "__main__":
main(parsed_args)