blob: fb446f9a90ed7cad67ba53e59261199afb2b9d7c [file] [log] [blame]
/* Copyright (c) 2023 Amazon
Written by Jan Buethe */
/*
Redistribution and use in source and binary forms, with or without
modification, are permitted provided that the following conditions
are met:
- Redistributions of source code must retain the above copyright
notice, this list of conditions and the following disclaimer.
- Redistributions in binary form must reproduce the above copyright
notice, this list of conditions and the following disclaimer in the
documentation and/or other materials provided with the distribution.
THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER
OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL,
EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO,
PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR
PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF
LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING
NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
*/
#ifdef HAVE_CONFIG_H
#include "config.h"
#endif
#include <math.h>
#include "osce.h"
#include "osce_features.h"
#include "os_support.h"
#include "nndsp.h"
#include "float_cast.h"
#include "arch.h"
#ifdef OSCE_DEBUG
#include <stdio.h>
/*#define WRITE_FEATURES*/
/*#define DEBUG_LACE*/
/*#define DEBUG_NOLACE*/
#define FINIT(fid, name, mode) do{if (fid == NULL) {fid = fopen(name, mode);}} while(0)
#endif
#ifdef ENABLE_OSCE_TRAINING_DATA
#include <stdio.h>
#endif
#define CLIP(a, min, max) (((a) < (min) ? (min) : (a)) > (max) ? (max) : (a))
extern const WeightArray lacelayers_arrays[];
extern const WeightArray nolacelayers_arrays[];
/* LACE */
#ifndef DISABLE_LACE
static void compute_lace_numbits_embedding(float *emb, float numbits, int dim, float min_val, float max_val, int logscale)
{
float x;
(void) dim;
numbits = logscale ? log(numbits) : numbits;
x = CLIP(numbits, min_val, max_val) - (max_val + min_val) / 2;
emb[0] = sin(x * LACE_NUMBITS_SCALE_0 - 0.5f);
emb[1] = sin(x * LACE_NUMBITS_SCALE_1 - 0.5f);
emb[2] = sin(x * LACE_NUMBITS_SCALE_2 - 0.5f);
emb[3] = sin(x * LACE_NUMBITS_SCALE_3 - 0.5f);
emb[4] = sin(x * LACE_NUMBITS_SCALE_4 - 0.5f);
emb[5] = sin(x * LACE_NUMBITS_SCALE_5 - 0.5f);
emb[6] = sin(x * LACE_NUMBITS_SCALE_6 - 0.5f);
emb[7] = sin(x * LACE_NUMBITS_SCALE_7 - 0.5f);
}
static int init_lace(LACE *hLACE, const WeightArray *weights)
{
int ret = 0;
OPUS_CLEAR(hLACE, 1);
celt_assert(weights != NULL);
ret = init_lacelayers(&hLACE->layers, weights);
compute_overlap_window(hLACE->window, LACE_OVERLAP_SIZE);
return ret;
}
static void reset_lace_state(LACEState *state)
{
OPUS_CLEAR(state, 1);
init_adacomb_state(&state->cf1_state);
init_adacomb_state(&state->cf2_state);
init_adaconv_state(&state->af1_state);
}
static void lace_feature_net(
LACE *hLACE,
LACEState *state,
float *output,
const float *features,
const float *numbits,
const int *periods,
int arch
)
{
float input_buffer[4 * IMAX(LACE_COND_DIM, LACE_HIDDEN_FEATURE_DIM)];
float output_buffer[4 * IMAX(LACE_COND_DIM, LACE_HIDDEN_FEATURE_DIM)];
float numbits_embedded[2 * LACE_NUMBITS_EMBEDDING_DIM];
int i_subframe;
compute_lace_numbits_embedding(numbits_embedded, numbits[0], LACE_NUMBITS_EMBEDDING_DIM,
log(LACE_NUMBITS_RANGE_LOW), log(LACE_NUMBITS_RANGE_HIGH), 1);
compute_lace_numbits_embedding(numbits_embedded + LACE_NUMBITS_EMBEDDING_DIM, numbits[1], LACE_NUMBITS_EMBEDDING_DIM,
log(LACE_NUMBITS_RANGE_LOW), log(LACE_NUMBITS_RANGE_HIGH), 1);
/* scaling and dimensionality reduction */
for (i_subframe = 0; i_subframe < 4; i_subframe ++)
{
OPUS_COPY(input_buffer, features + i_subframe * LACE_NUM_FEATURES, LACE_NUM_FEATURES);
OPUS_COPY(input_buffer + LACE_NUM_FEATURES, hLACE->layers.lace_pitch_embedding.float_weights + periods[i_subframe] * LACE_PITCH_EMBEDDING_DIM, LACE_PITCH_EMBEDDING_DIM);
OPUS_COPY(input_buffer + LACE_NUM_FEATURES + LACE_PITCH_EMBEDDING_DIM, numbits_embedded, 2 * LACE_NUMBITS_EMBEDDING_DIM);
compute_generic_conv1d(
&hLACE->layers.lace_fnet_conv1,
output_buffer + i_subframe * LACE_HIDDEN_FEATURE_DIM,
NULL,
input_buffer,
LACE_NUM_FEATURES + LACE_PITCH_EMBEDDING_DIM + 2 * LACE_NUMBITS_EMBEDDING_DIM,
ACTIVATION_TANH,
arch);
}
/* subframe accumulation */
OPUS_COPY(input_buffer, output_buffer, 4 * LACE_HIDDEN_FEATURE_DIM);
compute_generic_conv1d(
&hLACE->layers.lace_fnet_conv2,
output_buffer,
state->feature_net_conv2_state,
input_buffer,
4 * LACE_HIDDEN_FEATURE_DIM,
ACTIVATION_TANH,
arch
);
/* tconv upsampling */
OPUS_COPY(input_buffer, output_buffer, 4 * LACE_COND_DIM);
compute_generic_dense(
&hLACE->layers.lace_fnet_tconv,
output_buffer,
input_buffer,
ACTIVATION_TANH,
arch
);
/* GRU */
OPUS_COPY(input_buffer, output_buffer, 4 * LACE_COND_DIM);
for (i_subframe = 0; i_subframe < 4; i_subframe++)
{
compute_generic_gru(
&hLACE->layers.lace_fnet_gru_input,
&hLACE->layers.lace_fnet_gru_recurrent,
state->feature_net_gru_state,
input_buffer + i_subframe * LACE_COND_DIM,
arch
);
OPUS_COPY(output + i_subframe * LACE_COND_DIM, state->feature_net_gru_state, LACE_COND_DIM);
}
}
static void lace_process_20ms_frame(
LACE* hLACE,
LACEState *state,
float *x_out,
const float *x_in,
const float *features,
const float *numbits,
const int *periods,
int arch
)
{
float feature_buffer[4 * LACE_COND_DIM];
float output_buffer[4 * LACE_FRAME_SIZE];
int i_subframe, i_sample;
#ifdef DEBUG_LACE
static FILE *f_features=NULL, *f_encfeatures=NULL, *f_xin=NULL, *f_xpreemph=NULL, *f_postcf1=NULL;
static FILE *f_postcf2=NULL, *f_postaf1=NULL, *f_xdeemph, *f_numbits, *f_periods;
FINIT(f_features, "debug/c_features.f32", "wb");
FINIT(f_encfeatures, "debug/c_encoded_features.f32", "wb");
FINIT(f_xin, "debug/c_x_in.f32", "wb");
FINIT(f_xpreemph, "debug/c_xpreemph.f32", "wb");
FINIT(f_xdeemph, "debug/c_xdeemph.f32", "wb");
FINIT(f_postcf1, "debug/c_post_cf1.f32", "wb");
FINIT(f_postcf2, "debug/c_post_cf2.f32", "wb");
FINIT(f_postaf1, "debug/c_post_af1.f32", "wb");
FINIT(f_numbits, "debug/c_numbits.f32", "wb");
FINIT(f_periods, "debug/c_periods.s32", "wb");
fwrite(x_in, sizeof(*x_in), 4 * LACE_FRAME_SIZE, f_xin);
fwrite(numbits, sizeof(*numbits), 2, f_numbits);
fwrite(periods, sizeof(*periods), 4, f_periods);
#endif
/* pre-emphasis */
for (i_sample = 0; i_sample < 4 * LACE_FRAME_SIZE; i_sample ++)
{
output_buffer[i_sample] = x_in[i_sample] - LACE_PREEMPH * state->preemph_mem;
state->preemph_mem = x_in[i_sample];
}
/* run feature encoder */
lace_feature_net(hLACE, state, feature_buffer, features, numbits, periods, arch);
#ifdef DEBUG_LACE
fwrite(features, sizeof(*features), 4 * LACE_NUM_FEATURES, f_features);
fwrite(feature_buffer, sizeof(*feature_buffer), 4 * LACE_COND_DIM, f_encfeatures);
fwrite(output_buffer, sizeof(float), 4 * LACE_FRAME_SIZE, f_xpreemph);
#endif
/* 1st comb filtering stage */
for (i_subframe = 0; i_subframe < 4; i_subframe++)
{
adacomb_process_frame(
&state->cf1_state,
output_buffer + i_subframe * LACE_FRAME_SIZE,
output_buffer + i_subframe * LACE_FRAME_SIZE,
feature_buffer + i_subframe * LACE_COND_DIM,
&hLACE->layers.lace_cf1_kernel,
&hLACE->layers.lace_cf1_gain,
&hLACE->layers.lace_cf1_global_gain,
periods[i_subframe],
LACE_COND_DIM,
LACE_FRAME_SIZE,
LACE_OVERLAP_SIZE,
LACE_CF1_KERNEL_SIZE,
LACE_CF1_LEFT_PADDING,
LACE_CF1_FILTER_GAIN_A,
LACE_CF1_FILTER_GAIN_B,
LACE_CF1_LOG_GAIN_LIMIT,
hLACE->window,
arch);
}
#ifdef DEBUG_LACE
fwrite(output_buffer, sizeof(float), 4 * LACE_FRAME_SIZE, f_postcf1);
#endif
/* 2nd comb filtering stage */
for (i_subframe = 0; i_subframe < 4; i_subframe++)
{
adacomb_process_frame(
&state->cf2_state,
output_buffer + i_subframe * LACE_FRAME_SIZE,
output_buffer + i_subframe * LACE_FRAME_SIZE,
feature_buffer + i_subframe * LACE_COND_DIM,
&hLACE->layers.lace_cf2_kernel,
&hLACE->layers.lace_cf2_gain,
&hLACE->layers.lace_cf2_global_gain,
periods[i_subframe],
LACE_COND_DIM,
LACE_FRAME_SIZE,
LACE_OVERLAP_SIZE,
LACE_CF2_KERNEL_SIZE,
LACE_CF2_LEFT_PADDING,
LACE_CF2_FILTER_GAIN_A,
LACE_CF2_FILTER_GAIN_B,
LACE_CF2_LOG_GAIN_LIMIT,
hLACE->window,
arch);
}
#ifdef DEBUG_LACE
fwrite(output_buffer, sizeof(float), 4 * LACE_FRAME_SIZE, f_postcf2);
#endif
/* final adaptive filtering stage */
for (i_subframe = 0; i_subframe < 4; i_subframe++)
{
adaconv_process_frame(
&state->af1_state,
output_buffer + i_subframe * LACE_FRAME_SIZE,
output_buffer + i_subframe * LACE_FRAME_SIZE,
feature_buffer + i_subframe * LACE_COND_DIM,
&hLACE->layers.lace_af1_kernel,
&hLACE->layers.lace_af1_gain,
LACE_COND_DIM,
LACE_FRAME_SIZE,
LACE_OVERLAP_SIZE,
LACE_AF1_IN_CHANNELS,
LACE_AF1_OUT_CHANNELS,
LACE_AF1_KERNEL_SIZE,
LACE_AF1_LEFT_PADDING,
LACE_AF1_FILTER_GAIN_A,
LACE_AF1_FILTER_GAIN_B,
LACE_AF1_SHAPE_GAIN,
hLACE->window,
arch);
}
#ifdef DEBUG_LACE
fwrite(output_buffer, sizeof(float), 4 * LACE_FRAME_SIZE, f_postaf1);
#endif
/* de-emphasis */
for (i_sample = 0; i_sample < 4 * LACE_FRAME_SIZE; i_sample ++)
{
x_out[i_sample] = output_buffer[i_sample] + LACE_PREEMPH * state->deemph_mem;
state->deemph_mem = x_out[i_sample];
}
#ifdef DEBUG_LACE
fwrite(x_out, sizeof(float), 4 * LACE_FRAME_SIZE, f_xdeemph);
#endif
}
#endif /* #ifndef DISABLE_LACE */
/* NoLACE */
#ifndef DISABLE_NOLACE
static void compute_nolace_numbits_embedding(float *emb, float numbits, int dim, float min_val, float max_val, int logscale)
{
float x;
(void) dim;
numbits = logscale ? log(numbits) : numbits;
x = CLIP(numbits, min_val, max_val) - (max_val + min_val) / 2;
emb[0] = sin(x * NOLACE_NUMBITS_SCALE_0 - 0.5f);
emb[1] = sin(x * NOLACE_NUMBITS_SCALE_1 - 0.5f);
emb[2] = sin(x * NOLACE_NUMBITS_SCALE_2 - 0.5f);
emb[3] = sin(x * NOLACE_NUMBITS_SCALE_3 - 0.5f);
emb[4] = sin(x * NOLACE_NUMBITS_SCALE_4 - 0.5f);
emb[5] = sin(x * NOLACE_NUMBITS_SCALE_5 - 0.5f);
emb[6] = sin(x * NOLACE_NUMBITS_SCALE_6 - 0.5f);
emb[7] = sin(x * NOLACE_NUMBITS_SCALE_7 - 0.5f);
}
static int init_nolace(NoLACE *hNoLACE, const WeightArray *weights)
{
int ret = 0;
OPUS_CLEAR(hNoLACE, 1);
celt_assert(weights != NULL);
ret = init_nolacelayers(&hNoLACE->layers, weights);
compute_overlap_window(hNoLACE->window, NOLACE_OVERLAP_SIZE);
return ret;
}
static void reset_nolace_state(NoLACEState *state)
{
OPUS_CLEAR(state, 1);
init_adacomb_state(&state->cf1_state);
init_adacomb_state(&state->cf2_state);
init_adaconv_state(&state->af1_state);
init_adaconv_state(&state->af2_state);
init_adaconv_state(&state->af3_state);
init_adaconv_state(&state->af4_state);
init_adashape_state(&state->tdshape1_state);
init_adashape_state(&state->tdshape2_state);
init_adashape_state(&state->tdshape3_state);
}
static void nolace_feature_net(
NoLACE *hNoLACE,
NoLACEState *state,
float *output,
const float *features,
const float *numbits,
const int *periods,
int arch
)
{
float input_buffer[4 * IMAX(NOLACE_COND_DIM, NOLACE_HIDDEN_FEATURE_DIM)];
float output_buffer[4 * IMAX(NOLACE_COND_DIM, NOLACE_HIDDEN_FEATURE_DIM)];
float numbits_embedded[2 * NOLACE_NUMBITS_EMBEDDING_DIM];
int i_subframe;
compute_nolace_numbits_embedding(numbits_embedded, numbits[0], NOLACE_NUMBITS_EMBEDDING_DIM,
log(NOLACE_NUMBITS_RANGE_LOW), log(NOLACE_NUMBITS_RANGE_HIGH), 1);
compute_nolace_numbits_embedding(numbits_embedded + NOLACE_NUMBITS_EMBEDDING_DIM, numbits[1], NOLACE_NUMBITS_EMBEDDING_DIM,
log(NOLACE_NUMBITS_RANGE_LOW), log(NOLACE_NUMBITS_RANGE_HIGH), 1);
/* scaling and dimensionality reduction */
for (i_subframe = 0; i_subframe < 4; i_subframe ++)
{
OPUS_COPY(input_buffer, features + i_subframe * NOLACE_NUM_FEATURES, NOLACE_NUM_FEATURES);
OPUS_COPY(input_buffer + NOLACE_NUM_FEATURES, hNoLACE->layers.nolace_pitch_embedding.float_weights + periods[i_subframe] * NOLACE_PITCH_EMBEDDING_DIM, NOLACE_PITCH_EMBEDDING_DIM);
OPUS_COPY(input_buffer + NOLACE_NUM_FEATURES + NOLACE_PITCH_EMBEDDING_DIM, numbits_embedded, 2 * NOLACE_NUMBITS_EMBEDDING_DIM);
compute_generic_conv1d(
&hNoLACE->layers.nolace_fnet_conv1,
output_buffer + i_subframe * NOLACE_HIDDEN_FEATURE_DIM,
NULL,
input_buffer,
NOLACE_NUM_FEATURES + NOLACE_PITCH_EMBEDDING_DIM + 2 * NOLACE_NUMBITS_EMBEDDING_DIM,
ACTIVATION_TANH,
arch);
}
/* subframe accumulation */
OPUS_COPY(input_buffer, output_buffer, 4 * NOLACE_HIDDEN_FEATURE_DIM);
compute_generic_conv1d(
&hNoLACE->layers.nolace_fnet_conv2,
output_buffer,
state->feature_net_conv2_state,
input_buffer,
4 * NOLACE_HIDDEN_FEATURE_DIM,
ACTIVATION_TANH,
arch
);
/* tconv upsampling */
OPUS_COPY(input_buffer, output_buffer, 4 * NOLACE_COND_DIM);
compute_generic_dense(
&hNoLACE->layers.nolace_fnet_tconv,
output_buffer,
input_buffer,
ACTIVATION_TANH,
arch
);
/* GRU */
OPUS_COPY(input_buffer, output_buffer, 4 * NOLACE_COND_DIM);
for (i_subframe = 0; i_subframe < 4; i_subframe++)
{
compute_generic_gru(
&hNoLACE->layers.nolace_fnet_gru_input,
&hNoLACE->layers.nolace_fnet_gru_recurrent,
state->feature_net_gru_state,
input_buffer + i_subframe * NOLACE_COND_DIM,
arch
);
OPUS_COPY(output + i_subframe * NOLACE_COND_DIM, state->feature_net_gru_state, NOLACE_COND_DIM);
}
}
static void nolace_process_20ms_frame(
NoLACE* hNoLACE,
NoLACEState *state,
float *x_out,
const float *x_in,
const float *features,
const float *numbits,
const int *periods,
int arch
)
{
float feature_buffer[4 * NOLACE_COND_DIM];
float feature_transform_buffer[4 * NOLACE_COND_DIM];
float x_buffer1[8 * NOLACE_FRAME_SIZE];
float x_buffer2[8 * NOLACE_FRAME_SIZE];
int i_subframe, i_sample;
NOLACELayers *layers = &hNoLACE->layers;
#ifdef DEBUG_NOLACE
static FILE *f_features=NULL, *f_encfeatures=NULL, *f_xin=NULL, *f_xpreemph=NULL, *f_postcf1=NULL;
static FILE *f_postcf2=NULL, *f_postaf1=NULL, *f_xdeemph, *f_numbits, *f_periods;
static FILE *f_ffpostcf1, *f_fpostcf2, *f_fpostaf1;
FINIT(f_features, "debug/c_features.f32", "wb");
FINIT(f_encfeatures, "debug/c_encoded_features.f32", "wb");
FINIT(f_xin, "debug/c_x_in.f32", "wb");
FINIT(f_xpreemph, "debug/c_xpreemph.f32", "wb");
FINIT(f_xdeemph, "debug/c_xdeemph.f32", "wb");
FINIT(f_postcf1, "debug/c_post_cf1.f32", "wb");
FINIT(f_postcf2, "debug/c_post_cf2.f32", "wb");
FINIT(f_postaf1, "debug/c_post_af1.f32", "wb");
FINIT(f_numbits, "debug/c_numbits.f32", "wb");
FINIT(f_periods, "debug/c_periods.s32", "wb");
fwrite(x_in, sizeof(*x_in), 4 * NOLACE_FRAME_SIZE, f_xin);
fwrite(numbits, sizeof(*numbits), 2, f_numbits);
fwrite(periods, sizeof(*periods), 4, f_periods);
#endif
/* pre-emphasis */
for (i_sample = 0; i_sample < 4 * NOLACE_FRAME_SIZE; i_sample ++)
{
x_buffer1[i_sample] = x_in[i_sample] - NOLACE_PREEMPH * state->preemph_mem;
state->preemph_mem = x_in[i_sample];
}
/* run feature encoder */
nolace_feature_net(hNoLACE, state, feature_buffer, features, numbits, periods, arch);
#ifdef DEBUG_NOLACE
fwrite(features, sizeof(*features), 4 * NOLACE_NUM_FEATURES, f_features);
fwrite(feature_buffer, sizeof(*feature_buffer), 4 * NOLACE_COND_DIM, f_encfeatures);
fwrite(output_buffer, sizeof(float), 4 * NOLACE_FRAME_SIZE, f_xpreemph);
#endif
/* 1st comb filtering stage */
for (i_subframe = 0; i_subframe < 4; i_subframe++)
{
/* modifies signal in place */
adacomb_process_frame(
&state->cf1_state,
x_buffer1 + i_subframe * NOLACE_FRAME_SIZE,
x_buffer1 + i_subframe * NOLACE_FRAME_SIZE,
feature_buffer + i_subframe * NOLACE_COND_DIM,
&hNoLACE->layers.nolace_cf1_kernel,
&hNoLACE->layers.nolace_cf1_gain,
&hNoLACE->layers.nolace_cf1_global_gain,
periods[i_subframe],
NOLACE_COND_DIM,
NOLACE_FRAME_SIZE,
NOLACE_OVERLAP_SIZE,
NOLACE_CF1_KERNEL_SIZE,
NOLACE_CF1_LEFT_PADDING,
NOLACE_CF1_FILTER_GAIN_A,
NOLACE_CF1_FILTER_GAIN_B,
NOLACE_CF1_LOG_GAIN_LIMIT,
hNoLACE->window,
arch);
compute_generic_conv1d(
&layers->nolace_post_cf1,
feature_transform_buffer + i_subframe * NOLACE_COND_DIM,
state->post_cf1_state,
feature_buffer + i_subframe * NOLACE_COND_DIM,
NOLACE_COND_DIM,
ACTIVATION_TANH,
arch);
}
/* update feature buffer */
OPUS_COPY(feature_buffer, feature_transform_buffer, 4 * NOLACE_COND_DIM);
#ifdef DEBUG_NOLACE
fwrite(x_buffer1, sizeof(float), 4 * NOLACE_FRAME_SIZE, f_postcf1);
#endif
/* 2nd comb filtering stage */
for (i_subframe = 0; i_subframe < 4; i_subframe++)
{
/* modifies signal in place */
adacomb_process_frame(
&state->cf2_state,
x_buffer1 + i_subframe * NOLACE_FRAME_SIZE,
x_buffer1 + i_subframe * NOLACE_FRAME_SIZE,
feature_buffer + i_subframe * NOLACE_COND_DIM,
&hNoLACE->layers.nolace_cf2_kernel,
&hNoLACE->layers.nolace_cf2_gain,
&hNoLACE->layers.nolace_cf2_global_gain,
periods[i_subframe],
NOLACE_COND_DIM,
NOLACE_FRAME_SIZE,
NOLACE_OVERLAP_SIZE,
NOLACE_CF2_KERNEL_SIZE,
NOLACE_CF2_LEFT_PADDING,
NOLACE_CF2_FILTER_GAIN_A,
NOLACE_CF2_FILTER_GAIN_B,
NOLACE_CF2_LOG_GAIN_LIMIT,
hNoLACE->window,
arch);
compute_generic_conv1d(
&layers->nolace_post_cf2,
feature_transform_buffer + i_subframe * NOLACE_COND_DIM,
state->post_cf2_state,
feature_buffer + i_subframe * NOLACE_COND_DIM,
NOLACE_COND_DIM,
ACTIVATION_TANH,
arch);
}
/* update feature buffer */
OPUS_COPY(feature_buffer, feature_transform_buffer, 4 * NOLACE_COND_DIM);
#ifdef DEBUG_NOLACE
fwrite(x_buffer1, sizeof(float), 4 * NOLACE_FRAME_SIZE, f_postcf2);
#endif
/* final adaptive filtering stage */
for (i_subframe = 0; i_subframe < 4; i_subframe++)
{
adaconv_process_frame(
&state->af1_state,
x_buffer2 + i_subframe * NOLACE_FRAME_SIZE * NOLACE_AF1_OUT_CHANNELS,
x_buffer1 + i_subframe * NOLACE_FRAME_SIZE,
feature_buffer + i_subframe * NOLACE_COND_DIM,
&hNoLACE->layers.nolace_af1_kernel,
&hNoLACE->layers.nolace_af1_gain,
NOLACE_COND_DIM,
NOLACE_FRAME_SIZE,
NOLACE_OVERLAP_SIZE,
NOLACE_AF1_IN_CHANNELS,
NOLACE_AF1_OUT_CHANNELS,
NOLACE_AF1_KERNEL_SIZE,
NOLACE_AF1_LEFT_PADDING,
NOLACE_AF1_FILTER_GAIN_A,
NOLACE_AF1_FILTER_GAIN_B,
NOLACE_AF1_SHAPE_GAIN,
hNoLACE->window,
arch);
compute_generic_conv1d(
&layers->nolace_post_af1,
feature_transform_buffer + i_subframe * NOLACE_COND_DIM,
state->post_af1_state,
feature_buffer + i_subframe * NOLACE_COND_DIM,
NOLACE_COND_DIM,
ACTIVATION_TANH,
arch);
}
/* update feature buffer */
OPUS_COPY(feature_buffer, feature_transform_buffer, 4 * NOLACE_COND_DIM);
#ifdef DEBUG_NOLACE
fwrite(x_buffer2, sizeof(float), 4 * NOLACE_FRAME_SIZE * NOLACE_AF1_OUT_CHANNELS, f_postaf1);
#endif
/* first shape-mix round */
for (i_subframe = 0; i_subframe < 4; i_subframe++)
{
celt_assert(NOLACE_AF1_OUT_CHANNELS == 2);
/* modifies second channel in place */
adashape_process_frame(
&state->tdshape1_state,
x_buffer2 + i_subframe * NOLACE_AF1_OUT_CHANNELS * NOLACE_FRAME_SIZE + NOLACE_FRAME_SIZE,
x_buffer2 + i_subframe * NOLACE_AF1_OUT_CHANNELS * NOLACE_FRAME_SIZE + NOLACE_FRAME_SIZE,
feature_buffer + i_subframe * NOLACE_COND_DIM,
&layers->nolace_tdshape1_alpha1_f,
&layers->nolace_tdshape1_alpha1_t,
&layers->nolace_tdshape1_alpha2,
NOLACE_TDSHAPE1_FEATURE_DIM,
NOLACE_TDSHAPE1_FRAME_SIZE,
NOLACE_TDSHAPE1_AVG_POOL_K,
arch
);
adaconv_process_frame(
&state->af2_state,
x_buffer1 + i_subframe * NOLACE_FRAME_SIZE * NOLACE_AF2_OUT_CHANNELS,
x_buffer2 + i_subframe * NOLACE_FRAME_SIZE * NOLACE_AF2_IN_CHANNELS,
feature_buffer + i_subframe * NOLACE_COND_DIM,
&hNoLACE->layers.nolace_af2_kernel,
&hNoLACE->layers.nolace_af2_gain,
NOLACE_COND_DIM,
NOLACE_FRAME_SIZE,
NOLACE_OVERLAP_SIZE,
NOLACE_AF2_IN_CHANNELS,
NOLACE_AF2_OUT_CHANNELS,
NOLACE_AF2_KERNEL_SIZE,
NOLACE_AF2_LEFT_PADDING,
NOLACE_AF2_FILTER_GAIN_A,
NOLACE_AF2_FILTER_GAIN_B,
NOLACE_AF2_SHAPE_GAIN,
hNoLACE->window,
arch);
compute_generic_conv1d(
&layers->nolace_post_af2,
feature_transform_buffer + i_subframe * NOLACE_COND_DIM,
state->post_af2_state,
feature_buffer + i_subframe * NOLACE_COND_DIM,
NOLACE_COND_DIM,
ACTIVATION_TANH,
arch);
}
/* update feature buffer */
OPUS_COPY(feature_buffer, feature_transform_buffer, 4 * NOLACE_COND_DIM);
#ifdef DEBUG_NOLACE
fwrite(x_buffer1, sizeof(float), 4 * NOLACE_FRAME_SIZE * NOLACE_AF2_OUT_CHANNELS, f_postaf2);
#endif
/* second shape-mix round */
for (i_subframe = 0; i_subframe < 4; i_subframe++)
{
celt_assert(NOLACE_AF2_OUT_CHANNELS == 2);
/* modifies second channel in place */
adashape_process_frame(
&state->tdshape2_state,
x_buffer1 + i_subframe * NOLACE_AF2_OUT_CHANNELS * NOLACE_FRAME_SIZE + NOLACE_FRAME_SIZE,
x_buffer1 + i_subframe * NOLACE_AF2_OUT_CHANNELS * NOLACE_FRAME_SIZE + NOLACE_FRAME_SIZE,
feature_buffer + i_subframe * NOLACE_COND_DIM,
&layers->nolace_tdshape2_alpha1_f,
&layers->nolace_tdshape2_alpha1_t,
&layers->nolace_tdshape2_alpha2,
NOLACE_TDSHAPE2_FEATURE_DIM,
NOLACE_TDSHAPE2_FRAME_SIZE,
NOLACE_TDSHAPE2_AVG_POOL_K,
arch
);
adaconv_process_frame(
&state->af3_state,
x_buffer2 + i_subframe * NOLACE_FRAME_SIZE * NOLACE_AF3_OUT_CHANNELS,
x_buffer1 + i_subframe * NOLACE_FRAME_SIZE * NOLACE_AF3_IN_CHANNELS,
feature_buffer + i_subframe * NOLACE_COND_DIM,
&hNoLACE->layers.nolace_af3_kernel,
&hNoLACE->layers.nolace_af3_gain,
NOLACE_COND_DIM,
NOLACE_FRAME_SIZE,
NOLACE_OVERLAP_SIZE,
NOLACE_AF3_IN_CHANNELS,
NOLACE_AF3_OUT_CHANNELS,
NOLACE_AF3_KERNEL_SIZE,
NOLACE_AF3_LEFT_PADDING,
NOLACE_AF3_FILTER_GAIN_A,
NOLACE_AF3_FILTER_GAIN_B,
NOLACE_AF3_SHAPE_GAIN,
hNoLACE->window,
arch);
compute_generic_conv1d(
&layers->nolace_post_af3,
feature_transform_buffer + i_subframe * NOLACE_COND_DIM,
state->post_af3_state,
feature_buffer + i_subframe * NOLACE_COND_DIM,
NOLACE_COND_DIM,
ACTIVATION_TANH,
arch);
}
/* update feature buffer */
OPUS_COPY(feature_buffer, feature_transform_buffer, 4 * NOLACE_COND_DIM);
/* third shape-mix round */
for (i_subframe = 0; i_subframe < 4; i_subframe++)
{
celt_assert(NOLACE_AF3_OUT_CHANNELS == 2);
/* modifies second channel in place */
adashape_process_frame(
&state->tdshape3_state,
x_buffer2 + i_subframe * NOLACE_AF3_OUT_CHANNELS * NOLACE_FRAME_SIZE + NOLACE_FRAME_SIZE,
x_buffer2 + i_subframe * NOLACE_AF3_OUT_CHANNELS * NOLACE_FRAME_SIZE + NOLACE_FRAME_SIZE,
feature_buffer + i_subframe * NOLACE_COND_DIM,
&layers->nolace_tdshape3_alpha1_f,
&layers->nolace_tdshape3_alpha1_t,
&layers->nolace_tdshape3_alpha2,
NOLACE_TDSHAPE3_FEATURE_DIM,
NOLACE_TDSHAPE3_FRAME_SIZE,
NOLACE_TDSHAPE3_AVG_POOL_K,
arch
);
adaconv_process_frame(
&state->af4_state,
x_buffer1 + i_subframe * NOLACE_FRAME_SIZE * NOLACE_AF4_OUT_CHANNELS,
x_buffer2 + i_subframe * NOLACE_FRAME_SIZE * NOLACE_AF4_IN_CHANNELS,
feature_buffer + i_subframe * NOLACE_COND_DIM,
&hNoLACE->layers.nolace_af4_kernel,
&hNoLACE->layers.nolace_af4_gain,
NOLACE_COND_DIM,
NOLACE_FRAME_SIZE,
NOLACE_OVERLAP_SIZE,
NOLACE_AF4_IN_CHANNELS,
NOLACE_AF4_OUT_CHANNELS,
NOLACE_AF4_KERNEL_SIZE,
NOLACE_AF4_LEFT_PADDING,
NOLACE_AF4_FILTER_GAIN_A,
NOLACE_AF4_FILTER_GAIN_B,
NOLACE_AF4_SHAPE_GAIN,
hNoLACE->window,
arch);
}
/* de-emphasis */
for (i_sample = 0; i_sample < 4 * NOLACE_FRAME_SIZE; i_sample ++)
{
x_out[i_sample] = x_buffer1[i_sample] + NOLACE_PREEMPH * state->deemph_mem;
state->deemph_mem = x_out[i_sample];
}
#ifdef DEBUG_NOLACE
fwrite(x_out, sizeof(float), 4 * NOLACE_FRAME_SIZE, f_xdeemph);
#endif
}
#endif /* #ifndef DISABLE_NOLACE */
/* API */
void osce_reset(silk_OSCE_struct *hOSCE, int method)
{
OSCEState *state = &hOSCE->state;
OPUS_CLEAR(&hOSCE->features, 1);
switch(method)
{
case OSCE_METHOD_NONE:
break;
#ifndef DISABLE_LACE
case OSCE_METHOD_LACE:
reset_lace_state(&state->lace);
break;
#endif
#ifndef DISABLE_NOLACE
case OSCE_METHOD_NOLACE:
reset_nolace_state(&state->nolace);
break;
#endif
default:
celt_assert(0 && "method not defined"); /* Question: return error code? */
}
hOSCE->method = method;
hOSCE->features.reset = 2;
}
#if 0
#include <stdio.h>
static void print_float_array(FILE *fid, const char *name, const float *array, int n)
{
int i;
for (i = 0; i < n; i++)
{
fprintf(fid, "%s[%d]: %f\n", name, i, array[i]);
}
}
static void print_int_array(FILE *fid, const char *name, const int *array, int n)
{
int i;
for (i = 0; i < n; i++)
{
fprintf(fid, "%s[%d]: %d\n", name, i, array[i]);
}
}
static void print_int8_array(FILE *fid, const char *name, const opus_int8 *array, int n)
{
int i;
for (i = 0; i < n; i++)
{
fprintf(fid, "%s[%d]: %d\n", name, i, array[i]);
}
}
static void print_linear_layer(FILE *fid, const char *name, LinearLayer *layer)
{
int i, n_in, n_out, n_total;
char tmp[256];
n_in = layer->nb_inputs;
n_out = layer->nb_outputs;
n_total = n_in * n_out;
fprintf(fid, "\nprinting layer %s...\n", name);
fprintf(fid, "%s.nb_inputs: %d\n%s.nb_outputs: %d\n", name, n_in, name, n_out);
if (layer->bias !=NULL){}
if (layer->subias !=NULL){}
if (layer->weights !=NULL){}
if (layer->float_weights !=NULL){}
if (layer->bias != NULL) {sprintf(tmp, "%s.bias", name); print_float_array(fid, tmp, layer->bias, n_out);}
if (layer->subias != NULL) {sprintf(tmp, "%s.subias", name); print_float_array(fid, tmp, layer->subias, n_out);}
if (layer->weights != NULL) {sprintf(tmp, "%s.weights", name); print_int8_array(fid, tmp, layer->weights, n_total);}
if (layer->float_weights != NULL) {sprintf(tmp, "%s.float_weights", name); print_float_array(fid, tmp, layer->float_weights, n_total);}
//if (layer->weights_idx != NULL) {sprintf(tmp, "%s.weights_idx", name); print_float_array(fid, tmp, layer->weights_idx, n_total);}
if (layer->diag != NULL) {sprintf(tmp, "%s.diag", name); print_float_array(fid, tmp, layer->diag, n_in);}
if (layer->scale != NULL) {sprintf(tmp, "%s.scale", name); print_float_array(fid, tmp, layer->scale, n_out);}
}
#endif
int osce_load_models(OSCEModel *model, const void *data, int len)
{
int ret = 0;
WeightArray *list;
if (data != NULL && len)
{
/* init from buffer */
parse_weights(&list, data, len);
#ifndef DISABLE_LACE
if (ret == 0) {ret = init_lace(&model->lace, list);}
#endif
#ifndef DISABLE_NOLACE
if (ret == 0) {ret = init_nolace(&model->nolace, list);}
#endif
free(list);
} else
{
#ifdef USE_WEIGHTS_FILE
return -1;
#else
#ifndef DISABLE_LACE
if (ret == 0) {ret = init_lace(&model->lace, lacelayers_arrays);}
#endif
#ifndef DISABLE_NOLACE
if (ret == 0) {ret = init_nolace(&model->nolace, nolacelayers_arrays);}
#endif
#endif /* USE_WEIGHTS_FILE */
}
ret = ret ? -1 : 0;
return ret;
}
void osce_enhance_frame(
OSCEModel *model, /* I OSCE model struct */
silk_decoder_state *psDec, /* I/O Decoder state */
silk_decoder_control *psDecCtrl, /* I Decoder control */
opus_int16 xq[], /* I/O Decoded speech */
opus_int32 num_bits, /* I Size of SILK payload in bits */
int arch /* I Run-time architecture */
)
{
float in_buffer[320];
float out_buffer[320];
float features[4 * OSCE_FEATURE_DIM];
float numbits[2];
int periods[4];
int i;
/* enhancement only implemented for 20 ms frame at 16kHz */
if (psDec->fs_kHz != 16 || psDec->nb_subfr != 4)
{
osce_reset(&psDec->osce, psDec->osce.method);
return;
}
osce_calculate_features(psDec, psDecCtrl, features, numbits, periods, xq, num_bits);
/* scale input */
for (i = 0; i < 320; i++)
{
in_buffer[i] = ((float) xq[i]) * (1.f/32768.f);
}
switch(psDec->osce.method)
{
case OSCE_METHOD_NONE:
OPUS_COPY(out_buffer, in_buffer, 320);
break;
#ifndef DISABLE_LACE
case OSCE_METHOD_LACE:
lace_process_20ms_frame(&model->lace, &psDec->osce.state.lace, out_buffer, in_buffer, features, numbits, periods, arch);
break;
#endif
#ifndef DISABLE_NOLACE
case OSCE_METHOD_NOLACE:
nolace_process_20ms_frame(&model->nolace, &psDec->osce.state.nolace, out_buffer, in_buffer, features, numbits, periods, arch);
break;
#endif
default:
celt_assert(0 && "method not defined");
}
#ifdef ENABLE_OSCE_TRAINING_DATA
int k;
static FILE *flpc = NULL;
static FILE *fgain = NULL;
static FILE *fltp = NULL;
static FILE *fperiod = NULL;
static FILE *fnoisy16k = NULL;
static FILE* f_numbits = NULL;
static FILE* f_numbits_smooth = NULL;
if (flpc == NULL) {flpc = fopen("features_lpc.f32", "wb");}
if (fgain == NULL) {fgain = fopen("features_gain.f32", "wb");}
if (fltp == NULL) {fltp = fopen("features_ltp.f32", "wb");}
if (fperiod == NULL) {fperiod = fopen("features_period.s16", "wb");}
if (fnoisy16k == NULL) {fnoisy16k = fopen("noisy_16k.s16", "wb");}
if(f_numbits == NULL) {f_numbits = fopen("features_num_bits.s32", "wb");}
if (f_numbits_smooth == NULL) {f_numbits_smooth = fopen("features_num_bits_smooth.f32", "wb");}
fwrite(&num_bits, sizeof(num_bits), 1, f_numbits);
fwrite(&(psDec->osce.features.numbits_smooth), sizeof(psDec->osce.features.numbits_smooth), 1, f_numbits_smooth);
for (k = 0; k < psDec->nb_subfr; k++)
{
float tmp;
int16_t itmp;
float lpc_buffer[16] = {0};
opus_int16 *A_Q12, *B_Q14;
(void) num_bits;
(void) arch;
/* gain */
tmp = (float) psDecCtrl->Gains_Q16[k] / (1UL << 16);
fwrite(&tmp, sizeof(tmp), 1, fgain);
/* LPC */
A_Q12 = psDecCtrl->PredCoef_Q12[ k >> 1 ];
for (i = 0; i < psDec->LPC_order; i++)
{
lpc_buffer[i] = (float) A_Q12[i] / (1U << 12);
}
fwrite(lpc_buffer, sizeof(lpc_buffer[0]), 16, flpc);
/* LTP */
B_Q14 = &psDecCtrl->LTPCoef_Q14[ k * LTP_ORDER ];
for (i = 0; i < 5; i++)
{
tmp = (float) B_Q14[i] / (1U << 14);
fwrite(&tmp, sizeof(tmp), 1, fltp);
}
/* periods */
itmp = psDec->indices.signalType == TYPE_VOICED ? psDecCtrl->pitchL[ k ] : 0;
fwrite(&itmp, sizeof(itmp), 1, fperiod);
}
fwrite(xq, psDec->nb_subfr * psDec->subfr_length, sizeof(xq[0]), fnoisy16k);
#endif
if (psDec->osce.features.reset > 1)
{
OPUS_COPY(out_buffer, in_buffer, 320);
psDec->osce.features.reset --;
}
else if (psDec->osce.features.reset)
{
osce_cross_fade_10ms(out_buffer, in_buffer, 320);
psDec->osce.features.reset = 0;
}
/* scale output */
for (i = 0; i < 320; i++)
{
float tmp = 32768.f * out_buffer[i];
if (tmp > 32767.f) tmp = 32767.f;
if (tmp < -32767.f) tmp = -32767.f;
xq[i] = float2int(tmp);
}
}
#if 0
#include <stdio.h>
void lace_feature_net_compare(
const char * prefix,
int num_frames,
LACE* hLACE
)
{
char in_feature_file[256];
char out_feature_file[256];
char numbits_file[256];
char periods_file[256];
char message[512];
int i_frame, i_feature;
float mse;
float in_features[4 * LACE_NUM_FEATURES];
float out_features[4 * LACE_COND_DIM];
float out_features2[4 * LACE_COND_DIM];
float numbits[2];
int periods[4];
init_lace(hLACE);
FILE *f_in_features, *f_out_features, *f_numbits, *f_periods;
strcpy(in_feature_file, prefix);
strcat(in_feature_file, "_in_features.f32");
f_in_features = fopen(in_feature_file, "rb");
if (f_in_features == NULL)
{
sprintf(message, "could not open file %s", in_feature_file);
perror(message);
exit(1);
}
strcpy(out_feature_file, prefix);
strcat(out_feature_file, "_out_features.f32");
f_out_features = fopen(out_feature_file, "rb");
if (f_out_features == NULL)
{
sprintf(message, "could not open file %s", out_feature_file);
perror(message);
exit(1);
}
strcpy(periods_file, prefix);
strcat(periods_file, "_periods.s32");
f_periods = fopen(periods_file, "rb");
if (f_periods == NULL)
{
sprintf(message, "could not open file %s", periods_file);
perror(message);
exit(1);
}
strcpy(numbits_file, prefix);
strcat(numbits_file, "_numbits.f32");
f_numbits = fopen(numbits_file, "rb");
if (f_numbits == NULL)
{
sprintf(message, "could not open file %s", numbits_file);
perror(message);
exit(1);
}
for (i_frame = 0; i_frame < num_frames; i_frame ++)
{
if(fread(in_features, sizeof(float), 4 * LACE_NUM_FEATURES, f_in_features) != 4 * LACE_NUM_FEATURES)
{
fprintf(stderr, "could not read frame %d from in_features\n", i_frame);
exit(1);
}
if(fread(out_features, sizeof(float), 4 * LACE_COND_DIM, f_out_features) != 4 * LACE_COND_DIM)
{
fprintf(stderr, "could not read frame %d from out_features\n", i_frame);
exit(1);
}
if(fread(periods, sizeof(int), 4, f_periods) != 4)
{
fprintf(stderr, "could not read frame %d from periods\n", i_frame);
exit(1);
}
if(fread(numbits, sizeof(float), 2, f_numbits) != 2)
{
fprintf(stderr, "could not read frame %d from numbits\n", i_frame);
exit(1);
}
lace_feature_net(hLACE, out_features2, in_features, numbits, periods);
float mse = 0;
for (int i = 0; i < 4 * LACE_COND_DIM; i ++)
{
mse += pow(out_features[i] - out_features2[i], 2);
}
mse /= (4 * LACE_COND_DIM);
printf("rmse: %f\n", sqrt(mse));
}
fclose(f_in_features);
fclose(f_out_features);
fclose(f_numbits);
fclose(f_periods);
}
void lace_demo(
char *prefix,
char *output
)
{
char feature_file[256];
char numbits_file[256];
char periods_file[256];
char x_in_file[256];
char message[512];
int i_frame;
float mse;
float features[4 * LACE_NUM_FEATURES];
float numbits[2];
int periods[4];
float x_in[4 * LACE_FRAME_SIZE];
int16_t x_out[4 * LACE_FRAME_SIZE];
float buffer[4 * LACE_FRAME_SIZE];
LACE hLACE;
int frame_counter = 0;
FILE *f_features, *f_numbits, *f_periods, *f_x_in, *f_x_out;
init_lace(&hLACE);
strcpy(feature_file, prefix);
strcat(feature_file, "_features.f32");
f_features = fopen(feature_file, "rb");
if (f_features == NULL)
{
sprintf(message, "could not open file %s", feature_file);
perror(message);
exit(1);
}
strcpy(x_in_file, prefix);
strcat(x_in_file, "_x_in.f32");
f_x_in = fopen(x_in_file, "rb");
if (f_x_in == NULL)
{
sprintf(message, "could not open file %s", x_in_file);
perror(message);
exit(1);
}
f_x_out = fopen(output, "wb");
if (f_x_out == NULL)
{
sprintf(message, "could not open file %s", output);
perror(message);
exit(1);
}
strcpy(periods_file, prefix);
strcat(periods_file, "_periods.s32");
f_periods = fopen(periods_file, "rb");
if (f_periods == NULL)
{
sprintf(message, "could not open file %s", periods_file);
perror(message);
exit(1);
}
strcpy(numbits_file, prefix);
strcat(numbits_file, "_numbits.f32");
f_numbits = fopen(numbits_file, "rb");
if (f_numbits == NULL)
{
sprintf(message, "could not open file %s", numbits_file);
perror(message);
exit(1);
}
printf("processing %s\n", prefix);
while (fread(x_in, sizeof(float), 4 * LACE_FRAME_SIZE, f_x_in) == 4 * LACE_FRAME_SIZE)
{
printf("\rframe: %d", frame_counter++);
if(fread(features, sizeof(float), 4 * LACE_NUM_FEATURES, f_features) != 4 * LACE_NUM_FEATURES)
{
fprintf(stderr, "could not read frame %d from features\n", i_frame);
exit(1);
}
if(fread(periods, sizeof(int), 4, f_periods) != 4)
{
fprintf(stderr, "could not read frame %d from periods\n", i_frame);
exit(1);
}
if(fread(numbits, sizeof(float), 2, f_numbits) != 2)
{
fprintf(stderr, "could not read frame %d from numbits\n", i_frame);
exit(1);
}
lace_process_20ms_frame(
&hLACE,
buffer,
x_in,
features,
numbits,
periods
);
for (int n=0; n < 4 * LACE_FRAME_SIZE; n ++)
{
float tmp = (1UL<<15) * buffer[n];
tmp = CLIP(tmp, -32768, 32767);
x_out[n] = (int16_t) round(tmp);
}
fwrite(x_out, sizeof(int16_t), 4 * LACE_FRAME_SIZE, f_x_out);
}
printf("\ndone!\n");
fclose(f_features);
fclose(f_numbits);
fclose(f_periods);
fclose(f_x_in);
fclose(f_x_out);
}
void nolace_demo(
char *prefix,
char *output
)
{
char feature_file[256];
char numbits_file[256];
char periods_file[256];
char x_in_file[256];
char message[512];
int i_frame;
float mse;
float features[4 * LACE_NUM_FEATURES];
float numbits[2];
int periods[4];
float x_in[4 * LACE_FRAME_SIZE];
int16_t x_out[4 * LACE_FRAME_SIZE];
float buffer[4 * LACE_FRAME_SIZE];
NoLACE hNoLACE;
int frame_counter = 0;
FILE *f_features, *f_numbits, *f_periods, *f_x_in, *f_x_out;
init_nolace(&hNoLACE);
strcpy(feature_file, prefix);
strcat(feature_file, "_features.f32");
f_features = fopen(feature_file, "rb");
if (f_features == NULL)
{
sprintf(message, "could not open file %s", feature_file);
perror(message);
exit(1);
}
strcpy(x_in_file, prefix);
strcat(x_in_file, "_x_in.f32");
f_x_in = fopen(x_in_file, "rb");
if (f_x_in == NULL)
{
sprintf(message, "could not open file %s", x_in_file);
perror(message);
exit(1);
}
f_x_out = fopen(output, "wb");
if (f_x_out == NULL)
{
sprintf(message, "could not open file %s", output);
perror(message);
exit(1);
}
strcpy(periods_file, prefix);
strcat(periods_file, "_periods.s32");
f_periods = fopen(periods_file, "rb");
if (f_periods == NULL)
{
sprintf(message, "could not open file %s", periods_file);
perror(message);
exit(1);
}
strcpy(numbits_file, prefix);
strcat(numbits_file, "_numbits.f32");
f_numbits = fopen(numbits_file, "rb");
if (f_numbits == NULL)
{
sprintf(message, "could not open file %s", numbits_file);
perror(message);
exit(1);
}
printf("processing %s\n", prefix);
while (fread(x_in, sizeof(float), 4 * LACE_FRAME_SIZE, f_x_in) == 4 * LACE_FRAME_SIZE)
{
printf("\rframe: %d", frame_counter++);
if(fread(features, sizeof(float), 4 * LACE_NUM_FEATURES, f_features) != 4 * LACE_NUM_FEATURES)
{
fprintf(stderr, "could not read frame %d from features\n", i_frame);
exit(1);
}
if(fread(periods, sizeof(int), 4, f_periods) != 4)
{
fprintf(stderr, "could not read frame %d from periods\n", i_frame);
exit(1);
}
if(fread(numbits, sizeof(float), 2, f_numbits) != 2)
{
fprintf(stderr, "could not read frame %d from numbits\n", i_frame);
exit(1);
}
nolace_process_20ms_frame(
&hNoLACE,
buffer,
x_in,
features,
numbits,
periods
);
for (int n=0; n < 4 * LACE_FRAME_SIZE; n ++)
{
float tmp = (1UL<<15) * buffer[n];
tmp = CLIP(tmp, -32768, 32767);
x_out[n] = (int16_t) round(tmp);
}
fwrite(x_out, sizeof(int16_t), 4 * LACE_FRAME_SIZE, f_x_out);
}
printf("\ndone!\n");
fclose(f_features);
fclose(f_numbits);
fclose(f_periods);
fclose(f_x_in);
fclose(f_x_out);
}
int main()
{
#if 0
LACE hLACE;
lace_feature_net_compare("testvec2/lace", 5, &hLACE);
lace_demo("testdata/test9", "out_lace_c_9kbps.pcm");
lace_demo("testdata/test6", "out_lace_c_6kbps.pcm");
#endif
nolace_demo("testdata/test9", "out_nolace_c_9kbps.pcm");
}
#endif
/*gcc -I ../include -I . -I ../silk -I ../celt osce.c nndsp.c lace_data.c nolace_data.c nnet.c parse_lpcnet_weights.c -lm -o lacetest*/