ref: 2c9b8474549da0fea69d05cb7b8cfa3177cdba51
parent: 80751bad709ce33f892b2f8b34f1e62d20d73574
author: Jean-Marc Valin <jmvalin@amazon.com>
date: Tue Aug 17 14:17:25 EDT 2021
Noise tuning; randomly flip the sign of the speech signal
--- a/dnn/dump_data.c
+++ b/dnn/dump_data.c
@@ -244,6 +244,7 @@
if (training && ++gain_change_count > 2821) {
float tmp, tmp2;
speech_gain = pow(10., (-20+(rand()%40))/20.);
+ if (rand()&1) speech_gain = -speech_gain;
if (rand()%20==0) speech_gain *= .01;
if (rand()%100==0) speech_gain = 0;
gain_change_count = 0;
@@ -250,7 +251,7 @@
rand_resp(a_sig, b_sig);
tmp = (float)rand()/RAND_MAX;
tmp2 = (float)rand()/RAND_MAX;
- noise_std = -log(tmp)-log(tmp2);
+ noise_std = ABS16(-1.5*log(1e-4+tmp)-.5*log(1e-4+tmp2));
}
biquad(x, mem_hp_x, x, b_hp, a_hp, FRAME_SIZE);
biquad(x, mem_resp_x, x, b_sig, a_sig, FRAME_SIZE);
--- a/dnn/lpcnet_private.h
+++ b/dnn/lpcnet_private.h
@@ -1,6 +1,7 @@
#ifndef LPCNET_PRIVATE_H
#define LPCNET_PRIVATE_H
+#include <stdio.h>
#include "common.h"
#include "freq.h"
#include "lpcnet.h"
@@ -73,5 +74,7 @@
void compute_frame_features(LPCNetEncState *st, const float *in);
void decode_packet(float features[4][NB_TOTAL_FEATURES], float *vq_mem, const unsigned char buf[8]);
+
+void process_single_frame(LPCNetEncState *st, FILE *ffeat);
#endif
--
⑨