shithub: opus

Download patch

ref: 2c9b8474549da0fea69d05cb7b8cfa3177cdba51
parent: 80751bad709ce33f892b2f8b34f1e62d20d73574
author: Jean-Marc Valin <jmvalin@amazon.com>
date: Tue Aug 17 14:17:25 EDT 2021

noise tuning, flip sign of speech signal

--- a/dnn/dump_data.c
+++ b/dnn/dump_data.c
@@ -244,6 +244,7 @@
     if (training && ++gain_change_count > 2821) {
       float tmp, tmp2;
       speech_gain = pow(10., (-20+(rand()%40))/20.);
+      if (rand()&1) speech_gain = -speech_gain;
       if (rand()%20==0) speech_gain *= .01;
       if (rand()%100==0) speech_gain = 0;
       gain_change_count = 0;
@@ -250,7 +251,7 @@
       rand_resp(a_sig, b_sig);
       tmp = (float)rand()/RAND_MAX;
       tmp2 = (float)rand()/RAND_MAX;
-      noise_std = -log(tmp)-log(tmp2);
+      noise_std = ABS16(-1.5*log(1e-4+tmp)-.5*log(1e-4+tmp2));
     }
     biquad(x, mem_hp_x, x, b_hp, a_hp, FRAME_SIZE);
     biquad(x, mem_resp_x, x, b_sig, a_sig, FRAME_SIZE);
--- a/dnn/lpcnet_private.h
+++ b/dnn/lpcnet_private.h
@@ -1,6 +1,7 @@
 #ifndef LPCNET_PRIVATE_H
 #define LPCNET_PRIVATE_H
 
+#include <stdio.h>
 #include "common.h"
 #include "freq.h"
 #include "lpcnet.h"
@@ -73,5 +74,7 @@
 void compute_frame_features(LPCNetEncState *st, const float *in);
 
 void decode_packet(float features[4][NB_TOTAL_FEATURES], float *vq_mem, const unsigned char buf[8]);
+
+void process_single_frame(LPCNetEncState *st, FILE *ffeat);
 
 #endif
--