experimental 450 bit/s mode

author drowe67 <drowe67@01035d8c-6547-0410-b346-abe4f91aad63>

Wed, 1 Oct 2014 06:55:54 +0000 (06:55 +0000)

committer drowe67 <drowe67@01035d8c-6547-0410-b346-abe4f91aad63>

Wed, 1 Oct 2014 06:55:54 +0000 (06:55 +0000)
author drowe67 <drowe67@01035d8c-6547-0410-b346-abe4f91aad63>
Wed, 1 Oct 2014 06:55:54 +0000 (06:55 +0000)
committer drowe67 <drowe67@01035d8c-6547-0410-b346-abe4f91aad63>
Wed, 1 Oct 2014 06:55:54 +0000 (06:55 +0000)
diff --git a/codec2-dev/src/c2dec.c b/codec2-dev/src/c2dec.c

index 641e40198c6fc9c8d5076de3acb8c9d2800e6155..0c5103a7121a4c732b22b9e532b0121dc34935ce 100644 (file)
--- a/codec2-dev/src/c2dec.c
+++ b/codec2-dev/src/c2dec.c
@@ -88,8 +88,10 @@ int main(int argc, char *argv[])
         mode = CODEC2_MODE_1300;
      else if (strcmp(argv[1],"1200") == 0)
         mode = CODEC2_MODE_1200;
+    else if (strcmp(argv[1],"450") == 0)
+       mode = CODEC2_MODE_450;
      else {
-       fprintf(stderr, "Error in mode: %s.  Must be 3200, 2400, 1600, 1400, 1300 or 1200\n", argv[1]);
+       fprintf(stderr, "Error in mode: %s.  Must be 3200, 2400, 1600, 1400, 1300, 1200, or 450\n", argv[1]);
         exit(1);
      }
      bit_rate = atoi(argv[1]);
diff --git a/codec2-dev/src/c2enc.c b/codec2-dev/src/c2enc.c

index f0d9bca1e000886cb54a2c410009d6a3ee6450e2..a457a8f9602dec9be9647d2293a8993a0dfea1dc 100644 (file)
--- a/codec2-dev/src/c2enc.c
+++ b/codec2-dev/src/c2enc.c
@@ -44,7 +44,7 @@ int main(int argc, char *argv[])
      int            nsam, nbit, nbyte, gray;
   
      if (argc < 4) {
-       printf("usage: c2enc 3200|2400|1600|1400|1300|1200 InputRawspeechFile OutputBitFile [--natural]\n");
+       printf("usage: c2enc 3200|2400|1600|1400|1300|1200|450 InputRawspeechFile OutputBitFile [--natural]\n");
         printf("e.g    c2enc 1400 ../raw/hts1a.raw hts1a.c2\n");
         printf("e.g    c2enc 1300 ../raw/hts1a.raw hts1a.c2 --natural\n");
         exit(1);
@@ -62,8 +62,10 @@ int main(int argc, char *argv[])
         mode = CODEC2_MODE_1300;
      else if (strcmp(argv[1],"1200") == 0)
         mode = CODEC2_MODE_1200;
+    else if (strcmp(argv[1],"450") == 0)
+       mode = CODEC2_MODE_450;
      else {
-       fprintf(stderr, "Error in mode: %s.  Must be 3200, 2400, 1600, 1400, 1300 or 1200\n", argv[1]);
+       fprintf(stderr, "Error in mode: %s.  Must be 3200, 2400, 1600, 1400, 1300, 1200 or 450\n", argv[1]);
         exit(1);
      }
  
diff --git a/codec2-dev/src/c2sim.c b/codec2-dev/src/c2sim.c

index dc258ea1714c650d960ea67b8d930d7af6a2e9e7..5dc1f40021dff1a165595d85ef1042c0ac84eb1e 100644 (file)
--- a/codec2-dev/src/c2sim.c
+++ b/codec2-dev/src/c2sim.c
@@ -676,14 +676,14 @@ int main(int argc, char *argv[])
         
             if (scalar_quant_Wo_e) {
  
-               e = decode_energy(encode_energy(e));
+               e = decode_energy(encode_energy(e, E_BITS), E_BITS);
  
                 if (!decimate) {
                     /* we send params every 10ms, delta-time every 20ms */
                     if (dt && (frames % 2)) 
                         model.Wo = decode_Wo_dt(encode_Wo_dt(model.Wo, prev_Wo),prev_Wo);
                     else
-                       model.Wo = decode_Wo(encode_Wo(model.Wo));
+                       model.Wo = decode_Wo(encode_Wo(model.Wo, WO_BITS), WO_BITS);
                 }
  
                 if (decimate) {
@@ -693,7 +693,7 @@ int main(int argc, char *argv[])
                         model.Wo = decode_Wo_dt(encode_Wo_dt(model.Wo, prev__Wo),prev__Wo);
                     }
                     else
-                       model.Wo = decode_Wo(encode_Wo(model.Wo));                  
+                       model.Wo = decode_Wo(encode_Wo(model.Wo, WO_BITS), WO_BITS);                
                 }
  
                 model.L  = PI/model.Wo; /* if we quantise Wo re-compute L */
diff --git a/codec2-dev/src/codec2.c b/codec2-dev/src/codec2.c

index 60489e1cbe6970ff71bd933752689aad20a18d20..08604a55553ee054fd69e7badfdf1899fff5e8f7 100644 (file)
--- a/codec2-dev/src/codec2.c
+++ b/codec2-dev/src/codec2.c
@@ -67,6 +67,8 @@ void codec2_encode_1300(struct CODEC2 *c2, unsigned char * bits, short speech[])
  void codec2_decode_1300(struct CODEC2 *c2, short speech[], const unsigned char * bits, float ber_est);
  void codec2_encode_1200(struct CODEC2 *c2, unsigned char * bits, short speech[]);
  void codec2_decode_1200(struct CODEC2 *c2, short speech[], const unsigned char * bits);
+void codec2_encode_450(struct CODEC2 *c2, unsigned char * bits, short speech[]);
+void codec2_decode_450(struct CODEC2 *c2, short speech[], const unsigned char * bits);
  static void ear_protection(float in_out[], int n);
  
  /*---------------------------------------------------------------------------*\
@@ -104,7 +106,8 @@ struct CODEC2 * CODEC2_WIN32SUPPORT codec2_create(int mode)
            (mode == CODEC2_MODE_1600) || 
            (mode == CODEC2_MODE_1400) || 
            (mode == CODEC2_MODE_1300) || 
-          (mode == CODEC2_MODE_1200)
+          (mode == CODEC2_MODE_1200) ||
+          (mode == CODEC2_MODE_450) 
            );
      c2->mode = mode;
      for(i=0; i<M; i++)
@@ -192,6 +195,8 @@ int CODEC2_WIN32SUPPORT codec2_bits_per_frame(struct CODEC2 *c2) {
         return 52;
      if  (c2->mode == CODEC2_MODE_1200)
         return 48;
+    if  (c2->mode == CODEC2_MODE_450)
+       return 18;
  
      return 0; /* shouldn't get here */
  }
@@ -203,7 +208,7 @@ int CODEC2_WIN32SUPPORT codec2_bits_per_frame(struct CODEC2 *c2) {
    AUTHOR......: David Rowe                           
    DATE CREATED: Nov 14 2011
  
-  Returns the number of bits per frame.
+  Returns the number of speech samples per frame.
  
  \*---------------------------------------------------------------------------*/
  
@@ -220,6 +225,8 @@ int CODEC2_WIN32SUPPORT codec2_samples_per_frame(struct CODEC2 *c2) {
         return 320;
      if  (c2->mode == CODEC2_MODE_1200)
         return 320;
+    if  (c2->mode == CODEC2_MODE_450)
+       return 320;
  
      return 0; /* shouldnt get here */
  }
@@ -233,7 +240,8 @@ void CODEC2_WIN32SUPPORT codec2_encode(struct CODEC2 *c2, unsigned char *bits, s
            (c2->mode == CODEC2_MODE_1600) || 
            (c2->mode == CODEC2_MODE_1400) || 
            (c2->mode == CODEC2_MODE_1300) || 
-          (c2->mode == CODEC2_MODE_1200)
+          (c2->mode == CODEC2_MODE_1200) ||
+          (c2->mode == CODEC2_MODE_450)
            );
  
      if (c2->mode == CODEC2_MODE_3200)
@@ -248,6 +256,8 @@ void CODEC2_WIN32SUPPORT codec2_encode(struct CODEC2 *c2, unsigned char *bits, s
         codec2_encode_1300(c2, bits, speech);
      if (c2->mode == CODEC2_MODE_1200)
         codec2_encode_1200(c2, bits, speech);
+    if (c2->mode == CODEC2_MODE_450)
+       codec2_encode_450(c2, bits, speech);
  }
  
  void CODEC2_WIN32SUPPORT codec2_decode(struct CODEC2 *c2, short speech[], const unsigned char *bits)
@@ -264,7 +274,8 @@ void CODEC2_WIN32SUPPORT codec2_decode_ber(struct CODEC2 *c2, short speech[], co
            (c2->mode == CODEC2_MODE_1600) || 
            (c2->mode == CODEC2_MODE_1400) || 
            (c2->mode == CODEC2_MODE_1300) || 
-          (c2->mode == CODEC2_MODE_1200)
+          (c2->mode == CODEC2_MODE_1200) ||
+          (c2->mode == CODEC2_MODE_450)
            );
  
      if (c2->mode == CODEC2_MODE_3200)
@@ -279,6 +290,8 @@ void CODEC2_WIN32SUPPORT codec2_decode_ber(struct CODEC2 *c2, short speech[], co
         codec2_decode_1300(c2, speech, bits, ber_est);
      if (c2->mode == CODEC2_MODE_1200)
         codec2_decode_1200(c2, speech, bits);
+    if (c2->mode == CODEC2_MODE_450)
+       codec2_decode_450(c2, speech, bits);
  }
  
  
@@ -332,11 +345,11 @@ void codec2_encode_3200(struct CODEC2 *c2, unsigned char * bits, short speech[])
  
      analyse_one_frame(c2, &model, &speech[N]);
      pack(bits, &nbit, model.voiced, 1);
-    Wo_index = encode_Wo(model.Wo);
+    Wo_index = encode_Wo(model.Wo, WO_BITS);
      pack(bits, &nbit, Wo_index, WO_BITS);
     
      e = speech_to_uq_lsps(lsps, ak, c2->Sn, c2->w, LPC_ORD);
-    e_index = encode_energy(e);
+    e_index = encode_energy(e, E_BITS);
      pack(bits, &nbit, e_index, E_BITS);
  
      encode_lspds_scalar(lspd_indexes, lsps, LPC_ORD);
@@ -387,11 +400,11 @@ void codec2_decode_3200(struct CODEC2 *c2, short speech[], const unsigned char *
      model[1].voiced = unpack(bits, &nbit, 1);
  
      Wo_index = unpack(bits, &nbit, WO_BITS);
-    model[1].Wo = decode_Wo(Wo_index);
+    model[1].Wo = decode_Wo(Wo_index, WO_BITS);
      model[1].L  = PI/model[1].Wo;
  
      e_index = unpack(bits, &nbit, E_BITS);
-    e[1] = decode_energy(e_index);
+    e[1] = decode_energy(e_index, E_BITS);
  
      for(i=0; i<LSPD_SCALAR_INDEXES; i++) {
         lspd_indexes[i] = unpack(bits, &nbit, lspd_bits(i));
@@ -623,12 +636,12 @@ void codec2_encode_1600(struct CODEC2 *c2, unsigned char * bits, short speech[])
      analyse_one_frame(c2, &model, &speech[N]);
      pack(bits, &nbit, model.voiced, 1);
   
-    Wo_index = encode_Wo(model.Wo);
+    Wo_index = encode_Wo(model.Wo, WO_BITS);
      pack(bits, &nbit, Wo_index, WO_BITS);
  
      /* need to run this just to get LPC energy */
      e = speech_to_uq_lsps(lsps, ak, c2->Sn, c2->w, LPC_ORD);
-    e_index = encode_energy(e);
+    e_index = encode_energy(e, E_BITS);
      pack(bits, &nbit, e_index, E_BITS);
  
      /* frame 3: - voicing ---------------------------------------------*/
@@ -641,11 +654,11 @@ void codec2_encode_1600(struct CODEC2 *c2, unsigned char * bits, short speech[])
      analyse_one_frame(c2, &model, &speech[3*N]);
      pack(bits, &nbit, model.voiced, 1);
   
-    Wo_index = encode_Wo(model.Wo);
+    Wo_index = encode_Wo(model.Wo, WO_BITS);
      pack(bits, &nbit, Wo_index, WO_BITS);
  
      e = speech_to_uq_lsps(lsps, ak, c2->Sn, c2->w, LPC_ORD);
-    e_index = encode_energy(e);
+    e_index = encode_energy(e, E_BITS);
      pack(bits, &nbit, e_index, E_BITS);
   
      encode_lsps_scalar(lsp_indexes, lsps, LPC_ORD);
@@ -698,21 +711,21 @@ void codec2_decode_1600(struct CODEC2 *c2, short speech[], const unsigned char *
      
      model[1].voiced = unpack(bits, &nbit, 1);
      Wo_index = unpack(bits, &nbit, WO_BITS);
-    model[1].Wo = decode_Wo(Wo_index);
+    model[1].Wo = decode_Wo(Wo_index, WO_BITS);
      model[1].L  = PI/model[1].Wo;
  
      e_index = unpack(bits, &nbit, E_BITS);
-    e[1] = decode_energy(e_index);
+    e[1] = decode_energy(e_index, E_BITS);
  
      model[2].voiced = unpack(bits, &nbit, 1);
  
      model[3].voiced = unpack(bits, &nbit, 1);
      Wo_index = unpack(bits, &nbit, WO_BITS);
-    model[3].Wo = decode_Wo(Wo_index);
+    model[3].Wo = decode_Wo(Wo_index, WO_BITS);
      model[3].L  = PI/model[3].Wo;
  
      e_index = unpack(bits, &nbit, E_BITS);
-    e[3] = decode_energy(e_index);
+    e[3] = decode_energy(e_index, E_BITS);
   
      for(i=0; i<LSP_SCALAR_INDEXES; i++) {
         lsp_indexes[i] = unpack(bits, &nbit, lsp_bits(i));
@@ -990,14 +1003,14 @@ void codec2_encode_1300(struct CODEC2 *c2, unsigned char * bits, short speech[])
      analyse_one_frame(c2, &model, &speech[3*N]);
      pack_natural_or_gray(bits, &nbit, model.voiced, 1, c2->gray);
   
-    Wo_index = encode_Wo(model.Wo);
+    Wo_index = encode_Wo(model.Wo, WO_BITS);
      pack_natural_or_gray(bits, &nbit, Wo_index, WO_BITS, c2->gray);
  
      #ifdef PROFILE
      quant_start = machdep_profile_sample();
      #endif
      e = speech_to_uq_lsps(lsps, ak, c2->Sn, c2->w, LPC_ORD);
-    e_index = encode_energy(e);
+    e_index = encode_energy(e, E_BITS);
      pack_natural_or_gray(bits, &nbit, e_index, E_BITS, c2->gray);
   
      encode_lsps_scalar(lsp_indexes, lsps, LPC_ORD);
@@ -1056,11 +1069,11 @@ void codec2_decode_1300(struct CODEC2 *c2, short speech[], const unsigned char *
      model[3].voiced = unpack_natural_or_gray(bits, &nbit, 1, c2->gray);
  
      Wo_index = unpack_natural_or_gray(bits, &nbit, WO_BITS, c2->gray);
-    model[3].Wo = decode_Wo(Wo_index);
+    model[3].Wo = decode_Wo(Wo_index, WO_BITS);
      model[3].L  = PI/model[3].Wo;
  
      e_index = unpack_natural_or_gray(bits, &nbit, E_BITS, c2->gray);
-    e[3] = decode_energy(e_index);
+    e[3] = decode_energy(e_index, E_BITS);
   
      for(i=0; i<LSP_SCALAR_INDEXES; i++) {
         lsp_indexes[i] = unpack_natural_or_gray(bits, &nbit, lsp_bits(i), c2->gray);
@@ -1071,7 +1084,7 @@ void codec2_decode_1300(struct CODEC2 *c2, short speech[], const unsigned char *
   
      if (ber_est > 0.15) {
          model[0].voiced =  model[1].voiced = model[2].voiced = model[3].voiced = 0;
-        e[3] = decode_energy(10);
+        e[3] = decode_energy(10, E_BITS);
          bw_expand_lsps(&lsps[3][0], LPC_ORD, 200.0, 200.0);
          fprintf(stderr, "soft mute\n");
      }
@@ -1250,7 +1263,7 @@ void codec2_decode_1200(struct CODEC2 *c2, short speech[], const unsigned char *
      for(i=0; i<LSP_PRED_VQ_INDEXES; i++) {
         lsp_indexes[i] = unpack(bits, &nbit, lsp_pred_vq_bits(i));
      }
-    decode_lsps_vq(lsp_indexes, &lsps[3][0], LPC_ORD);
+    decode_lsps_vq(lsp_indexes, &lsps[3][0], LPC_ORD , 0);
      check_lsp_order(&lsps[3][0], LPC_ORD);
      bw_expand_lsps(&lsps[3][0], LPC_ORD, 50.0, 100.0);
   
@@ -1287,6 +1300,155 @@ void codec2_decode_1200(struct CODEC2 *c2, short speech[], const unsigned char *
  }
  
  
+/*---------------------------------------------------------------------------*\
+                                                       
+  FUNCTION....: codec2_encode_450           
+  AUTHOR......: David Rowe                           
+  DATE CREATED: Oct 1 2014
+
+  Encodes 320 speech samples (40ms of speech) into 18 bits.  
+
+  The codec2 algorithm actually operates internally on 10ms (80
+  sample) frames, so we run the encoding algorithm four times:
+
+  frame 0: nothing
+  frame 1: nothing
+  frame 2: nothing
+  frame 3: voicing bit, scalar Wo and E, 9 bit VQ of LSPs
+
+  The bit allocation is:
+
+    Parameter                      frames 1-3   frame 4   Total
+    -----------------------------------------------------------
+    Harmonic magnitudes (LSPs)          0          9         9
+    Energy                              0          3         3
+    log Wo                              0          5         5
+    Voicing                             0          1         1
+    TOTAL                               0         18        18
+ 
+\*---------------------------------------------------------------------------*/
+
+void codec2_encode_450(struct CODEC2 *c2, unsigned char * bits, short speech[])
+{
+    MODEL   model;
+    float   lsps[LPC_ORD];
+    float   lsps_[LPC_ORD];
+    float   ak[LPC_ORD+1];
+    float   e;
+    int     lsp_indexes[LPC_ORD];
+    int     Wo_index, e_index;
+    unsigned int nbit = 0;
+
+    assert(c2 != NULL);
+
+    memset(bits, '\0',  ((codec2_bits_per_frame(c2) + 7) / 8));
+
+    /* frame 1 --------------------------------------------------------*/
+
+    analyse_one_frame(c2, &model, speech);
+ 
+    /* frame 2 --------------------------------------------------------*/
+
+    analyse_one_frame(c2, &model, &speech[N]);
+ 
+    /* frame 3 --------------------------------------------------------*/
+
+    analyse_one_frame(c2, &model, &speech[2*N]);
+
+    /* frame 4: - voicing, scalar Wo & E, scalar LSPs -----------------*/
+
+    analyse_one_frame(c2, &model, &speech[3*N]);
+    pack(bits, &nbit, model.voiced, 1);
+    Wo_index = encode_log_Wo(model.Wo, 5);
+    pack_natural_or_gray(bits, &nbit, Wo_index, 5, c2->gray);
+
+    e = speech_to_uq_lsps(lsps, ak, c2->Sn, c2->w, LPC_ORD);
+    e_index = encode_energy(e, 3);
+    pack_natural_or_gray(bits, &nbit, e_index, 3, c2->gray);
+ 
+    encode_lsps_vq(lsp_indexes, lsps, lsps_, LPC_ORD);
+    pack(bits, &nbit, lsp_indexes[0], lsp_pred_vq_bits(0));
+  
+    assert(nbit == (unsigned)codec2_bits_per_frame(c2));
+}
+
+
+/*---------------------------------------------------------------------------*\
+                                                       
+  FUNCTION....: codec2_decode_450           
+  AUTHOR......: David Rowe                           
+  DATE CREATED: Oct 1 2014
+
+  Decodes frames of 18 bits into 320 samples (40ms) of speech.
+
+\*---------------------------------------------------------------------------*/
+
+void codec2_decode_450(struct CODEC2 *c2, short speech[], const unsigned char * bits)
+{
+    MODEL   model[4];
+    int     lsp_indexes[LPC_ORD];
+    float   lsps[4][LPC_ORD];
+    int     Wo_index, e_index;
+    float   e[4];
+    float   snr;
+    float   ak[4][LPC_ORD+1];
+    int     i,j;
+    unsigned int nbit = 0;
+    float   weight;
+    COMP    Aw[FFT_ENC];
+
+    assert(c2 != NULL);
+
+    /* only need to zero these out due to (unused) snr calculation */
+
+    for(i=0; i<4; i++)
+       for(j=1; j<=MAX_AMP; j++)
+           model[i].A[j] = 0.0;
+
+    /* unpack bits from channel ------------------------------------*/
+
+    model[3].voiced = unpack(bits, &nbit, 1);
+    model[0].voiced = model[1].voiced = model[2].voiced = model[3].voiced;
+
+    Wo_index = unpack_natural_or_gray(bits, &nbit, 5, c2->gray);
+    model[3].Wo = decode_log_Wo(Wo_index, 5);
+    model[3].L  = PI/model[3].Wo;
+
+    e_index = unpack_natural_or_gray(bits, &nbit, 3, c2->gray);
+    e[3] = decode_energy(e_index, 3);
+ 
+    lsp_indexes[0] = unpack(bits, &nbit, lsp_pred_vq_bits(0));
+    decode_lsps_vq(lsp_indexes, &lsps[3][0], LPC_ORD, 1);
+    check_lsp_order(&lsps[3][0], LPC_ORD);
+    bw_expand_lsps(&lsps[3][0], LPC_ORD, 50.0, 100.0);
+ 
+    /* interpolate ------------------------------------------------*/
+ 
+    /* LSPs, Wo, and energy are sampled every 40ms so we interpolate
+       the 3 frames in between, then recover spectral amplitudes */
+
+    for(i=0, weight=0.25; i<3; i++, weight += 0.25) {
+       interpolate_lsp_ver2(&lsps[i][0], c2->prev_lsps_dec, &lsps[3][0], weight);
+        interp_Wo2(&model[i], &c2->prev_model_dec, &model[3], weight);
+        e[i] = interp_energy2(c2->prev_e_dec, e[3],weight);
+    }
+    for(i=0; i<4; i++) {
+       lsp_to_lpc(&lsps[i][0], &ak[i][0], LPC_ORD);
+       aks_to_M2(c2->fft_fwd_cfg, &ak[i][0], LPC_ORD, &model[i], e[i], &snr, 0, 0,
+                  c2->lpc_pf, c2->bass_boost, c2->beta, c2->gamma, Aw); 
+       apply_lpc_correction(&model[i]);
+       synthesise_one_frame(c2, &speech[N*i], &model[i], Aw);
+    }
+
+    /* update memories for next frame ----------------------------*/
+
+    c2->prev_model_dec = model[3];
+    c2->prev_e_dec = e[3];
+    for(i=0; i<LPC_ORD; i++)
+       c2->prev_lsps_dec[i] = lsps[3][i];
+}
+
+
  /*---------------------------------------------------------------------------*\
                                                         
    FUNCTION....: synthesise_one_frame()      
diff --git a/codec2-dev/src/codec2.h b/codec2-dev/src/codec2.h

index ea007065092a55e5be28a3ca03afbec5d06d6ddf..ac888d7be13050da11c63b592586c9d6cfd0c1cd 100644 (file)
--- a/codec2-dev/src/codec2.h
+++ b/codec2-dev/src/codec2.h
@@ -52,6 +52,7 @@
  #define CODEC2_MODE_1400 3
  #define CODEC2_MODE_1300 4
  #define CODEC2_MODE_1200 5
+#define CODEC2_MODE_450  6
  
  struct CODEC2;
  
diff --git a/codec2-dev/src/freedv_api.c b/codec2-dev/src/freedv_api.c

index b5491cef9e9368843e8b9f2aa1ff73ee858cd471..c20f5709b4ec7e02a5abc22c95ee22652b75e61b 100644 (file)
--- a/codec2-dev/src/freedv_api.c
+++ b/codec2-dev/src/freedv_api.c
@@ -140,9 +140,10 @@ void freedv_close(struct freedv *freedv) {
    a frame of modem samples that can be sent to the transmitter.
  
    speech_in[] and mod_out[] are sampled at 8 kHz, 16 bit shorts, and
-  FREEDV_NSAMPLES long.  The speech_in[] level should be such that the
-  peak speech level is between +/16384 and +/- 32767.  mod_out[] will
-  be scaled such that the peak level is just less than +/-32767.
+  are always FREEDV_NSAMPLES long.  The speech_in[] level should be
+  such that the peak speech level is between +/16384 and +/- 32767.
+  mod_out[] will be scaled such that the peak level is just less than
+  +/-32767.
  
    The FDM modem signal mod_out[] has a high crest factor (around
    12dB), however the energy and duration of the peaks is small.
diff --git a/codec2-dev/src/quantise.c b/codec2-dev/src/quantise.c

index 23f2660e52208b396d4226860190d205a39863b4..acf2a1a5ba8fdb88cf0a1969e5dc98ce985fedec 100644 (file)
--- a/codec2-dev/src/quantise.c
+++ b/codec2-dev/src/quantise.c
@@ -1007,17 +1007,17 @@ void aks_to_M2(
  
  \*---------------------------------------------------------------------------*/
  
-int encode_Wo(float Wo)
+int encode_Wo(float Wo, int bits)
  {
-    int   index;
+    int   index, Wo_levels = 1<<bits;
      float Wo_min = TWO_PI/P_MAX;
      float Wo_max = TWO_PI/P_MIN;
      float norm;
  
      norm = (Wo - Wo_min)/(Wo_max - Wo_min);
-    index = floorf(WO_LEVELS * norm + 0.5);
+    index = floorf(Wo_levels * norm + 0.5);
      if (index < 0 ) index = 0;
-    if (index > (WO_LEVELS-1)) index = WO_LEVELS-1;
+    if (index > (Wo_levels-1)) index = Wo_levels-1;
  
      return index;
  }
@@ -1032,19 +1032,69 @@ int encode_Wo(float Wo)
  
  \*---------------------------------------------------------------------------*/
  
-float decode_Wo(int index)
+float decode_Wo(int index, int bits)
  {
      float Wo_min = TWO_PI/P_MAX;
      float Wo_max = TWO_PI/P_MIN;
      float step;
      float Wo;
+    int   Wo_levels = 1<<bits;
  
-    step = (Wo_max - Wo_min)/WO_LEVELS;
+    step = (Wo_max - Wo_min)/Wo_levels;
      Wo   = Wo_min + step*(index);
  
      return Wo;
  }
  
+/*---------------------------------------------------------------------------*\
+                                                       
+  FUNCTION....: encode_log_Wo()             
+  AUTHOR......: David Rowe                           
+  DATE CREATED: 22/8/2010 
+
+  Encodes Wo in the log domain using a WO_LEVELS quantiser.
+
+\*---------------------------------------------------------------------------*/
+
+int encode_log_Wo(float Wo, int bits)
+{
+    int   index, Wo_levels = 1<<bits;
+    float Wo_min = TWO_PI/P_MAX;
+    float Wo_max = TWO_PI/P_MIN;
+    float norm;
+
+    norm = (log10f(Wo) - log10f(Wo_min))/(log10f(Wo_max) - log10f(Wo_min));
+    index = floorf(Wo_levels * norm + 0.5);
+    if (index < 0 ) index = 0;
+    if (index > (Wo_levels-1)) index = Wo_levels-1;
+
+    return index;
+}
+
+/*---------------------------------------------------------------------------*\
+                                                       
+  FUNCTION....: decode_log_Wo()             
+  AUTHOR......: David Rowe                           
+  DATE CREATED: 22/8/2010 
+
+  Decodes Wo using a WO_LEVELS quantiser in the log domain.
+
+\*---------------------------------------------------------------------------*/
+
+float decode_log_Wo(int index, int bits)
+{
+    float Wo_min = TWO_PI/P_MAX;
+    float Wo_max = TWO_PI/P_MIN;
+    float step;
+    float Wo;
+    int   Wo_levels = 1<<bits;
+
+    step = (log10f(Wo_max) - log10f(Wo_min))/Wo_levels;
+    Wo   = log10f(Wo_min) + step*(index);
+
+    return powf(10,Wo);
+}
+
  /*---------------------------------------------------------------------------*\
                                                         
    FUNCTION....: encode_Wo_dt()      
@@ -1493,7 +1543,7 @@ void encode_lsps_vq(int *indexes, float *x, float *xq, int order)
  
  \*---------------------------------------------------------------------------*/
  
-void decode_lsps_vq(int *indexes, float *xq, int order)
+void decode_lsps_vq(int *indexes, float *xq, int order, int stages)
  {
    int i, n1, n2, n3;
    const float *codebook1 = lsp_cbjvm[0].cb;
@@ -1504,15 +1554,17 @@ void decode_lsps_vq(int *indexes, float *xq, int order)
    n2 = indexes[1];
    n3 = indexes[2];
  
-  for (i=0;i<order;i++)
-  {
-    xq[i] = codebook1[order*n1+i];
+  for (i=0;i<order;i++) {
+      xq[i] = codebook1[order*n1+i];
    }
-  for (i=0;i<order/2;i++)
-  {
-    xq[2*i] += codebook2[order*n2/2+i];
-    xq[2*i+1] += codebook3[order*n3/2+i];
+  
+  if (stages != 1) {
+      for (i=0;i<order/2;i++) {
+          xq[2*i] += codebook2[order*n2/2+i];
+          xq[2*i+1] += codebook3[order*n3/2+i];
+      }
    }
+  
  }
  
  
@@ -1675,18 +1727,18 @@ void apply_lpc_correction(MODEL *model)
  
  \*---------------------------------------------------------------------------*/
  
-int encode_energy(float e)
+int encode_energy(float e, int bits)
  {
-    int   index;
+    int   index, e_levels = 1<<bits;
      float e_min = E_MIN_DB;
      float e_max = E_MAX_DB;
      float norm;
  
      e = 10.0*log10f(e);
      norm = (e - e_min)/(e_max - e_min);
-    index = floorf(E_LEVELS * norm + 0.5);
+    index = floorf(e_levels * norm + 0.5);
      if (index < 0 ) index = 0;
-    if (index > (E_LEVELS-1)) index = E_LEVELS-1;
+    if (index > (e_levels-1)) index = e_levels-1;
  
      return index;
  }
@@ -1701,14 +1753,15 @@ int encode_energy(float e)
  
  \*---------------------------------------------------------------------------*/
  
-float decode_energy(int index)
+float decode_energy(int index, int bits)
  {
      float e_min = E_MIN_DB;
      float e_max = E_MAX_DB;
      float step;
      float e;
+    int   e_levels = 1<<bits;
  
-    step = (e_max - e_min)/E_LEVELS;
+    step = (e_max - e_min)/e_levels;
      e    = e_min + step*(index);
      e    = powf(10.0,e/10.0);
  
diff --git a/codec2-dev/src/quantise.h b/codec2-dev/src/quantise.h

index d714106793db884288270c6ababa84ed01d30845..f052635f6b7334ce0594b96b9d786bcfffee497c 100644 (file)
--- a/codec2-dev/src/quantise.h
+++ b/codec2-dev/src/quantise.h
@@ -60,8 +60,10 @@ void aks_to_M2(kiss_fft_cfg fft_fwd_cfg, float ak[], int order, MODEL *model,
                float E, float *snr, int dump, int sim_pf, 
                 int pf, int bass_boost, float beta, float gamma, COMP Aw[]);
  
-int   encode_Wo(float Wo);
-float decode_Wo(int index);
+int   encode_Wo(float Wo, int bits);
+float decode_Wo(int index, int bits);
+int   encode_log_Wo(float Wo, int bits);
+float decode_log_Wo(int index, int bits);
  int   encode_Wo_dt(float Wo, float prev_Wo);
  float decode_Wo_dt(int index, float prev_Wo);
  void  encode_lsps_scalar(int indexes[], float lsp[], int order);
@@ -80,7 +82,7 @@ void decode_lsps_diff_time(float lsp_[],
                            int order);
  
  void encode_lsps_vq(int *indexes, float *x, float *xq, int order);
-void decode_lsps_vq(int *indexes, float *xq, int order);
+void decode_lsps_vq(int *indexes, float *xq, int order, int stages);
  
  long quantise(const float * cb, float vec[], float w[], int k, int m, float *se);
  void lspvq_quantise(float lsp[], float lsp_[], int order); 
@@ -93,8 +95,8 @@ void quantise_WoE(MODEL *model, float *e, float xq[]);
  int  encode_WoE(MODEL *model, float e, float xq[]);
  void decode_WoE(MODEL *model, float *e, float xq[], int n1);
  
-int encode_energy(float e);
-float decode_energy(int index);
+int encode_energy(float e, int bits);
+float decode_energy(int index, int bits);
  
  void pack(unsigned char * bits, unsigned int *nbit, int index, unsigned int index_bits);
  void pack_natural_or_gray(unsigned char * bits, unsigned int *nbit, int index, unsigned int index_bits, unsigned int gray);
author	drowe67 <drowe67@01035d8c-6547-0410-b346-abe4f91aad63>
	Wed, 1 Oct 2014 06:55:54 +0000 (06:55 +0000)
committer	drowe67 <drowe67@01035d8c-6547-0410-b346-abe4f91aad63>
	Wed, 1 Oct 2014 06:55:54 +0000 (06:55 +0000)
codec2-dev/src/c2dec.c		patch \| blob \| history
codec2-dev/src/c2enc.c		patch \| blob \| history
codec2-dev/src/c2sim.c		patch \| blob \| history
codec2-dev/src/codec2.c		patch \| blob \| history
codec2-dev/src/codec2.h		patch \| blob \| history
codec2-dev/src/freedv_api.c		patch \| blob \| history
codec2-dev/src/quantise.c		patch \| blob \| history
codec2-dev/src/quantise.h		patch \| blob \| history