aboutsummaryrefslogtreecommitdiff
path: root/src/c2enc.c
diff options
context:
space:
mode:
authorAuthor Name <[email protected]>2023-07-07 12:20:59 +0930
committerDavid Rowe <[email protected]>2023-07-07 12:29:06 +0930
commitac7c48b4dee99d4c772f133d70d8d1b38262fcd2 (patch)
treea2d0ace57a9c0e2e5b611c4987f6fed1b38b81e7 /src/c2enc.c
shallow zip-file copy from codec2 e9d726bf20
Diffstat (limited to 'src/c2enc.c')
-rw-r--r--src/c2enc.c201
1 files changed, 201 insertions, 0 deletions
diff --git a/src/c2enc.c b/src/c2enc.c
new file mode 100644
index 0000000..f20fc46
--- /dev/null
+++ b/src/c2enc.c
@@ -0,0 +1,201 @@
+/*---------------------------------------------------------------------------*\
+
+ FILE........: c2enc.c
+ AUTHOR......: David Rowe
+ DATE CREATED: 23/8/2010
+
+ Encodes a file of raw speech samples using codec2 and outputs a file
+ of bits.
+
+\*---------------------------------------------------------------------------*/
+
+/*
+ Copyright (C) 2010 David Rowe
+
+ All rights reserved.
+
+ This program is free software; you can redistribute it and/or modify
+ it under the terms of the GNU Lesser General Public License version 2.1, as
+ published by the Free Software Foundation. This program is
+ distributed in the hope that it will be useful, but WITHOUT ANY
+ WARRANTY; without even the implied warranty of MERCHANTABILITY or
+ FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public
+ License for more details.
+
+ You should have received a copy of the GNU Lesser General Public License
+ along with this program; if not, see <http://www.gnu.org/licenses/>.
+*/
+
+#include "codec2.h"
+#include "c2file.h"
+
+#include <stdio.h>
+#include <stdlib.h>
+#include <string.h>
+#include <errno.h>
+#include <math.h>
+
+/* Allocate an array of `count` elements of `size` bytes each, or report the
+ * failure on stderr and exit(1).  calloc() is used so that an overflowing
+ * count*size is rejected rather than silently wrapping. */
+static void *alloc_or_die(size_t count, size_t size, const char *what)
+{
+    void *p = calloc(count, size);
+
+    if (p == NULL && count != 0 && size != 0) {
+        fprintf(stderr, "Error allocating memory for %s\n", what);
+        exit(1);
+    }
+    return p;
+}
+
+/* Write `count` items of `size` bytes to `fp`.  A short write is reported on
+ * stderr (using `name` as the file name) and terminates the program with
+ * exit(1), so a full disk never yields a truncated file with status 0. */
+static void write_or_die(const void *data, size_t size, size_t count,
+                         FILE *fp, const char *name)
+{
+    if (fwrite(data, size, count, fp) != count) {
+        fprintf(stderr, "Error writing output compressed bit file: %s: %s.\n",
+                name, strerror(errno));
+        exit(1);
+    }
+}
+
+/*
+ * c2enc: read frames of raw `short` speech samples from argv[2], encode each
+ * frame with codec2 in the mode named by argv[1], and write the encoded bits
+ * to argv[3].  "-" selects stdin / stdout for the input / output file.
+ *
+ * Output format per frame:
+ *   default       packed bytes, (bits_per_frame + 7) / 8 of them
+ *   --softdec     one float per bit: +1.0 for a 0 bit, -1.0 for a 1 bit
+ *   --bitperchar  one char per bit holding 0 or 1
+ * (if both --softdec and --bitperchar are given, the floats are written
+ * first, then the chars, for every frame).
+ *
+ * Returns 0 on success; exits with status 1 on usage, open, allocation,
+ * read or write errors.
+ */
+int main(int argc, char *argv[])
+{
+    int            mode;
+    void          *codec2;
+    FILE          *fin;
+    FILE          *fout;
+    short         *buf;
+    unsigned char *bits;
+    int            nsam, nbit, nbyte, gray, softdec, bitperchar;
+    float         *unpacked_bits_float;
+    char          *unpacked_bits_char;
+    int            bit, byte, i;
+    int            report_var = 0;
+    int            eq = 0;
+
+    if (argc < 4) {
+        printf("usage: c2enc 3200|2400|1600|1400|1300|1200|700C|450|450PWB InputRawspeechFile OutputBitFile [--natural] [--softdec] [--bitperchar] [--mlfeat f32File modelFile] [--loadcb stageNum Filename] [--var] [--eq]\n");
+        printf("e.g. (headerless) c2enc 1300 ../raw/hts1a.raw hts1a.bin\n");
+        printf("e.g. (with header to detect mode) c2enc 1300 ../raw/hts1a.raw hts1a.c2\n");
+        exit(1);
+    }
+
+    if (strcmp(argv[1], "3200") == 0)
+        mode = CODEC2_MODE_3200;
+    else if (strcmp(argv[1], "2400") == 0)
+        mode = CODEC2_MODE_2400;
+    else if (strcmp(argv[1], "1600") == 0)
+        mode = CODEC2_MODE_1600;
+    else if (strcmp(argv[1], "1400") == 0)
+        mode = CODEC2_MODE_1400;
+    else if (strcmp(argv[1], "1300") == 0)
+        mode = CODEC2_MODE_1300;
+    else if (strcmp(argv[1], "1200") == 0)
+        mode = CODEC2_MODE_1200;
+    else if (strcmp(argv[1], "700C") == 0)
+        mode = CODEC2_MODE_700C;
+    else if (strcmp(argv[1], "450") == 0)
+        mode = CODEC2_MODE_450;
+    else if (strcmp(argv[1], "450PWB") == 0)
+        /* NOTE(review): 450PWB selects the same encoder mode as 450 here;
+         * presumably intentional -- confirm against codec2.h. */
+        mode = CODEC2_MODE_450;
+    else {
+        /* The list below names exactly the modes accepted above. */
+        fprintf(stderr, "Error in mode: %s. Must be 3200, 2400, 1600, 1400, 1300, 1200, 700C, 450 or 450PWB\n", argv[1]);
+        exit(1);
+    }
+
+    if (strcmp(argv[2], "-") == 0) {
+        fin = stdin;
+    } else if ((fin = fopen(argv[2], "rb")) == NULL) {
+        fprintf(stderr, "Error opening input speech file: %s: %s.\n",
+                argv[2], strerror(errno));
+        exit(1);
+    }
+
+    if (strcmp(argv[3], "-") == 0) {
+        fout = stdout;
+    } else if ((fout = fopen(argv[3], "wb")) == NULL) {
+        fprintf(stderr, "Error opening output compressed bit file: %s: %s.\n",
+                argv[3], strerror(errno));
+        exit(1);
+    }
+
+    // Write a header if we're writing to a .c2 file
+    char *ext = strrchr(argv[3], '.');
+    if (ext != NULL && strcmp(ext, ".c2") == 0) {
+        struct c2_header out_hdr;
+        memcpy(out_hdr.magic, c2_file_magic, sizeof(c2_file_magic));
+        out_hdr.mode = mode;
+        out_hdr.version_major = CODEC2_VERSION_MAJOR;
+        out_hdr.version_minor = CODEC2_VERSION_MINOR;
+        // TODO: Handle flags (this block needs to be moved down)
+        out_hdr.flags = 0;
+        write_or_die(&out_hdr, sizeof(out_hdr), 1, fout, argv[3]);
+    }
+
+    codec2 = codec2_create(mode);
+    if (codec2 == NULL) {
+        fprintf(stderr, "Error creating codec2 state for mode: %s\n", argv[1]);
+        exit(1);
+    }
+    nsam = codec2_samples_per_frame(codec2);
+    nbit = codec2_bits_per_frame(codec2);
+    nbyte = (nbit + 7) / 8;   /* bytes needed to hold nbit packed bits */
+
+    buf = alloc_or_die((size_t)nsam, sizeof *buf, "speech sample buffer");
+    bits = alloc_or_die((size_t)nbyte, sizeof *bits, "packed bit buffer");
+    unpacked_bits_float = alloc_or_die((size_t)nbit, sizeof *unpacked_bits_float,
+                                       "soft decision buffer");
+    unpacked_bits_char = alloc_or_die((size_t)nbit, sizeof *unpacked_bits_char,
+                                      "bit-per-char buffer");
+
+    /* Optional arguments.  Unrecognised options are ignored. */
+    gray = 1; softdec = 0; bitperchar = 0;
+    for (i = 4; i < argc; i++) {
+        if (strcmp(argv[i], "--natural") == 0) {
+            gray = 0;
+        } else if (strcmp(argv[i], "--softdec") == 0) {
+            softdec = 1;
+        } else if (strcmp(argv[i], "--bitperchar") == 0) {
+            bitperchar = 1;
+        } else if (strcmp(argv[i], "--mlfeat") == 0) {
+            /* dump machine learning features (700C only) */
+            if (i + 2 >= argc) {
+                /* both operands must exist before argv[i+1], argv[i+2] are read */
+                fprintf(stderr, "Error: --mlfeat requires two arguments: f32File modelFile\n");
+                exit(1);
+            }
+            codec2_open_mlfeat(codec2, argv[i+1], argv[i+2]);
+            i += 2;   /* skip the two operands just consumed */
+        } else if (strcmp(argv[i], "--loadcb") == 0) {
+            /* load VQ stage (700C only) */
+            if (i + 2 >= argc) {
+                fprintf(stderr, "Error: --loadcb requires two arguments: stageNum Filename\n");
+                exit(1);
+            }
+            /* stageNum on the command line is passed on minus one */
+            codec2_load_codebook(codec2, atoi(argv[i+1])-1, argv[i+2]);
+            i += 2;   /* skip the two operands just consumed */
+        } else if (strcmp(argv[i], "--var") == 0) {
+            report_var = 1;
+        } else if (strcmp(argv[i], "--eq") == 0) {
+            eq = 1;
+        }
+    }
+    codec2_set_natural_or_gray(codec2, gray);
+    codec2_700c_eq(codec2, eq);
+
+    /* Encode whole frames only; a trailing partial frame ends the loop
+     * and is not encoded. */
+    while (fread(buf, sizeof(short), nsam, fin) == (size_t)nsam) {
+
+        codec2_encode(codec2, bits, buf);
+
+        if (softdec || bitperchar) {
+            /* unpack bits, MSB first, send as soft decision float */
+
+            bit = 7; byte = 0;
+            for (i = 0; i < nbit; i++) {
+                int b = (bits[byte] >> bit) & 0x1;
+
+                unpacked_bits_float[i] = 1.0 - 2.0*b;   /* 0 -> +1.0, 1 -> -1.0 */
+                unpacked_bits_char[i] = b;
+                bit--;
+                if (bit < 0) {
+                    bit = 7;
+                    byte++;
+                }
+            }
+            if (softdec) {
+                write_or_die(unpacked_bits_float, sizeof(float), nbit, fout, argv[3]);
+            }
+            if (bitperchar) {
+                write_or_die(unpacked_bits_char, sizeof(char), nbit, fout, argv[3]);
+            }
+        } else {
+            write_or_die(bits, sizeof(char), nbyte, fout, argv[3]);
+        }
+
+        // if this is in a pipeline, we probably don't want the usual
+        // buffering to occur
+
+        if (fout == stdout) fflush(stdout);
+    }
+
+    /* fread() stops on error as well as on end of file; tell them apart. */
+    if (ferror(fin)) {
+        fprintf(stderr, "Error reading input speech file: %s: %s.\n",
+                argv[2], strerror(errno));
+        exit(1);
+    }
+
+    if (report_var) {
+        float var = codec2_get_var(codec2);
+        fprintf(stderr, "%s var: %5.2f std: %5.2f\n", argv[2], var, sqrt(var));
+    }
+    codec2_destroy(codec2);
+
+    free(buf);
+    free(bits);
+    free(unpacked_bits_float);
+    free(unpacked_bits_char);
+    fclose(fin);
+
+    /* fclose() flushes buffered output, so a failure here means lost data. */
+    if (fclose(fout) != 0) {
+        fprintf(stderr, "Error closing output compressed bit file: %s: %s.\n",
+                argv[3], strerror(errno));
+        return 1;
+    }
+
+    return 0;
+}