/*---------------------------------------------------------------------------*\ FILE........: c2enc.c AUTHOR......: David Rowe DATE CREATED: 23/8/2010 Encodes a file of raw speech samples using codec2 and outputs a file of bits. \*---------------------------------------------------------------------------*/ /* Copyright (C) 2010 David Rowe All rights reserved. This program is free software; you can redistribute it and/or modify it under the terms of the GNU Lesser General Public License version 2.1, as published by the Free Software Foundation. This program is distributed in the hope that it will be useful, but WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for more details. You should have received a copy of the GNU Lesser General Public License along with this program; if not, see . */ #include #include #include #include #include #include "c2file.h" #include "codec2.h" int main(int argc, char *argv[]) { int mode; void *codec2; FILE *fin; FILE *fout; short *buf; unsigned char *bits; int nsam, nbit, nbyte, gray, softdec, bitperchar; float *unpacked_bits_float; char *unpacked_bits_char; int bit, byte, i; int report_var = 0; int eq = 0; if (argc < 4) { printf( "usage: c2enc 3200|2400|1600|1400|1300|1200|700C|450|450PWB " "InputRawspeechFile OutputBitFile [--natural] [--softdec] " "[--bitperchar] [--mlfeat f32File modelFile] [--loadcb stageNum " "Filename] [--var] [--eq]\n"); printf("e.g. (headerless) c2enc 1300 ../raw/hts1a.raw hts1a.bin\n"); printf( "e.g. (with header to detect mode) c2enc 1300 ../raw/hts1a.raw " "hts1a.c2\n"); exit(1); } if (strcmp(argv[1], "3200") == 0) mode = CODEC2_MODE_3200; else if (strcmp(argv[1], "2400") == 0) mode = CODEC2_MODE_2400; else if (strcmp(argv[1], "1600") == 0) mode = CODEC2_MODE_1600; else if (strcmp(argv[1], "1400") == 0) mode = CODEC2_MODE_1400; else if (strcmp(argv[1], "1300") == 0) mode = CODEC2_MODE_1300; else if (strcmp(argv[1], "1200") == 0) mode = CODEC2_MODE_1200; else if (strcmp(argv[1], "700C") == 0) mode = CODEC2_MODE_700C; else if (strcmp(argv[1], "450") == 0) mode = CODEC2_MODE_450; else if (strcmp(argv[1], "450PWB") == 0) mode = CODEC2_MODE_450; else { fprintf(stderr, "Error in mode: %s. Must be 3200, 2400, 1600, 1400, 1300, 1200, " "700C, 450, 450PWB or WB\n", argv[1]); exit(1); } if (strcmp(argv[2], "-") == 0) fin = stdin; else if ((fin = fopen(argv[2], "rb")) == NULL) { fprintf(stderr, "Error opening input speech file: %s: %s.\n", argv[2], strerror(errno)); exit(1); } if (strcmp(argv[3], "-") == 0) fout = stdout; else if ((fout = fopen(argv[3], "wb")) == NULL) { fprintf(stderr, "Error opening output compressed bit file: %s: %s.\n", argv[3], strerror(errno)); exit(1); } // Write a header if we're writing to a .c2 file char *ext = strrchr(argv[3], '.'); if (ext != NULL) { if (strcmp(ext, ".c2") == 0) { struct c2_header out_hdr; memcpy(out_hdr.magic, c2_file_magic, sizeof(c2_file_magic)); out_hdr.mode = mode; out_hdr.version_major = CODEC2_VERSION_MAJOR; out_hdr.version_minor = CODEC2_VERSION_MINOR; // TODO: Handle flags (this block needs to be moved down) out_hdr.flags = 0; fwrite(&out_hdr, sizeof(out_hdr), 1, fout); }; }; codec2 = codec2_create(mode); nsam = codec2_samples_per_frame(codec2); nbit = codec2_bits_per_frame(codec2); buf = (short *)malloc(nsam * sizeof(short)); nbyte = (nbit + 7) / 8; bits = (unsigned char *)malloc(nbyte * sizeof(char)); unpacked_bits_float = (float *)malloc(nbit * sizeof(float)); unpacked_bits_char = (char *)malloc(nbit * sizeof(char)); gray = 1; softdec = 0; bitperchar = 0; for (i = 4; i < argc; i++) { if (strcmp(argv[i], "--natural") == 0) { gray = 0; } if (strcmp(argv[i], "--softdec") == 0) { softdec = 1; } if (strcmp(argv[i], "--bitperchar") == 0) { bitperchar = 1; } if (strcmp(argv[i], "--mlfeat") == 0) { /* dump machine learning features (700C only) */ codec2_open_mlfeat(codec2, argv[i + 1], argv[i + 2]); } if (strcmp(argv[i], "--loadcb") == 0) { /* load VQ stage (700C only) */ codec2_load_codebook(codec2, atoi(argv[i + 1]) - 1, argv[i + 2]); } if (strcmp(argv[i], "--var") == 0) { report_var = 1; } if (strcmp(argv[i], "--eq") == 0) { eq = 1; } } codec2_set_natural_or_gray(codec2, gray); codec2_700c_eq(codec2, eq); // fprintf(stderr,"gray: %d softdec: %d\n", gray, softdec); while (fread(buf, sizeof(short), nsam, fin) == (size_t)nsam) { codec2_encode(codec2, bits, buf); if (softdec || bitperchar) { /* unpack bits, MSB first, send as soft decision float */ bit = 7; byte = 0; for (i = 0; i < nbit; i++) { unpacked_bits_float[i] = 1.0 - 2.0 * ((bits[byte] >> bit) & 0x1); unpacked_bits_char[i] = (bits[byte] >> bit) & 0x1; bit--; if (bit < 0) { bit = 7; byte++; } } if (softdec) { fwrite(unpacked_bits_float, sizeof(float), nbit, fout); } if (bitperchar) { fwrite(unpacked_bits_char, sizeof(char), nbit, fout); } } else fwrite(bits, sizeof(char), nbyte, fout); // if this is in a pipeline, we probably don't want the usual // buffering to occur if (fout == stdout) fflush(stdout); } if (report_var) { float var = codec2_get_var(codec2); fprintf(stderr, "%s var: %5.2f std: %5.2f\n", argv[2], var, sqrt(var)); } codec2_destroy(codec2); free(buf); free(bits); free(unpacked_bits_float); free(unpacked_bits_char); fclose(fin); fclose(fout); return 0; }