codec2/src/c2enc.c

208 lines
5.8 KiB
C

/*---------------------------------------------------------------------------*\
FILE........: c2enc.c
AUTHOR......: David Rowe
DATE CREATED: 23/8/2010
Encodes a file of raw speech samples using codec2 and outputs a file
of bits.
\*---------------------------------------------------------------------------*/
/*
Copyright (C) 2010 David Rowe
All rights reserved.
This program is free software; you can redistribute it and/or modify
it under the terms of the GNU Lesser General Public License version 2.1, as
published by the Free Software Foundation. This program is
distributed in the hope that it will be useful, but WITHOUT ANY
WARRANTY; without even the implied warranty of MERCHANTABILITY or
FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public
License for more details.
You should have received a copy of the GNU Lesser General Public License
along with this program; if not, see <http://www.gnu.org/licenses/>.
*/
#include <errno.h>
#include <math.h>
#include <stdio.h>
#include <stdlib.h>
#include <string.h>
#include "c2file.h"
#include "codec2.h"
int main(int argc, char *argv[]) {
int mode;
void *codec2;
FILE *fin;
FILE *fout;
short *buf;
unsigned char *bits;
int nsam, nbit, nbyte, gray, softdec, bitperchar;
float *unpacked_bits_float;
char *unpacked_bits_char;
int bit, byte, i;
int report_var = 0;
int eq = 0;
if (argc < 4) {
printf(
"usage: c2enc 3200|2400|1600|1400|1300|1200|700C "
"InputRawspeechFile OutputBitFile [--natural] [--softdec] "
"[--bitperchar] [--mlfeat f32File modelFile] [--loadcb stageNum "
"Filename] [--var] [--eq]\n");
printf("e.g. (headerless) c2enc 1300 ../raw/hts1a.raw hts1a.bin\n");
printf(
"e.g. (with header to detect mode) c2enc 1300 ../raw/hts1a.raw "
"hts1a.c2\n");
exit(1);
}
if (strcmp(argv[1], "3200") == 0)
mode = CODEC2_MODE_3200;
else if (strcmp(argv[1], "2400") == 0)
mode = CODEC2_MODE_2400;
else if (strcmp(argv[1], "1600") == 0)
mode = CODEC2_MODE_1600;
else if (strcmp(argv[1], "1400") == 0)
mode = CODEC2_MODE_1400;
else if (strcmp(argv[1], "1300") == 0)
mode = CODEC2_MODE_1300;
else if (strcmp(argv[1], "1200") == 0)
mode = CODEC2_MODE_1200;
else if (strcmp(argv[1], "700C") == 0)
mode = CODEC2_MODE_700C;
else {
fprintf(stderr,
"Error in mode: %s. Must be 3200, 2400, 1600, 1400, 1300, 1200, "
"700C\n",
argv[1]);
exit(1);
}
if (strcmp(argv[2], "-") == 0)
fin = stdin;
else if ((fin = fopen(argv[2], "rb")) == NULL) {
fprintf(stderr, "Error opening input speech file: %s: %s.\n", argv[2],
strerror(errno));
exit(1);
}
if (strcmp(argv[3], "-") == 0)
fout = stdout;
else if ((fout = fopen(argv[3], "wb")) == NULL) {
fprintf(stderr, "Error opening output compressed bit file: %s: %s.\n",
argv[3], strerror(errno));
exit(1);
}
// Write a header if we're writing to a .c2 file
char *ext = strrchr(argv[3], '.');
if (ext != NULL) {
if (strcmp(ext, ".c2") == 0) {
struct c2_header out_hdr;
memcpy(out_hdr.magic, c2_file_magic, sizeof(c2_file_magic));
out_hdr.mode = mode;
out_hdr.version_major = CODEC2_VERSION_MAJOR;
out_hdr.version_minor = CODEC2_VERSION_MINOR;
// TODO: Handle flags (this block needs to be moved down)
out_hdr.flags = 0;
fwrite(&out_hdr, sizeof(out_hdr), 1, fout);
};
};
codec2 = codec2_create(mode);
nsam = codec2_samples_per_frame(codec2);
nbit = codec2_bits_per_frame(codec2);
buf = (short *)malloc(nsam * sizeof(short));
nbyte = (nbit + 7) / 8;
bits = (unsigned char *)malloc(nbyte * sizeof(char));
unpacked_bits_float = (float *)malloc(nbit * sizeof(float));
unpacked_bits_char = (char *)malloc(nbit * sizeof(char));
gray = 1;
softdec = 0;
bitperchar = 0;
for (i = 4; i < argc; i++) {
if (strcmp(argv[i], "--natural") == 0) {
gray = 0;
}
if (strcmp(argv[i], "--softdec") == 0) {
softdec = 1;
}
if (strcmp(argv[i], "--bitperchar") == 0) {
bitperchar = 1;
}
if (strcmp(argv[i], "--mlfeat") == 0) {
/* dump machine learning features (700C only) */
codec2_open_mlfeat(codec2, argv[i + 1], argv[i + 2]);
}
if (strcmp(argv[i], "--loadcb") == 0) {
/* load VQ stage (700C only) */
codec2_load_codebook(codec2, atoi(argv[i + 1]) - 1, argv[i + 2]);
}
if (strcmp(argv[i], "--var") == 0) {
report_var = 1;
}
if (strcmp(argv[i], "--eq") == 0) {
eq = 1;
}
}
codec2_set_natural_or_gray(codec2, gray);
codec2_700c_eq(codec2, eq);
// fprintf(stderr,"gray: %d softdec: %d\n", gray, softdec);
while (fread(buf, sizeof(short), nsam, fin) == (size_t)nsam) {
codec2_encode(codec2, bits, buf);
if (softdec || bitperchar) {
/* unpack bits, MSB first, send as soft decision float */
bit = 7;
byte = 0;
for (i = 0; i < nbit; i++) {
unpacked_bits_float[i] = 1.0 - 2.0 * ((bits[byte] >> bit) & 0x1);
unpacked_bits_char[i] = (bits[byte] >> bit) & 0x1;
bit--;
if (bit < 0) {
bit = 7;
byte++;
}
}
if (softdec) {
fwrite(unpacked_bits_float, sizeof(float), nbit, fout);
}
if (bitperchar) {
fwrite(unpacked_bits_char, sizeof(char), nbit, fout);
}
} else
fwrite(bits, sizeof(char), nbyte, fout);
// if this is in a pipeline, we probably don't want the usual
// buffering to occur
if (fout == stdout) fflush(stdout);
}
if (report_var) {
float var = codec2_get_var(codec2);
fprintf(stderr, "%s var: %5.2f std: %5.2f\n", argv[2], var, sqrt(var));
}
codec2_destroy(codec2);
free(buf);
free(bits);
free(unpacked_bits_float);
free(unpacked_bits_char);
fclose(fin);
fclose(fout);
return 0;
}