blob: 4b48b5033a53ec13c0fcded40291ad41b1b87631 [file] [log] [blame]
/*
* Copyright (c) 2012 The WebRTC project authors. All Rights Reserved.
*
* Use of this source code is governed by a BSD-style license
* that can be found in the LICENSE file in the root of the source
* tree. An additional intellectual property rights grant can be found
* in the file PATENTS. All contributing project authors may
* be found in the AUTHORS file in the root of the source tree.
*/
/* kenny.c - Main function for the iSAC coder */
#include <stdio.h>
#include <stdlib.h>
#include <string.h>
#include <time.h>
#ifdef WIN32
#include "windows.h"
#ifndef CLOCKS_PER_SEC
#define CLOCKS_PER_SEC 1000
#endif
#endif
#include <ctype.h>
#include <math.h>
/* include API */
#include "modules/audio_coding/codecs/isac/main/include/isac.h"
#include "modules/audio_coding/codecs/isac/main/util/utility.h"
#include "rtc_base/format_macros.h"
/* max number of samples per frame (= 60 ms frame) */
#define MAX_FRAMESAMPLES_SWB 1920
/* number of samples per 10ms frame */
#define FRAMESAMPLES_SWB_10ms 320
#define FRAMESAMPLES_WB_10ms 160
/* sampling frequency (Hz) */
#define FS_SWB 32000
#define FS_WB 16000
unsigned long framecnt = 0;
int main(int argc, char* argv[]) {
//--- File IO ----
FILE* inp;
FILE* outp;
char inname[500];
char outname[500];
/* Runtime statistics */
double rate;
double rateRCU;
size_t totalbits = 0;
unsigned long totalBitsRCU = 0;
unsigned long totalsmpls = 0;
int32_t bottleneck = 39;
int frameSize = 30; /* ms */
int16_t codingMode = 1;
int16_t shortdata[FRAMESAMPLES_SWB_10ms];
int16_t decoded[MAX_FRAMESAMPLES_SWB];
int16_t speechType[1];
int16_t payloadLimit;
int32_t rateLimit;
ISACStruct* ISAC_main_inst;
size_t stream_len = 0;
int declen = 0;
int16_t err;
int cur_framesmpls;
int endfile;
#ifdef WIN32
double length_file;
double runtime;
char outDrive[10];
char outPath[500];
char outPrefix[500];
char outSuffix[500];
char bitrateFileName[500];
FILE* bitrateFile;
double starttime;
double rateLB = 0;
double rateUB = 0;
#endif
FILE* histFile;
FILE* averageFile;
int sampFreqKHz;
int samplesIn10Ms;
size_t maxStreamLen = 0;
char histFileName[500];
char averageFileName[500];
unsigned int hist[600];
double tmpSumStreamLen = 0;
unsigned int packetCntr = 0;
unsigned int lostPacketCntr = 0;
uint8_t payload[1200];
uint8_t payloadRCU[1200];
uint16_t packetLossPercent = 0;
int16_t rcuStreamLen = 0;
int onlyEncode;
int onlyDecode;
BottleNeckModel packetData;
packetData.arrival_time = 0;
packetData.sample_count = 0;
packetData.rtp_number = 0;
memset(hist, 0, sizeof(hist));
/* handling wrong input arguments in the command line */
if (argc < 5) {
int size;
WebRtcIsac_AssignSize(&size);
printf("\n\nWrong number of arguments or flag values.\n\n");
printf("Usage:\n\n");
printf("%s infile outfile -bn bottleneck [options]\n\n", argv[0]);
printf("with:\n");
printf("-I.............. indicates encoding in instantaneous mode.\n");
printf("-bn bottleneck.. the value of the bottleneck in bit/sec, e.g.\n");
printf(" 39742, in instantaneous (channel-independent)\n");
printf(" mode.\n\n");
printf("infile.......... Normal speech input file\n\n");
printf("outfile......... Speech output file\n\n");
printf("OPTIONS\n");
printf("-------\n");
printf("-fs sampFreq.... sampling frequency of codec 16 or 32 (default)\n");
printf(" kHz.\n");
printf("-plim payloadLim payload limit in bytes, default is the maximum\n");
printf(" possible.\n");
printf("-rlim rateLim... rate limit in bits/sec, default is the maximum\n");
printf(" possible.\n");
printf("-h file......... record histogram and *append* to 'file'.\n");
printf("-ave file....... record average rate of 3 sec intervales and\n");
printf(" *append* to 'file'.\n");
printf("-ploss.......... packet-loss percentage.\n");
printf("-enc............ do only encoding and store the bit-stream\n");
printf("-dec............ the input file is a bit-stream, decode it.\n\n");
printf("Example usage:\n\n");
printf("%s speechIn.pcm speechOut.pcm -B 40000 -fs 32\n\n", argv[0]);
printf("structure size %d bytes\n", size);
exit(0);
}
/* Get Bottleneck value */
bottleneck = readParamInt(argc, argv, "-bn", 50000);
fprintf(stderr, "\nfixed bottleneck rate of %d bits/s\n\n", bottleneck);
/* Get Input and Output files */
sscanf(argv[1], "%s", inname);
sscanf(argv[2], "%s", outname);
codingMode = readSwitch(argc, argv, "-I");
sampFreqKHz = (int16_t)readParamInt(argc, argv, "-fs", 32);
if (readParamString(argc, argv, "-h", histFileName, 500) > 0) {
histFile = fopen(histFileName, "a");
if (histFile == NULL) {
printf("cannot open hist file %s", histFileName);
exit(0);
}
} else {
// NO recording of hitstogram
histFile = NULL;
}
packetLossPercent = readParamInt(argc, argv, "-ploss", 0);
if (readParamString(argc, argv, "-ave", averageFileName, 500) > 0) {
averageFile = fopen(averageFileName, "a");
if (averageFile == NULL) {
printf("cannot open file to write rate %s", averageFileName);
exit(0);
}
} else {
averageFile = NULL;
}
onlyEncode = readSwitch(argc, argv, "-enc");
onlyDecode = readSwitch(argc, argv, "-dec");
switch (sampFreqKHz) {
case 16: {
samplesIn10Ms = 160;
break;
}
case 32: {
samplesIn10Ms = 320;
break;
}
default:
printf("A sampling frequency of %d kHz is not supported, valid values are"
" 8 and 16.\n", sampFreqKHz);
exit(-1);
}
payloadLimit = (int16_t)readParamInt(argc, argv, "-plim", 400);
rateLimit = readParamInt(argc, argv, "-rlim", 106800);
if ((inp = fopen(inname, "rb")) == NULL) {
printf(" iSAC: Cannot read file %s.\n", inname);
exit(1);
}
if ((outp = fopen(outname, "wb")) == NULL) {
printf(" iSAC: Cannot write file %s.\n", outname);
exit(1);
}
#ifdef WIN32
_splitpath(outname, outDrive, outPath, outPrefix, outSuffix);
_makepath(bitrateFileName, outDrive, outPath, "bitrate", ".txt");
bitrateFile = fopen(bitrateFileName, "a");
fprintf(bitrateFile, "%% %s \n", inname);
#endif
printf("\n");
printf("Input.................... %s\n", inname);
printf("Output................... %s\n", outname);
printf("Encoding Mode............ %s\n",
(codingMode == 1) ? "Channel-Independent" : "Channel-Adaptive");
printf("Bottleneck............... %d bits/sec\n", bottleneck);
printf("Packet-loss Percentage... %d\n", packetLossPercent);
printf("\n");
#ifdef WIN32
starttime = clock() / (double)CLOCKS_PER_SEC; /* Runtime statistics */
#endif
/* Initialize the ISAC and BN structs */
err = WebRtcIsac_Create(&ISAC_main_inst);
WebRtcIsac_SetEncSampRate(ISAC_main_inst, sampFreqKHz * 1000);
WebRtcIsac_SetDecSampRate(ISAC_main_inst, sampFreqKHz >= 32 ? 32000 : 16000);
/* Error check */
if (err < 0) {
fprintf(stderr, "\n\n Error in create.\n\n");
exit(EXIT_FAILURE);
}
framecnt = 0;
endfile = 0;
/* Initialize encoder and decoder */
if (WebRtcIsac_EncoderInit(ISAC_main_inst, codingMode) < 0) {
printf("cannot initialize encoder\n");
return -1;
}
WebRtcIsac_DecoderInit(ISAC_main_inst);
if (codingMode == 1) {
if (WebRtcIsac_Control(ISAC_main_inst, bottleneck, frameSize) < 0) {
printf("cannot set bottleneck\n");
return -1;
}
} else {
if (WebRtcIsac_ControlBwe(ISAC_main_inst, 15000, 30, 1) < 0) {
printf("cannot configure BWE\n");
return -1;
}
}
if (WebRtcIsac_SetMaxPayloadSize(ISAC_main_inst, payloadLimit) < 0) {
printf("cannot set maximum payload size %d.\n", payloadLimit);
return -1;
}
if (rateLimit < 106800) {
if (WebRtcIsac_SetMaxRate(ISAC_main_inst, rateLimit) < 0) {
printf("cannot set the maximum rate %d.\n", rateLimit);
return -1;
}
}
while (endfile == 0) {
fprintf(stderr, " \rframe = %7li", framecnt);
//============== Readind from the file and encoding =================
cur_framesmpls = 0;
stream_len = 0;
if (onlyDecode) {
uint8_t auxUW8;
if (fread(&auxUW8, sizeof(uint8_t), 1, inp) < 1) {
break;
}
stream_len = auxUW8 << 8;
if (fread(&auxUW8, sizeof(uint8_t), 1, inp) < 1) {
break;
}
stream_len |= auxUW8;
if (fread(payload, 1, stream_len, inp) < stream_len) {
printf("last payload is corrupted\n");
break;
}
} else {
while (stream_len == 0) {
int stream_len_int;
// Read 10 ms speech block
endfile = readframe(shortdata, inp, samplesIn10Ms);
if (endfile) {
break;
}
cur_framesmpls += samplesIn10Ms;
//-------- iSAC encoding ---------
stream_len_int = WebRtcIsac_Encode(ISAC_main_inst, shortdata, payload);
if (stream_len_int < 0) {
// exit if returned with error
// errType=WebRtcIsac_GetErrorCode(ISAC_main_inst);
fprintf(stderr, "\nError in encoder\n");
getc(stdin);
exit(EXIT_FAILURE);
}
stream_len = (size_t)stream_len_int;
}
//===================================================================
if (endfile) {
break;
}
rcuStreamLen = WebRtcIsac_GetRedPayload(ISAC_main_inst, payloadRCU);
if (rcuStreamLen < 0) {
fprintf(stderr, "\nError getting RED payload\n");
getc(stdin);
exit(EXIT_FAILURE);
}
get_arrival_time(cur_framesmpls, stream_len, bottleneck, &packetData,
sampFreqKHz * 1000, sampFreqKHz * 1000);
if (WebRtcIsac_UpdateBwEstimate(
ISAC_main_inst, payload, stream_len, packetData.rtp_number,
packetData.sample_count, packetData.arrival_time) < 0) {
printf(" BWE Error at client\n");
return -1;
}
}
if (endfile) {
break;
}
maxStreamLen = (stream_len > maxStreamLen) ? stream_len : maxStreamLen;
packetCntr++;
hist[stream_len]++;
if (averageFile != NULL) {
tmpSumStreamLen += stream_len;
if (packetCntr == 100) {
// kbps
fprintf(averageFile, "%8.3f ",
tmpSumStreamLen * 8.0 / (30.0 * packetCntr));
packetCntr = 0;
tmpSumStreamLen = 0;
}
}
if (onlyEncode) {
uint8_t auxUW8;
auxUW8 = (uint8_t)(((stream_len & 0x7F00) >> 8) & 0xFF);
if (fwrite(&auxUW8, sizeof(uint8_t), 1, outp) != 1) {
return -1;
}
auxUW8 = (uint8_t)(stream_len & 0xFF);
if (fwrite(&auxUW8, sizeof(uint8_t), 1, outp) != 1) {
return -1;
}
if (fwrite(payload, 1, stream_len, outp) != stream_len) {
return -1;
}
} else {
//======================= iSAC decoding ===========================
if ((rand() % 100) < packetLossPercent) {
declen = WebRtcIsac_DecodeRcu(ISAC_main_inst, payloadRCU,
(size_t)rcuStreamLen, decoded,
speechType);
lostPacketCntr++;
} else {
declen = WebRtcIsac_Decode(ISAC_main_inst, payload, stream_len, decoded,
speechType);
}
if (declen <= 0) {
// errType=WebRtcIsac_GetErrorCode(ISAC_main_inst);
fprintf(stderr, "\nError in decoder.\n");
getc(stdin);
exit(1);
}
// Write decoded speech frame to file
if (fwrite(decoded, sizeof(int16_t), declen, outp) != (size_t)declen) {
return -1;
}
cur_framesmpls = declen;
}
// Update Statistics
framecnt++;
totalsmpls += cur_framesmpls;
if (stream_len > 0) {
totalbits += 8 * stream_len;
}
if (rcuStreamLen > 0) {
totalBitsRCU += 8 * rcuStreamLen;
}
}
rate = ((double)totalbits * (sampFreqKHz)) / (double)totalsmpls;
rateRCU = ((double)totalBitsRCU * (sampFreqKHz)) / (double)totalsmpls;
printf("\n\n");
printf("Sampling Rate............... %d kHz\n", sampFreqKHz);
printf("Payload Limit............... %d bytes \n", payloadLimit);
printf("Rate Limit.................. %d bits/sec \n", rateLimit);
#ifdef WIN32
fprintf(bitrateFile, "%d %10lu %d %6.3f %6.3f %6.3f\n",
sampFreqKHz, framecnt, bottleneck, rateLB, rateUB, rate);
fclose(bitrateFile);
#endif // WIN32
printf("\n");
printf("Measured bit-rate........... %0.3f kbps\n", rate);
printf("Measured RCU bit-ratre...... %0.3f kbps\n", rateRCU);
printf("Maximum bit-rate/payloadsize %0.3f / %" PRIuS "\n",
maxStreamLen * 8 / 0.03, maxStreamLen);
printf("Measured packet-loss........ %0.1f%% \n",
100.0f * (float)lostPacketCntr / (float)packetCntr);
printf("\n");
/* Runtime statistics */
#ifdef WIN32
runtime = (double)(clock() / (double)CLOCKS_PER_SEC - starttime);
length_file = ((double)framecnt * (double)declen / (sampFreqKHz * 1000));
printf("Length of speech file....... %.1f s\n", length_file);
printf("Time to run iSAC............ %.2f s (%.2f %% of realtime)\n\n",
runtime, (100 * runtime / length_file));
#endif
printf("\n\n_______________________________________________\n");
if (histFile != NULL) {
int n;
for (n = 0; n < 600; n++) {
fprintf(histFile, "%6d ", hist[n]);
}
fprintf(histFile, "\n");
fclose(histFile);
}
if (averageFile != NULL) {
if (packetCntr > 0) {
fprintf(averageFile, "%8.3f ",
tmpSumStreamLen * 8.0 / (30.0 * packetCntr));
}
fprintf(averageFile, "\n");
fclose(averageFile);
}
fclose(inp);
fclose(outp);
WebRtcIsac_Free(ISAC_main_inst);
exit(0);
}