mirror of
https://github.com/mollyim/webrtc.git
synced 2025-05-16 07:10:38 +01:00

Bug: webrtc:9251 Change-Id: I7af3985d337082eea56164357119040383a37074 Reviewed-on: https://webrtc-review.googlesource.com/80483 Reviewed-by: Karl Wiberg <kwiberg@webrtc.org> Commit-Queue: Mirko Bonadei <mbonadei@webrtc.org> Cr-Commit-Position: refs/heads/master@{#23503}
467 lines
14 KiB
C
467 lines
14 KiB
C
/*
|
|
* Copyright (c) 2012 The WebRTC project authors. All Rights Reserved.
|
|
*
|
|
* Use of this source code is governed by a BSD-style license
|
|
* that can be found in the LICENSE file in the root of the source
|
|
* tree. An additional intellectual property rights grant can be found
|
|
* in the file PATENTS. All contributing project authors may
|
|
* be found in the AUTHORS file in the root of the source tree.
|
|
*/
|
|
|
|
/* kenny.c - Main function for the iSAC coder */
|
|
|
|
#include <stdio.h>
|
|
#include <stdlib.h>
|
|
#include <string.h>
|
|
#include <time.h>
|
|
|
|
#ifdef WIN32
|
|
#include "windows.h"
|
|
#ifndef CLOCKS_PER_SEC
|
|
#define CLOCKS_PER_SEC 1000
|
|
#endif
|
|
#endif
|
|
|
|
#include <ctype.h>
|
|
#include <math.h>
|
|
|
|
/* include API */
|
|
#include "modules/audio_coding/codecs/isac/main/include/isac.h"
|
|
#include "modules/audio_coding/codecs/isac/main/util/utility.h"
|
|
#include "rtc_base/format_macros.h"
|
|
|
|
/* max number of samples per frame (= 60 ms frame) */
|
|
#define MAX_FRAMESAMPLES_SWB 1920
|
|
/* number of samples per 10ms frame */
|
|
#define FRAMESAMPLES_SWB_10ms 320
|
|
#define FRAMESAMPLES_WB_10ms 160
|
|
|
|
/* sampling frequency (Hz) */
|
|
#define FS_SWB 32000
|
|
#define FS_WB 16000
|
|
|
|
/* Number of frames processed so far by main(): reset before the processing
 * loop, printed as a progress indicator, and incremented once per packet. */
unsigned long framecnt = 0;
|
|
|
|
int main(int argc, char* argv[]) {
|
|
//--- File IO ----
|
|
FILE* inp;
|
|
FILE* outp;
|
|
char inname[500];
|
|
char outname[500];
|
|
|
|
/* Runtime statistics */
|
|
double rate;
|
|
double rateRCU;
|
|
size_t totalbits = 0;
|
|
unsigned long totalBitsRCU = 0;
|
|
unsigned long totalsmpls = 0;
|
|
|
|
int32_t bottleneck = 39;
|
|
int frameSize = 30; /* ms */
|
|
int16_t codingMode = 1;
|
|
int16_t shortdata[FRAMESAMPLES_SWB_10ms];
|
|
int16_t decoded[MAX_FRAMESAMPLES_SWB];
|
|
int16_t speechType[1];
|
|
int16_t payloadLimit;
|
|
int32_t rateLimit;
|
|
ISACStruct* ISAC_main_inst;
|
|
|
|
size_t stream_len = 0;
|
|
int declen = 0;
|
|
int16_t err;
|
|
int cur_framesmpls;
|
|
int endfile;
|
|
#ifdef WIN32
|
|
double length_file;
|
|
double runtime;
|
|
char outDrive[10];
|
|
char outPath[500];
|
|
char outPrefix[500];
|
|
char outSuffix[500];
|
|
char bitrateFileName[500];
|
|
FILE* bitrateFile;
|
|
double starttime;
|
|
double rateLB = 0;
|
|
double rateUB = 0;
|
|
#endif
|
|
FILE* histFile;
|
|
FILE* averageFile;
|
|
int sampFreqKHz;
|
|
int samplesIn10Ms;
|
|
size_t maxStreamLen = 0;
|
|
char histFileName[500];
|
|
char averageFileName[500];
|
|
unsigned int hist[600];
|
|
double tmpSumStreamLen = 0;
|
|
unsigned int packetCntr = 0;
|
|
unsigned int lostPacketCntr = 0;
|
|
uint8_t payload[1200];
|
|
uint8_t payloadRCU[1200];
|
|
uint16_t packetLossPercent = 0;
|
|
int16_t rcuStreamLen = 0;
|
|
int onlyEncode;
|
|
int onlyDecode;
|
|
|
|
BottleNeckModel packetData;
|
|
packetData.arrival_time = 0;
|
|
packetData.sample_count = 0;
|
|
packetData.rtp_number = 0;
|
|
memset(hist, 0, sizeof(hist));
|
|
|
|
/* handling wrong input arguments in the command line */
|
|
if (argc < 5) {
|
|
int size;
|
|
WebRtcIsac_AssignSize(&size);
|
|
|
|
printf("\n\nWrong number of arguments or flag values.\n\n");
|
|
|
|
printf("Usage:\n\n");
|
|
printf("%s infile outfile -bn bottleneck [options]\n\n", argv[0]);
|
|
printf("with:\n");
|
|
printf("-I.............. indicates encoding in instantaneous mode.\n");
|
|
printf("-bn bottleneck.. the value of the bottleneck in bit/sec, e.g.\n");
|
|
printf(" 39742, in instantaneous (channel-independent)\n");
|
|
printf(" mode.\n\n");
|
|
printf("infile.......... Normal speech input file\n\n");
|
|
printf("outfile......... Speech output file\n\n");
|
|
printf("OPTIONS\n");
|
|
printf("-------\n");
|
|
printf("-fs sampFreq.... sampling frequency of codec 16 or 32 (default)\n");
|
|
printf(" kHz.\n");
|
|
printf("-plim payloadLim payload limit in bytes, default is the maximum\n");
|
|
printf(" possible.\n");
|
|
printf("-rlim rateLim... rate limit in bits/sec, default is the maximum\n");
|
|
printf(" possible.\n");
|
|
printf("-h file......... record histogram and *append* to 'file'.\n");
|
|
printf("-ave file....... record average rate of 3 sec intervales and\n");
|
|
printf(" *append* to 'file'.\n");
|
|
printf("-ploss.......... packet-loss percentage.\n");
|
|
printf("-enc............ do only encoding and store the bit-stream\n");
|
|
printf("-dec............ the input file is a bit-stream, decode it.\n\n");
|
|
printf("Example usage:\n\n");
|
|
printf("%s speechIn.pcm speechOut.pcm -B 40000 -fs 32\n\n", argv[0]);
|
|
printf("structure size %d bytes\n", size);
|
|
|
|
exit(0);
|
|
}
|
|
|
|
/* Get Bottleneck value */
|
|
bottleneck = readParamInt(argc, argv, "-bn", 50000);
|
|
fprintf(stderr, "\nfixed bottleneck rate of %d bits/s\n\n", bottleneck);
|
|
|
|
/* Get Input and Output files */
|
|
sscanf(argv[1], "%s", inname);
|
|
sscanf(argv[2], "%s", outname);
|
|
codingMode = readSwitch(argc, argv, "-I");
|
|
sampFreqKHz = (int16_t)readParamInt(argc, argv, "-fs", 32);
|
|
if (readParamString(argc, argv, "-h", histFileName, 500) > 0) {
|
|
histFile = fopen(histFileName, "a");
|
|
if (histFile == NULL) {
|
|
printf("cannot open hist file %s", histFileName);
|
|
exit(0);
|
|
}
|
|
} else {
|
|
// NO recording of hitstogram
|
|
histFile = NULL;
|
|
}
|
|
|
|
packetLossPercent = readParamInt(argc, argv, "-ploss", 0);
|
|
|
|
if (readParamString(argc, argv, "-ave", averageFileName, 500) > 0) {
|
|
averageFile = fopen(averageFileName, "a");
|
|
if (averageFile == NULL) {
|
|
printf("cannot open file to write rate %s", averageFileName);
|
|
exit(0);
|
|
}
|
|
} else {
|
|
averageFile = NULL;
|
|
}
|
|
|
|
onlyEncode = readSwitch(argc, argv, "-enc");
|
|
onlyDecode = readSwitch(argc, argv, "-dec");
|
|
|
|
switch (sampFreqKHz) {
|
|
case 16: {
|
|
samplesIn10Ms = 160;
|
|
break;
|
|
}
|
|
case 32: {
|
|
samplesIn10Ms = 320;
|
|
break;
|
|
}
|
|
default:
|
|
printf("A sampling frequency of %d kHz is not supported, valid values are"
|
|
" 8 and 16.\n", sampFreqKHz);
|
|
exit(-1);
|
|
}
|
|
payloadLimit = (int16_t)readParamInt(argc, argv, "-plim", 400);
|
|
rateLimit = readParamInt(argc, argv, "-rlim", 106800);
|
|
|
|
if ((inp = fopen(inname, "rb")) == NULL) {
|
|
printf(" iSAC: Cannot read file %s.\n", inname);
|
|
exit(1);
|
|
}
|
|
if ((outp = fopen(outname, "wb")) == NULL) {
|
|
printf(" iSAC: Cannot write file %s.\n", outname);
|
|
exit(1);
|
|
}
|
|
|
|
#ifdef WIN32
|
|
_splitpath(outname, outDrive, outPath, outPrefix, outSuffix);
|
|
_makepath(bitrateFileName, outDrive, outPath, "bitrate", ".txt");
|
|
|
|
bitrateFile = fopen(bitrateFileName, "a");
|
|
fprintf(bitrateFile, "%% %s \n", inname);
|
|
#endif
|
|
|
|
printf("\n");
|
|
printf("Input.................... %s\n", inname);
|
|
printf("Output................... %s\n", outname);
|
|
printf("Encoding Mode............ %s\n",
|
|
(codingMode == 1) ? "Channel-Independent" : "Channel-Adaptive");
|
|
printf("Bottleneck............... %d bits/sec\n", bottleneck);
|
|
printf("Packet-loss Percentage... %d\n", packetLossPercent);
|
|
printf("\n");
|
|
|
|
#ifdef WIN32
|
|
starttime = clock() / (double)CLOCKS_PER_SEC; /* Runtime statistics */
|
|
#endif
|
|
|
|
/* Initialize the ISAC and BN structs */
|
|
err = WebRtcIsac_Create(&ISAC_main_inst);
|
|
|
|
WebRtcIsac_SetEncSampRate(ISAC_main_inst, sampFreqKHz * 1000);
|
|
WebRtcIsac_SetDecSampRate(ISAC_main_inst, sampFreqKHz >= 32 ? 32000 : 16000);
|
|
/* Error check */
|
|
if (err < 0) {
|
|
fprintf(stderr, "\n\n Error in create.\n\n");
|
|
exit(EXIT_FAILURE);
|
|
}
|
|
|
|
framecnt = 0;
|
|
endfile = 0;
|
|
|
|
/* Initialize encoder and decoder */
|
|
if (WebRtcIsac_EncoderInit(ISAC_main_inst, codingMode) < 0) {
|
|
printf("cannot initialize encoder\n");
|
|
return -1;
|
|
}
|
|
WebRtcIsac_DecoderInit(ISAC_main_inst);
|
|
|
|
if (codingMode == 1) {
|
|
if (WebRtcIsac_Control(ISAC_main_inst, bottleneck, frameSize) < 0) {
|
|
printf("cannot set bottleneck\n");
|
|
return -1;
|
|
}
|
|
} else {
|
|
if (WebRtcIsac_ControlBwe(ISAC_main_inst, 15000, 30, 1) < 0) {
|
|
printf("cannot configure BWE\n");
|
|
return -1;
|
|
}
|
|
}
|
|
|
|
if (WebRtcIsac_SetMaxPayloadSize(ISAC_main_inst, payloadLimit) < 0) {
|
|
printf("cannot set maximum payload size %d.\n", payloadLimit);
|
|
return -1;
|
|
}
|
|
|
|
if (rateLimit < 106800) {
|
|
if (WebRtcIsac_SetMaxRate(ISAC_main_inst, rateLimit) < 0) {
|
|
printf("cannot set the maximum rate %d.\n", rateLimit);
|
|
return -1;
|
|
}
|
|
}
|
|
|
|
while (endfile == 0) {
|
|
fprintf(stderr, " \rframe = %7li", framecnt);
|
|
|
|
//============== Readind from the file and encoding =================
|
|
cur_framesmpls = 0;
|
|
stream_len = 0;
|
|
|
|
if (onlyDecode) {
|
|
uint8_t auxUW8;
|
|
if (fread(&auxUW8, sizeof(uint8_t), 1, inp) < 1) {
|
|
break;
|
|
}
|
|
stream_len = auxUW8 << 8;
|
|
if (fread(&auxUW8, sizeof(uint8_t), 1, inp) < 1) {
|
|
break;
|
|
}
|
|
stream_len |= auxUW8;
|
|
if (fread(payload, 1, stream_len, inp) < stream_len) {
|
|
printf("last payload is corrupted\n");
|
|
break;
|
|
}
|
|
} else {
|
|
while (stream_len == 0) {
|
|
int stream_len_int;
|
|
|
|
// Read 10 ms speech block
|
|
endfile = readframe(shortdata, inp, samplesIn10Ms);
|
|
if (endfile) {
|
|
break;
|
|
}
|
|
cur_framesmpls += samplesIn10Ms;
|
|
|
|
//-------- iSAC encoding ---------
|
|
stream_len_int = WebRtcIsac_Encode(ISAC_main_inst, shortdata, payload);
|
|
|
|
if (stream_len_int < 0) {
|
|
// exit if returned with error
|
|
// errType=WebRtcIsac_GetErrorCode(ISAC_main_inst);
|
|
fprintf(stderr, "\nError in encoder\n");
|
|
getc(stdin);
|
|
exit(EXIT_FAILURE);
|
|
}
|
|
stream_len = (size_t)stream_len_int;
|
|
}
|
|
//===================================================================
|
|
if (endfile) {
|
|
break;
|
|
}
|
|
|
|
rcuStreamLen = WebRtcIsac_GetRedPayload(ISAC_main_inst, payloadRCU);
|
|
if (rcuStreamLen < 0) {
|
|
fprintf(stderr, "\nError getting RED payload\n");
|
|
getc(stdin);
|
|
exit(EXIT_FAILURE);
|
|
}
|
|
|
|
get_arrival_time(cur_framesmpls, stream_len, bottleneck, &packetData,
|
|
sampFreqKHz * 1000, sampFreqKHz * 1000);
|
|
if (WebRtcIsac_UpdateBwEstimate(
|
|
ISAC_main_inst, payload, stream_len, packetData.rtp_number,
|
|
packetData.sample_count, packetData.arrival_time) < 0) {
|
|
printf(" BWE Error at client\n");
|
|
return -1;
|
|
}
|
|
}
|
|
|
|
if (endfile) {
|
|
break;
|
|
}
|
|
|
|
maxStreamLen = (stream_len > maxStreamLen) ? stream_len : maxStreamLen;
|
|
packetCntr++;
|
|
|
|
hist[stream_len]++;
|
|
if (averageFile != NULL) {
|
|
tmpSumStreamLen += stream_len;
|
|
if (packetCntr == 100) {
|
|
// kbps
|
|
fprintf(averageFile, "%8.3f ",
|
|
tmpSumStreamLen * 8.0 / (30.0 * packetCntr));
|
|
packetCntr = 0;
|
|
tmpSumStreamLen = 0;
|
|
}
|
|
}
|
|
|
|
if (onlyEncode) {
|
|
uint8_t auxUW8;
|
|
auxUW8 = (uint8_t)(((stream_len & 0x7F00) >> 8) & 0xFF);
|
|
if (fwrite(&auxUW8, sizeof(uint8_t), 1, outp) != 1) {
|
|
return -1;
|
|
}
|
|
|
|
auxUW8 = (uint8_t)(stream_len & 0xFF);
|
|
if (fwrite(&auxUW8, sizeof(uint8_t), 1, outp) != 1) {
|
|
return -1;
|
|
}
|
|
if (fwrite(payload, 1, stream_len, outp) != stream_len) {
|
|
return -1;
|
|
}
|
|
} else {
|
|
//======================= iSAC decoding ===========================
|
|
|
|
if ((rand() % 100) < packetLossPercent) {
|
|
declen = WebRtcIsac_DecodeRcu(ISAC_main_inst, payloadRCU,
|
|
(size_t)rcuStreamLen, decoded,
|
|
speechType);
|
|
lostPacketCntr++;
|
|
} else {
|
|
declen = WebRtcIsac_Decode(ISAC_main_inst, payload, stream_len, decoded,
|
|
speechType);
|
|
}
|
|
if (declen <= 0) {
|
|
// errType=WebRtcIsac_GetErrorCode(ISAC_main_inst);
|
|
fprintf(stderr, "\nError in decoder.\n");
|
|
getc(stdin);
|
|
exit(1);
|
|
}
|
|
|
|
// Write decoded speech frame to file
|
|
if (fwrite(decoded, sizeof(int16_t), declen, outp) != (size_t)declen) {
|
|
return -1;
|
|
}
|
|
cur_framesmpls = declen;
|
|
}
|
|
// Update Statistics
|
|
framecnt++;
|
|
totalsmpls += cur_framesmpls;
|
|
if (stream_len > 0) {
|
|
totalbits += 8 * stream_len;
|
|
}
|
|
if (rcuStreamLen > 0) {
|
|
totalBitsRCU += 8 * rcuStreamLen;
|
|
}
|
|
}
|
|
|
|
rate = ((double)totalbits * (sampFreqKHz)) / (double)totalsmpls;
|
|
rateRCU = ((double)totalBitsRCU * (sampFreqKHz)) / (double)totalsmpls;
|
|
|
|
printf("\n\n");
|
|
printf("Sampling Rate............... %d kHz\n", sampFreqKHz);
|
|
printf("Payload Limit............... %d bytes \n", payloadLimit);
|
|
printf("Rate Limit.................. %d bits/sec \n", rateLimit);
|
|
|
|
#ifdef WIN32
|
|
fprintf(bitrateFile, "%d %10lu %d %6.3f %6.3f %6.3f\n",
|
|
sampFreqKHz, framecnt, bottleneck, rateLB, rateUB, rate);
|
|
fclose(bitrateFile);
|
|
#endif // WIN32
|
|
|
|
printf("\n");
|
|
printf("Measured bit-rate........... %0.3f kbps\n", rate);
|
|
printf("Measured RCU bit-ratre...... %0.3f kbps\n", rateRCU);
|
|
printf("Maximum bit-rate/payloadsize %0.3f / %" PRIuS "\n",
|
|
maxStreamLen * 8 / 0.03, maxStreamLen);
|
|
printf("Measured packet-loss........ %0.1f%% \n",
|
|
100.0f * (float)lostPacketCntr / (float)packetCntr);
|
|
|
|
printf("\n");
|
|
|
|
/* Runtime statistics */
|
|
#ifdef WIN32
|
|
runtime = (double)(clock() / (double)CLOCKS_PER_SEC - starttime);
|
|
length_file = ((double)framecnt * (double)declen / (sampFreqKHz * 1000));
|
|
printf("Length of speech file....... %.1f s\n", length_file);
|
|
printf("Time to run iSAC............ %.2f s (%.2f %% of realtime)\n\n",
|
|
runtime, (100 * runtime / length_file));
|
|
#endif
|
|
printf("\n\n_______________________________________________\n");
|
|
|
|
if (histFile != NULL) {
|
|
int n;
|
|
for (n = 0; n < 600; n++) {
|
|
fprintf(histFile, "%6d ", hist[n]);
|
|
}
|
|
fprintf(histFile, "\n");
|
|
fclose(histFile);
|
|
}
|
|
if (averageFile != NULL) {
|
|
if (packetCntr > 0) {
|
|
fprintf(averageFile, "%8.3f ",
|
|
tmpSumStreamLen * 8.0 / (30.0 * packetCntr));
|
|
}
|
|
fprintf(averageFile, "\n");
|
|
fclose(averageFile);
|
|
}
|
|
|
|
fclose(inp);
|
|
fclose(outp);
|
|
|
|
WebRtcIsac_Free(ISAC_main_inst);
|
|
|
|
exit(0);
|
|
}
|