| /* |
| * Copyright (c) 2012 The WebRTC project authors. All Rights Reserved. |
| * |
| * Use of this source code is governed by a BSD-style license |
| * that can be found in the LICENSE file in the root of the source |
| * tree. An additional intellectual property rights grant can be found |
| * in the file PATENTS. All contributing project authors may |
| * be found in the AUTHORS file in the root of the source tree. |
| */ |
| |
| /* |
| * structs.h |
| * |
| * This header file contains all the structs used in the ISAC codec |
| * |
| */ |
| |
| #ifndef MODULES_AUDIO_CODING_CODECS_ISAC_MAIN_SOURCE_STRUCTS_H_ |
| #define MODULES_AUDIO_CODING_CODECS_ISAC_MAIN_SOURCE_STRUCTS_H_ |
| |
| #include "modules/audio_coding/codecs/isac/bandwidth_info.h" |
| #include "modules/audio_coding/codecs/isac/main/source/settings.h" |
| #include "modules/third_party/fft/fft.h" |
| |
| typedef struct Bitstreamstruct { |
| uint8_t stream[STREAM_SIZE_MAX]; |
| uint32_t W_upper; |
| uint32_t streamval; |
| uint32_t stream_index; |
| |
| } Bitstr; |
| |
| typedef struct { |
| double DataBufferLo[WINLEN]; |
| double DataBufferHi[WINLEN]; |
| |
| double CorrBufLo[ORDERLO + 1]; |
| double CorrBufHi[ORDERHI + 1]; |
| |
| float PreStateLoF[ORDERLO + 1]; |
| float PreStateLoG[ORDERLO + 1]; |
| float PreStateHiF[ORDERHI + 1]; |
| float PreStateHiG[ORDERHI + 1]; |
| float PostStateLoF[ORDERLO + 1]; |
| float PostStateLoG[ORDERLO + 1]; |
| float PostStateHiF[ORDERHI + 1]; |
| float PostStateHiG[ORDERHI + 1]; |
| |
| double OldEnergy; |
| |
| } MaskFiltstr; |
| |
| typedef struct { |
| // state vectors for each of the two analysis filters |
| double INSTAT1[2 * (QORDER - 1)]; |
| double INSTAT2[2 * (QORDER - 1)]; |
| double INSTATLA1[2 * (QORDER - 1)]; |
| double INSTATLA2[2 * (QORDER - 1)]; |
| double INLABUF1[QLOOKAHEAD]; |
| double INLABUF2[QLOOKAHEAD]; |
| |
| float INSTAT1_float[2 * (QORDER - 1)]; |
| float INSTAT2_float[2 * (QORDER - 1)]; |
| float INSTATLA1_float[2 * (QORDER - 1)]; |
| float INSTATLA2_float[2 * (QORDER - 1)]; |
| float INLABUF1_float[QLOOKAHEAD]; |
| float INLABUF2_float[QLOOKAHEAD]; |
| |
| /* High pass filter */ |
| double HPstates[HPORDER]; |
| float HPstates_float[HPORDER]; |
| |
| } PreFiltBankstr; |
| |
| typedef struct { |
| // state vectors for each of the two analysis filters |
| double STATE_0_LOWER[2 * POSTQORDER]; |
| double STATE_0_UPPER[2 * POSTQORDER]; |
| |
| /* High pass filter */ |
| double HPstates1[HPORDER]; |
| double HPstates2[HPORDER]; |
| |
| float STATE_0_LOWER_float[2 * POSTQORDER]; |
| float STATE_0_UPPER_float[2 * POSTQORDER]; |
| |
| float HPstates1_float[HPORDER]; |
| float HPstates2_float[HPORDER]; |
| |
| } PostFiltBankstr; |
| |
| typedef struct { |
| // data buffer for pitch filter |
| double ubuf[PITCH_BUFFSIZE]; |
| |
| // low pass state vector |
| double ystate[PITCH_DAMPORDER]; |
| |
| // old lag and gain |
| double oldlagp[1]; |
| double oldgainp[1]; |
| |
| } PitchFiltstr; |
| |
| typedef struct { |
| // data buffer |
| double buffer[PITCH_WLPCBUFLEN]; |
| |
| // state vectors |
| double istate[PITCH_WLPCORDER]; |
| double weostate[PITCH_WLPCORDER]; |
| double whostate[PITCH_WLPCORDER]; |
| |
| // LPC window -> should be a global array because constant |
| double window[PITCH_WLPCWINLEN]; |
| |
| } WeightFiltstr; |
| |
| typedef struct { |
| // for inital estimator |
| double dec_buffer[PITCH_CORR_LEN2 + PITCH_CORR_STEP2 + PITCH_MAX_LAG / 2 - |
| PITCH_FRAME_LEN / 2 + 2]; |
| double decimator_state[2 * ALLPASSSECTIONS + 1]; |
| double hp_state[2]; |
| |
| double whitened_buf[QLOOKAHEAD]; |
| |
| double inbuf[QLOOKAHEAD]; |
| |
| PitchFiltstr PFstr_wght; |
| PitchFiltstr PFstr; |
| WeightFiltstr Wghtstr; |
| |
| } PitchAnalysisStruct; |
| |
| /* Have instance of struct together with other iSAC structs */ |
| typedef struct { |
| /* Previous frame length (in ms) */ |
| int32_t prev_frame_length; |
| |
| /* Previous RTP timestamp from received |
| packet (in samples relative beginning) */ |
| int32_t prev_rec_rtp_number; |
| |
| /* Send timestamp for previous packet (in ms using timeGetTime()) */ |
| uint32_t prev_rec_send_ts; |
| |
| /* Arrival time for previous packet (in ms using timeGetTime()) */ |
| uint32_t prev_rec_arr_ts; |
| |
| /* rate of previous packet, derived from RTP timestamps (in bits/s) */ |
| float prev_rec_rtp_rate; |
| |
| /* Time sinse the last update of the BN estimate (in ms) */ |
| uint32_t last_update_ts; |
| |
| /* Time sinse the last reduction (in ms) */ |
| uint32_t last_reduction_ts; |
| |
| /* How many times the estimate was update in the beginning */ |
| int32_t count_tot_updates_rec; |
| |
| /* The estimated bottle neck rate from there to here (in bits/s) */ |
| int32_t rec_bw; |
| float rec_bw_inv; |
| float rec_bw_avg; |
| float rec_bw_avg_Q; |
| |
| /* The estimated mean absolute jitter value, |
| as seen on this side (in ms) */ |
| float rec_jitter; |
| float rec_jitter_short_term; |
| float rec_jitter_short_term_abs; |
| float rec_max_delay; |
| float rec_max_delay_avg_Q; |
| |
| /* (assumed) bitrate for headers (bps) */ |
| float rec_header_rate; |
| |
| /* The estimated bottle neck rate from here to there (in bits/s) */ |
| float send_bw_avg; |
| |
| /* The estimated mean absolute jitter value, as seen on |
| the other siee (in ms) */ |
| float send_max_delay_avg; |
| |
| // number of packets received since last update |
| int num_pkts_rec; |
| |
| int num_consec_rec_pkts_over_30k; |
| |
| // flag for marking that a high speed network has been |
| // detected downstream |
| int hsn_detect_rec; |
| |
| int num_consec_snt_pkts_over_30k; |
| |
| // flag for marking that a high speed network has |
| // been detected upstream |
| int hsn_detect_snd; |
| |
| uint32_t start_wait_period; |
| |
| int in_wait_period; |
| |
| int change_to_WB; |
| |
| uint32_t senderTimestamp; |
| uint32_t receiverTimestamp; |
| // enum IsacSamplingRate incomingStreamSampFreq; |
| uint16_t numConsecLatePkts; |
| float consecLatency; |
| int16_t inWaitLatePkts; |
| |
| IsacBandwidthInfo external_bw_info; |
| } BwEstimatorstr; |
| |
| typedef struct { |
| /* boolean, flags if previous packet exceeded B.N. */ |
| int PrevExceed; |
| /* ms */ |
| int ExceedAgo; |
| /* packets left to send in current burst */ |
| int BurstCounter; |
| /* packets */ |
| int InitCounter; |
| /* ms remaining in buffer when next packet will be sent */ |
| double StillBuffered; |
| |
| } RateModel; |
| |
| /* The following strutc is used to store data from encoding, to make it |
| fast and easy to construct a new bitstream with a different Bandwidth |
| estimate. All values (except framelength and minBytes) is double size to |
| handle 60 ms of data. |
| */ |
| typedef struct { |
| /* Used to keep track of if it is first or second part of 60 msec packet */ |
| int startIdx; |
| |
| /* Frame length in samples */ |
| int16_t framelength; |
| |
| /* Pitch Gain */ |
| int pitchGain_index[2]; |
| |
| /* Pitch Lag */ |
| double meanGain[2]; |
| int pitchIndex[PITCH_SUBFRAMES * 2]; |
| |
| /* LPC */ |
| int LPCindex_s[108 * 2]; /* KLT_ORDER_SHAPE = 108 */ |
| int LPCindex_g[12 * 2]; /* KLT_ORDER_GAIN = 12 */ |
| double LPCcoeffs_lo[(ORDERLO + 1) * SUBFRAMES * 2]; |
| double LPCcoeffs_hi[(ORDERHI + 1) * SUBFRAMES * 2]; |
| |
| /* Encode Spec */ |
| int16_t fre[FRAMESAMPLES]; |
| int16_t fim[FRAMESAMPLES]; |
| int16_t AvgPitchGain[2]; |
| |
| /* Used in adaptive mode only */ |
| int minBytes; |
| |
| } IsacSaveEncoderData; |
| |
| typedef struct { |
| int indexLPCShape[UB_LPC_ORDER * UB16_LPC_VEC_PER_FRAME]; |
| double lpcGain[SUBFRAMES << 1]; |
| int lpcGainIndex[SUBFRAMES << 1]; |
| |
| Bitstr bitStreamObj; |
| |
| int16_t realFFT[FRAMESAMPLES_HALF]; |
| int16_t imagFFT[FRAMESAMPLES_HALF]; |
| } ISACUBSaveEncDataStruct; |
| |
| typedef struct { |
| Bitstr bitstr_obj; |
| MaskFiltstr maskfiltstr_obj; |
| PreFiltBankstr prefiltbankstr_obj; |
| PitchFiltstr pitchfiltstr_obj; |
| PitchAnalysisStruct pitchanalysisstr_obj; |
| FFTstr fftstr_obj; |
| IsacSaveEncoderData SaveEnc_obj; |
| |
| int buffer_index; |
| int16_t current_framesamples; |
| |
| float data_buffer_float[FRAMESAMPLES_30ms]; |
| |
| int frame_nb; |
| double bottleneck; |
| int16_t new_framelength; |
| double s2nr; |
| |
| /* Maximum allowed number of bits for a 30 msec packet */ |
| int16_t payloadLimitBytes30; |
| /* Maximum allowed number of bits for a 30 msec packet */ |
| int16_t payloadLimitBytes60; |
| /* Maximum allowed number of bits for both 30 and 60 msec packet */ |
| int16_t maxPayloadBytes; |
| /* Maximum allowed rate in bytes per 30 msec packet */ |
| int16_t maxRateInBytes; |
| |
| /*--- |
| If set to 1 iSAC will not addapt the frame-size, if used in |
| channel-adaptive mode. The initial value will be used for all rates. |
| ---*/ |
| int16_t enforceFrameSize; |
| |
| /*----- |
| This records the BWE index the encoder injected into the bit-stream. |
| It will be used in RCU. The same BWE index of main payload will be in |
| the redundant payload. We can not retrive it from BWE because it is |
| a recursive procedure (WebRtcIsac_GetDownlinkBwJitIndexImpl) and has to be |
| called only once per each encode. |
| -----*/ |
| int16_t lastBWIdx; |
| } ISACLBEncStruct; |
| |
| typedef struct { |
| Bitstr bitstr_obj; |
| MaskFiltstr maskfiltstr_obj; |
| PreFiltBankstr prefiltbankstr_obj; |
| FFTstr fftstr_obj; |
| ISACUBSaveEncDataStruct SaveEnc_obj; |
| |
| int buffer_index; |
| float data_buffer_float[MAX_FRAMESAMPLES + LB_TOTAL_DELAY_SAMPLES]; |
| double bottleneck; |
| /* Maximum allowed number of bits for a 30 msec packet */ |
| // int16_t payloadLimitBytes30; |
| /* Maximum allowed number of bits for both 30 and 60 msec packet */ |
| // int16_t maxPayloadBytes; |
| int16_t maxPayloadSizeBytes; |
| |
| double lastLPCVec[UB_LPC_ORDER]; |
| int16_t numBytesUsed; |
| int16_t lastJitterInfo; |
| } ISACUBEncStruct; |
| |
| typedef struct { |
| Bitstr bitstr_obj; |
| MaskFiltstr maskfiltstr_obj; |
| PostFiltBankstr postfiltbankstr_obj; |
| PitchFiltstr pitchfiltstr_obj; |
| FFTstr fftstr_obj; |
| |
| } ISACLBDecStruct; |
| |
| typedef struct { |
| Bitstr bitstr_obj; |
| MaskFiltstr maskfiltstr_obj; |
| PostFiltBankstr postfiltbankstr_obj; |
| FFTstr fftstr_obj; |
| |
| } ISACUBDecStruct; |
| |
| typedef struct { |
| ISACLBEncStruct ISACencLB_obj; |
| ISACLBDecStruct ISACdecLB_obj; |
| } ISACLBStruct; |
| |
| typedef struct { |
| ISACUBEncStruct ISACencUB_obj; |
| ISACUBDecStruct ISACdecUB_obj; |
| } ISACUBStruct; |
| |
| /* |
| This struct is used to take a snapshot of the entropy coder and LPC gains |
| right before encoding LPC gains. This allows us to go back to that state |
| if we like to limit the payload size. |
| */ |
| typedef struct { |
| /* 6 lower-band & 6 upper-band */ |
| double loFiltGain[SUBFRAMES]; |
| double hiFiltGain[SUBFRAMES]; |
| /* Upper boundary of interval W */ |
| uint32_t W_upper; |
| uint32_t streamval; |
| /* Index to the current position in bytestream */ |
| uint32_t stream_index; |
| uint8_t stream[3]; |
| } transcode_obj; |
| |
| typedef struct { |
| // TODO(kwiberg): The size of these tables could be reduced by storing floats |
| // instead of doubles, and by making use of the identity cos(x) = |
| // sin(x+pi/2). They could also be made global constants that we fill in at |
| // compile time. |
| double costab1[FRAMESAMPLES_HALF]; |
| double sintab1[FRAMESAMPLES_HALF]; |
| double costab2[FRAMESAMPLES_QUARTER]; |
| double sintab2[FRAMESAMPLES_QUARTER]; |
| } TransformTables; |
| |
| typedef struct { |
| // lower-band codec instance |
| ISACLBStruct instLB; |
| // upper-band codec instance |
| ISACUBStruct instUB; |
| |
| // Bandwidth Estimator and model for the rate. |
| BwEstimatorstr bwestimator_obj; |
| RateModel rate_data_obj; |
| double MaxDelay; |
| |
| /* 0 = adaptive; 1 = instantaneous */ |
| int16_t codingMode; |
| |
| // overall bottleneck of the codec |
| int32_t bottleneck; |
| |
| // QMF Filter state |
| int32_t analysisFBState1[FB_STATE_SIZE_WORD32]; |
| int32_t analysisFBState2[FB_STATE_SIZE_WORD32]; |
| int32_t synthesisFBState1[FB_STATE_SIZE_WORD32]; |
| int32_t synthesisFBState2[FB_STATE_SIZE_WORD32]; |
| |
| // Error Code |
| int16_t errorCode; |
| |
| // bandwidth of the encoded audio 8, 12 or 16 kHz |
| enum ISACBandwidth bandwidthKHz; |
| // Sampling rate of audio, encoder and decode, 8 or 16 kHz |
| enum IsacSamplingRate encoderSamplingRateKHz; |
| enum IsacSamplingRate decoderSamplingRateKHz; |
| // Flag to keep track of initializations, lower & upper-band |
| // encoder and decoder. |
| int16_t initFlag; |
| |
| // Flag to to indicate signal bandwidth switch |
| int16_t resetFlag_8kHz; |
| |
| // Maximum allowed rate, measured in Bytes per 30 ms. |
| int16_t maxRateBytesPer30Ms; |
| // Maximum allowed payload-size, measured in Bytes. |
| int16_t maxPayloadSizeBytes; |
| /* The expected sampling rate of the input signal. Valid values are 16000 |
| * and 32000. This is not the operation sampling rate of the codec. */ |
| uint16_t in_sample_rate_hz; |
| |
| // Trig tables for WebRtcIsac_Time2Spec and WebRtcIsac_Spec2time. |
| TransformTables transform_tables; |
| } ISACMainStruct; |
| |
| #endif /* MODULES_AUDIO_CODING_CODECS_ISAC_MAIN_SOURCE_STRUCTS_H_ */ |