| /* Copyright (c) 2011 Xiph.Org Foundation |
| Written by Jean-Marc Valin */ |
| /* |
| Redistribution and use in source and binary forms, with or without |
| modification, are permitted provided that the following conditions |
| are met: |
| |
| - Redistributions of source code must retain the above copyright |
| notice, this list of conditions and the following disclaimer. |
| |
| - Redistributions in binary form must reproduce the above copyright |
| notice, this list of conditions and the following disclaimer in the |
| documentation and/or other materials provided with the distribution. |
| |
| THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS |
| ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT |
| LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR |
| A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE FOUNDATION OR |
| CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, |
| EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, |
| PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR |
| PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF |
| LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING |
| NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS |
| SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. |
| */ |
| |
| #ifndef ANALYSIS_H |
| #define ANALYSIS_H |
| |
| #include "celt.h" |
| #include "opus_private.h" |
| |
| #define NB_FRAMES 8 |
| #define NB_TBANDS 18 |
| #define NB_TOT_BANDS 21 |
| #define ANALYSIS_BUF_SIZE 720 /* 15 ms at 48 kHz */ |
| |
| #define DETECT_SIZE 200 |
| |
| typedef struct { |
| float angle[240]; |
| float d_angle[240]; |
| float d2_angle[240]; |
| opus_val32 inmem[ANALYSIS_BUF_SIZE]; |
| int mem_fill; /* number of usable samples in the buffer */ |
| float prev_band_tonality[NB_TBANDS]; |
| float prev_tonality; |
| float E[NB_FRAMES][NB_TBANDS]; |
| float lowE[NB_TBANDS]; |
| float highE[NB_TBANDS]; |
| float meanE[NB_TOT_BANDS]; |
| float mem[32]; |
| float cmean[8]; |
| float std[9]; |
| float music_prob; |
| float Etracker; |
| float lowECount; |
| int E_count; |
| int last_music; |
| int last_transition; |
| int count; |
| float subframe_mem[3]; |
| int analysis_offset; |
| /** Probability of having speech for time i to DETECT_SIZE-1 (and music before). |
| pspeech[0] is the probability that all frames in the window are speech. */ |
| float pspeech[DETECT_SIZE]; |
| /** Probability of having music for time i to DETECT_SIZE-1 (and speech before). |
| pmusic[0] is the probability that all frames in the window are music. */ |
| float pmusic[DETECT_SIZE]; |
| float speech_confidence; |
| float music_confidence; |
| int speech_confidence_count; |
| int music_confidence_count; |
| int write_pos; |
| int read_pos; |
| int read_subframe; |
| AnalysisInfo info[DETECT_SIZE]; |
| } TonalityAnalysisState; |
| |
| void tonality_analysis(TonalityAnalysisState *tonal, AnalysisInfo *info, |
| const CELTMode *celt_mode, const void *x, int len, int offset, int c1, int c2, int C, int lsb_depth, downmix_func downmix); |
| |
| void tonality_get_info(TonalityAnalysisState *tonal, AnalysisInfo *info_out, int len); |
| |
| void run_analysis(TonalityAnalysisState *analysis, const CELTMode *celt_mode, const void *analysis_pcm, |
| int analysis_frame_size, int frame_size, int c1, int c2, int C, opus_int32 Fs, |
| int lsb_depth, downmix_func downmix, AnalysisInfo *analysis_info); |
| |
| #endif |