2 * Opus decoder/demuxer common functions
3 * Copyright (c) 2012 Andrew D'Addesio
4 * Copyright (c) 2013-2014 Mozilla Corporation
6 * This file is part of FFmpeg.
8 * FFmpeg is free software; you can redistribute it and/or
9 * modify it under the terms of the GNU Lesser General Public
10 * License as published by the Free Software Foundation; either
11 * version 2.1 of the License, or (at your option) any later version.
13 * FFmpeg is distributed in the hope that it will be useful,
14 * but WITHOUT ANY WARRANTY; without even the implied warranty of
15 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
16 * Lesser General Public License for more details.
18 * You should have received a copy of the GNU Lesser General Public
19 * License along with FFmpeg; if not, write to the Free Software
20 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
23 #ifndef AVCODEC_OPUS_H
24 #define AVCODEC_OPUS_H
28 #include "libavutil/audio_fifo.h"
29 #include "libavutil/float_dsp.h"
30 #include "libavutil/frame.h"
32 #include "libswresample/swresample.h"
/* Size limits. RFC 6716 caps a single Opus frame at 1275 bytes and a packet
 * at 120 ms; 5760 is 120 ms expressed in samples at 48 kHz.
 * NOTE(review): confirm the users of these macros rely on those units. */
37 #define MAX_FRAME_SIZE 1275
39 #define MAX_PACKET_DUR 5760
/* CELT block geometry: the overlap equals one short block (120), and the
 * largest frame is CELT_SHORT_BLOCKSIZE * (1 << CELT_MAX_LOG_BLOCKS)
 * = 120 * 8 = 960. */
41 #define CELT_SHORT_BLOCKSIZE 120
42 #define CELT_OVERLAP CELT_SHORT_BLOCKSIZE
43 #define CELT_MAX_LOG_BLOCKS 3
44 #define CELT_MAX_FRAME_SIZE (CELT_SHORT_BLOCKSIZE * (1 << CELT_MAX_LOG_BLOCKS))
/* NOTE(review): presumably the upper bound on the number of CELT bands. */
45 #define CELT_MAX_BANDS 21
/* NOTE(review): SILK sizing constants; judging by the names, a history length
 * and a maximum LPC order — confirm against the SILK decoder. */
47 #define SILK_HISTORY 322
48 #define SILK_MAX_LPC 16
/* Rounding fixed-point helpers. MUL64 and MUL16 are defined elsewhere
 * (presumably the 64-bit and 16-bit products of their arguments).
 * ROUND_MULL shifts MUL64(a, b) right by s bits with round-half-up: it shifts
 * by (s) - 1, adds 1, then shifts once more. s must be at least 1, because a
 * shift by (s) - 1 with s == 0 would be a negative shift count.
 * ROUND_MUL16 adds 16384 (1 << 14) before shifting right by 15, i.e. the same
 * round-half-up scheme for a fixed shift of 15 bits. */
50 #define ROUND_MULL(a,b,s) (((MUL64(a, b) >> ((s) - 1)) + 1) >> 1)
51 #define ROUND_MUL16(a,b) ((MUL16(a, b) + 16384) >> 15)
/* 0x7FE0 is 0x3ff << 5, and 0xFFE0 selects the top 11 bits of a 16-bit word.
 * NOTE(review): presumably a 16-bit prefix x is recognised with
 * (x & OPUS_TS_MASK) == OPUS_TS_HEADER for Opus carried in MPEG-TS — confirm
 * against the users of these macros. */
53 #define OPUS_TS_HEADER 0x7FE0 // 0x3ff (11 bits)
54 #define OPUS_TS_MASK 0xFFE0 // top 11 bits
56 static const uint8_t opus_default_extradata[30] = {
57 'O', 'p', 'u', 's', 'H', 'e', 'a', 'd',
58 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
59 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
69 OPUS_BANDWIDTH_NARROWBAND,
70 OPUS_BANDWIDTH_MEDIUMBAND,
71 OPUS_BANDWIDTH_WIDEBAND,
72 OPUS_BANDWIDTH_SUPERWIDEBAND,
73 OPUS_BANDWIDTH_FULLBAND
/* Forward declarations only: the struct bodies are not defined in the visible
 * part of this header, so code here can hold pointers to these contexts but
 * cannot access their members. */
76 typedef struct SilkContext SilkContext;
78 typedef struct CeltContext CeltContext;
80 typedef struct OpusPacket {
81 int packet_size; /**< packet size */
82 int data_size; /**< size of the useful data -- packet size - padding */
83 int code; /**< packet code: specifies the frame layout */
84 int stereo; /**< whether this packet is mono or stereo */
85 int vbr; /**< vbr flag */
86 int config; /**< configuration: tells the audio mode,
87 ** bandwidth, and frame duration */
88 int frame_count; /**< frame count */
89 int frame_offset[MAX_FRAMES]; /**< frame offsets */
90 int frame_size[MAX_FRAMES]; /**< frame sizes */
91 int frame_duration; /**< frame duration, in samples @ 48kHz */
92 enum OpusMode mode; /**< mode */
93 enum OpusBandwidth bandwidth; /**< bandwidth */
96 typedef struct OpusStreamContext {
97 AVCodecContext *avctx;
101 OpusRangeCoder redundancy_rc;
104 AVFloatDSPContext *fdsp;
106 float silk_buf[2][960];
107 float *silk_output[2];
108 DECLARE_ALIGNED(32, float, celt_buf)[2][960];
109 float *celt_output[2];
111 float redundancy_buf[2][960];
112 float *redundancy_output[2];
114 /* data buffers for the final output data */
119 int out_dummy_allocated_size;
122 AVAudioFifo *celt_delay;
124 /* number of samples we still want to get from the resampler */
132 // a mapping between an opus stream and an output channel
133 typedef struct ChannelMap {
137 // when a single decoded channel is mapped to multiple output channels, we
138 // write to the first output directly and copy from it to the others
139 // this field is set to 1 for those copied output channels
141 // this is the index of the output channel to copy from
144 // this channel is silent
148 typedef struct OpusContext {
149 OpusStreamContext *streams;
151 /* current output buffers for each stream */
154 /* Buffers for synchronizing the streams when they have different
155 * resampling delays */
156 AVAudioFifo **sync_buffers;
157 /* number of decoded samples for each stream */
158 int *decoded_samples;
161 int nb_stereo_streams;
163 AVFloatDSPContext *fdsp;
167 ChannelMap *channel_maps;
170 int ff_opus_parse_packet(OpusPacket *pkt, const uint8_t *buf, int buf_size,
/**
 * Parse the Opus extradata.
 *
 * @param avctx codec context
 * @param s     Opus decoder context
 * @return int status code
 *
 * NOTE(review): presumably reads the extradata attached to avctx and fills in
 * the stream and channel-mapping fields of s, returning 0 on success and a
 * negative error code on failure — confirm against the implementation.
 */
173 int ff_opus_parse_extradata(AVCodecContext *avctx, OpusContext *s);
/**
 * Initialise a SILK decoder context.
 *
 * @param avctx           codec context
 * @param ps              address of the caller's SilkContext pointer
 * @param output_channels NOTE(review): presumably the number of channels the
 *                        decoder should output — confirm
 * @return int status code
 *
 * NOTE(review): presumably allocates the context and stores it in *ps,
 * returning 0 on success and a negative error code on failure — confirm
 * against the implementation.
 */
175 int ff_silk_init(AVCodecContext *avctx, SilkContext **ps, int output_channels);
/**
 * Release a SILK decoder context.
 *
 * @param ps address of the caller's SilkContext pointer
 *
 * NOTE(review): taking a pointer-to-pointer suggests *ps is reset after the
 * context is freed — confirm against the implementation.
 */
176 void ff_silk_free(SilkContext **ps);
/**
 * Flush a SILK decoder context.
 *
 * @param s SILK decoder context
 *
 * NOTE(review): presumably discards decoder history so that decoding can
 * restart cleanly (e.g. after a seek) — confirm against the implementation.
 */
177 void ff_silk_flush(SilkContext *s);
180 * Decode the LP layer of one Opus frame (which may correspond to several SILK
183 int ff_silk_decode_superframe(SilkContext *s, OpusRangeCoder *rc,
185 enum OpusBandwidth bandwidth, int coded_channels,
/**
 * Initialise a CELT decoder context.
 *
 * @param avctx           codec context
 * @param s               address of the caller's CeltContext pointer
 * @param output_channels NOTE(review): presumably the number of channels the
 *                        decoder should output — confirm
 * @return int status code
 *
 * NOTE(review): presumably allocates the context and stores it in *s,
 * returning 0 on success and a negative error code on failure — confirm
 * against the implementation.
 */
188 int ff_celt_init(AVCodecContext *avctx, CeltContext **s, int output_channels);
/**
 * Release a CELT decoder context.
 *
 * @param s address of the caller's CeltContext pointer
 *
 * NOTE(review): taking a pointer-to-pointer suggests *s is reset after the
 * context is freed — confirm against the implementation.
 */
190 void ff_celt_free(CeltContext **s);
/**
 * Flush a CELT decoder context.
 *
 * @param s CELT decoder context
 *
 * NOTE(review): presumably discards decoder history so that decoding can
 * restart cleanly (e.g. after a seek) — confirm against the implementation.
 */
192 void ff_celt_flush(CeltContext *s);
/**
 * Decode one CELT frame.
 *
 * @param s              CELT decoder context
 * @param rc             range coder the frame is read from
 * @param output         array of per-channel float output pointers
 * @param coded_channels NOTE(review): presumably the number of channels coded
 *                       in the bitstream (1 or 2) — confirm
 * @param frame_size     NOTE(review): presumably the frame length in samples,
 *                       at most CELT_MAX_FRAME_SIZE — confirm
 * @param startband      NOTE(review): presumably the first band to decode
 * @param endband        NOTE(review): presumably the end of the decoded band
 *                       range, at most CELT_MAX_BANDS; whether it is inclusive
 *                       is not visible here — confirm
 * @return int status code; NOTE(review): presumably 0 on success and a
 *         negative error code on failure — confirm against the implementation
 */
194 int ff_celt_decode_frame(CeltContext *s, OpusRangeCoder *rc,
195 float **output, int coded_channels, int frame_size,
196 int startband, int endband);
198 #endif /* AVCODEC_OPUS_H */