mirror of
https://github.com/FFmpeg/FFmpeg.git
synced 2024-12-18 03:19:31 +02:00
20f9727018
Up until now, codec.h contains both public and private parts of AVCodec. This exposes the internals of AVCodec to users and leads them into the temptation of actually using them and forces us to forward-declare structures and types that users can't use at all. This commit changes this by adding a new structure FFCodec to codec_internal.h that extends AVCodec, i.e. contains the public AVCodec as first member; the private fields of AVCodec are moved to this structure, leaving codec.h clean. Reviewed-by: Anton Khirnov <anton@khirnov.net> Signed-off-by: Andreas Rheinhardt <andreas.rheinhardt@outlook.com>
204 lines
5.8 KiB
C
204 lines
5.8 KiB
C
/*
|
|
* RoQ audio encoder
|
|
*
|
|
* Copyright (c) 2005 Eric Lasota
|
|
* Based on RoQ specs (c)2001 Tim Ferguson
|
|
*
|
|
* This file is part of FFmpeg.
|
|
*
|
|
* FFmpeg is free software; you can redistribute it and/or
|
|
* modify it under the terms of the GNU Lesser General Public
|
|
* License as published by the Free Software Foundation; either
|
|
* version 2.1 of the License, or (at your option) any later version.
|
|
*
|
|
* FFmpeg is distributed in the hope that it will be useful,
|
|
* but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
|
|
* Lesser General Public License for more details.
|
|
*
|
|
* You should have received a copy of the GNU Lesser General Public
|
|
* License along with FFmpeg; if not, write to the Free Software
|
|
* Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
|
|
*/
|
|
|
|
#include "avcodec.h"
|
|
#include "bytestream.h"
|
|
#include "codec_internal.h"
|
|
#include "encode.h"
|
|
#include "mathops.h"
|
|
|
|
#define ROQ_FRAME_SIZE 735
|
|
#define ROQ_HEADER_SIZE 8
|
|
|
|
#define MAX_DPCM (127*127)
|
|
|
|
|
|
typedef struct ROQDPCMContext {
|
|
short lastSample[2];
|
|
int input_frames;
|
|
int buffered_samples;
|
|
int16_t *frame_buffer;
|
|
int64_t first_pts;
|
|
} ROQDPCMContext;
|
|
|
|
|
|
static av_cold int roq_dpcm_encode_close(AVCodecContext *avctx)
|
|
{
|
|
ROQDPCMContext *context = avctx->priv_data;
|
|
|
|
av_freep(&context->frame_buffer);
|
|
|
|
return 0;
|
|
}
|
|
|
|
static av_cold int roq_dpcm_encode_init(AVCodecContext *avctx)
|
|
{
|
|
ROQDPCMContext *context = avctx->priv_data;
|
|
int channels = avctx->ch_layout.nb_channels;
|
|
|
|
if (channels > 2) {
|
|
av_log(avctx, AV_LOG_ERROR, "Audio must be mono or stereo\n");
|
|
return AVERROR(EINVAL);
|
|
}
|
|
if (avctx->sample_rate != 22050) {
|
|
av_log(avctx, AV_LOG_ERROR, "Audio must be 22050 Hz\n");
|
|
return AVERROR(EINVAL);
|
|
}
|
|
|
|
avctx->frame_size = ROQ_FRAME_SIZE;
|
|
avctx->bit_rate = (ROQ_HEADER_SIZE + ROQ_FRAME_SIZE * channels) *
|
|
(22050 / ROQ_FRAME_SIZE) * 8;
|
|
|
|
context->frame_buffer = av_malloc(8 * ROQ_FRAME_SIZE * channels *
|
|
sizeof(*context->frame_buffer));
|
|
if (!context->frame_buffer)
|
|
return AVERROR(ENOMEM);
|
|
|
|
context->lastSample[0] = context->lastSample[1] = 0;
|
|
|
|
return 0;
|
|
}
|
|
|
|
static unsigned char dpcm_predict(short *previous, short current)
|
|
{
|
|
int diff;
|
|
int negative;
|
|
int result;
|
|
int predicted;
|
|
|
|
diff = current - *previous;
|
|
|
|
negative = diff<0;
|
|
diff = FFABS(diff);
|
|
|
|
if (diff >= MAX_DPCM)
|
|
result = 127;
|
|
else {
|
|
result = ff_sqrt(diff);
|
|
result += diff > result*result+result;
|
|
}
|
|
|
|
/* See if this overflows */
|
|
retry:
|
|
diff = result*result;
|
|
if (negative)
|
|
diff = -diff;
|
|
predicted = *previous + diff;
|
|
|
|
/* If it overflows, back off a step */
|
|
if (predicted > 32767 || predicted < -32768) {
|
|
result--;
|
|
goto retry;
|
|
}
|
|
|
|
/* Add the sign bit */
|
|
result |= negative << 7; //if (negative) result |= 128;
|
|
|
|
*previous = predicted;
|
|
|
|
return result;
|
|
}
|
|
|
|
static int roq_dpcm_encode_frame(AVCodecContext *avctx, AVPacket *avpkt,
|
|
const AVFrame *frame, int *got_packet_ptr)
|
|
{
|
|
int i, stereo, data_size, ret;
|
|
const int16_t *in = frame ? (const int16_t *)frame->data[0] : NULL;
|
|
int channels = avctx->ch_layout.nb_channels;
|
|
uint8_t *out;
|
|
ROQDPCMContext *context = avctx->priv_data;
|
|
|
|
stereo = (channels == 2);
|
|
|
|
if (!in && context->input_frames >= 8)
|
|
return 0;
|
|
|
|
if (in && context->input_frames < 8) {
|
|
memcpy(&context->frame_buffer[context->buffered_samples * channels],
|
|
in, avctx->frame_size * channels * sizeof(*in));
|
|
context->buffered_samples += avctx->frame_size;
|
|
if (context->input_frames == 0)
|
|
context->first_pts = frame->pts;
|
|
if (context->input_frames < 7) {
|
|
context->input_frames++;
|
|
return 0;
|
|
}
|
|
}
|
|
if (context->input_frames < 8)
|
|
in = context->frame_buffer;
|
|
|
|
if (stereo) {
|
|
context->lastSample[0] &= 0xFF00;
|
|
context->lastSample[1] &= 0xFF00;
|
|
}
|
|
|
|
if (context->input_frames == 7)
|
|
data_size = channels * context->buffered_samples;
|
|
else
|
|
data_size = channels * avctx->frame_size;
|
|
|
|
ret = ff_get_encode_buffer(avctx, avpkt, ROQ_HEADER_SIZE + data_size, 0);
|
|
if (ret < 0)
|
|
return ret;
|
|
out = avpkt->data;
|
|
|
|
bytestream_put_byte(&out, stereo ? 0x21 : 0x20);
|
|
bytestream_put_byte(&out, 0x10);
|
|
bytestream_put_le32(&out, data_size);
|
|
|
|
if (stereo) {
|
|
bytestream_put_byte(&out, (context->lastSample[1])>>8);
|
|
bytestream_put_byte(&out, (context->lastSample[0])>>8);
|
|
} else
|
|
bytestream_put_le16(&out, context->lastSample[0]);
|
|
|
|
/* Write the actual samples */
|
|
for (i = 0; i < data_size; i++)
|
|
*out++ = dpcm_predict(&context->lastSample[i & 1], *in++);
|
|
|
|
avpkt->pts = context->input_frames <= 7 ? context->first_pts : frame->pts;
|
|
avpkt->duration = data_size / channels;
|
|
|
|
context->input_frames++;
|
|
if (!in)
|
|
context->input_frames = FFMAX(context->input_frames, 8);
|
|
|
|
*got_packet_ptr = 1;
|
|
return 0;
|
|
}
|
|
|
|
const FFCodec ff_roq_dpcm_encoder = {
|
|
.p.name = "roq_dpcm",
|
|
.p.long_name = NULL_IF_CONFIG_SMALL("id RoQ DPCM"),
|
|
.p.type = AVMEDIA_TYPE_AUDIO,
|
|
.p.id = AV_CODEC_ID_ROQ_DPCM,
|
|
.p.capabilities = AV_CODEC_CAP_DR1 | AV_CODEC_CAP_DELAY,
|
|
.priv_data_size = sizeof(ROQDPCMContext),
|
|
.init = roq_dpcm_encode_init,
|
|
.encode2 = roq_dpcm_encode_frame,
|
|
.close = roq_dpcm_encode_close,
|
|
.p.sample_fmts = (const enum AVSampleFormat[]){ AV_SAMPLE_FMT_S16,
|
|
AV_SAMPLE_FMT_NONE },
|
|
.caps_internal = FF_CODEC_CAP_INIT_THREADSAFE,
|
|
};
|