1
0
mirror of https://github.com/FFmpeg/FFmpeg.git synced 2024-12-23 12:43:46 +02:00

af_hdcd: Process stereo channels together, fix #5727

Issue #5727: gain adjustment should only be applied if matching
gain value from a valid packet in both channels. The existing functions process
each channel separately, so it was not possible.

* New versions of hdcd_process(), hdcd_scan(), hdcd_integrate() named
  hdcd_*_stereo() that process both channels together.
* target_gain applied will be the last matching target_gain.
* The old single channel functions remain as an option. They can be
  used by: -af hdcd=process_stereo=0.

Signed-off-by: Burt P <pburt0@gmail.com>
Signed-off-by: Michael Niedermayer <michael@niedermayer.cc>
This commit is contained in:
Burt P 2016-08-01 14:28:39 -05:00 committed by Michael Niedermayer
parent 517dd04f6d
commit d574e22659

View File

@ -863,10 +863,22 @@ static const char * const pe_str[] = {
"enabled permanently" "enabled permanently"
}; };
#define HDCD_PROCESS_STEREO_DEFAULT 1
#define HDCD_MAX_CHANNELS 2
/* convert to float from 4-bit (3.1) fixed-point
* the always-negative value is stored positive, so make it negative */
#define GAINTOFLOAT(g) (g) ? -(float)(g>>1) - ((g & 1) ? 0.5 : 0.0) : 0.0
typedef struct HDCDContext { typedef struct HDCDContext {
const AVClass *class; const AVClass *class;
hdcd_state_t state[2]; hdcd_state_t state[HDCD_MAX_CHANNELS];
/* use hdcd_*_stereo() functions to process both channels together.
* -af hdcd=process_stereo=0 for off
* -af hdcd=process_stereo=1 for on
* default is HDCD_PROCESS_STEREO_DEFAULT */
int process_stereo;
/* always extend peaks above -3dBFS even if PE isn't signaled /* always extend peaks above -3dBFS even if PE isn't signaled
* -af hdcd=force_pe=0 for off * -af hdcd=force_pe=0 for off
* -af hdcd=force_pe=1 for on * -af hdcd=force_pe=1 for on
@ -875,6 +887,7 @@ typedef struct HDCDContext {
AVFilterContext *fctx; /* filter context for logging errors */ AVFilterContext *fctx; /* filter context for logging errors */
int sample_count; /* used in error logging */ int sample_count; /* used in error logging */
int val_target_gain; /* last matching target_gain in both channels */
/* User information/stats */ /* User information/stats */
int hdcd_detected; int hdcd_detected;
@ -886,9 +899,11 @@ typedef struct HDCDContext {
#define OFFSET(x) offsetof(HDCDContext, x) #define OFFSET(x) offsetof(HDCDContext, x)
static const AVOption hdcd_options[] = { static const AVOption hdcd_options[] = {
{ "process_stereo", "Process stereo channels together. Only apply target_gain when both channels match.",
OFFSET(process_stereo), AV_OPT_TYPE_INT, { .i64 = HDCD_PROCESS_STEREO_DEFAULT }, 0, 1, 0 },
{ "force_pe", "Always extend peaks above -3dBFS even when PE is not signaled.", { "force_pe", "Always extend peaks above -3dBFS even when PE is not signaled.",
OFFSET(force_pe), AV_OPT_TYPE_INT, { .i64 = 0 }, 0, 1, 0 }, OFFSET(force_pe), AV_OPT_TYPE_INT, { .i64 = 0 }, 0, 1, 0 },
{NULL} {NULL}
}; };
AVFILTER_DEFINE_CLASS(hdcd); AVFILTER_DEFINE_CLASS(hdcd);
@ -915,12 +930,10 @@ static void hdcd_reset(hdcd_state_t *state, unsigned rate)
state->code_counterB_checkfails = 0; state->code_counterB_checkfails = 0;
state->code_counterC = 0; state->code_counterC = 0;
state->code_counterC_unmatched = 0; state->code_counterC_unmatched = 0;
state->count_peak_extend = 0; state->count_peak_extend = 0;
state->count_transient_filter = 0; state->count_transient_filter = 0;
for(i = 0; i < 16; i++) state->gain_counts[i] = 0; for(i = 0; i < 16; i++) state->gain_counts[i] = 0;
state->max_gain = 0; state->max_gain = 0;
state->count_sustain_expired = -1; state->count_sustain_expired = -1;
} }
@ -1037,6 +1050,76 @@ static int hdcd_integrate(HDCDContext *ctx, hdcd_state_t *state, int *flag, cons
return result; return result;
} }
static int hdcd_integrate_stereo(HDCDContext *ctx, int *flag, const int32_t *samples, int count)
{
uint32_t bits[2] = {0, 0};
int result;
int i;
*flag = 0;
/* result = min(count, s0ra, s1ra) */
result = FFMIN(ctx->state[0].readahead, count);
result = FFMIN(ctx->state[1].readahead, result);
for (i = result - 1; i >= 0; i--) {
bits[0] |= (*(samples++) & 1) << i;
bits[1] |= (*(samples++) & 1) << i;
}
for (i = 0; i < 2; i++) {
ctx->state[i].window = (ctx->state[i].window << result) | bits[i];
ctx->state[i].readahead -= result;
if (ctx->state[i].readahead == 0) {
uint32_t wbits = (ctx->state[i].window ^ ctx->state[i].window >> 5 ^ ctx->state[i].window >> 23);
if (ctx->state[i].arg) {
switch (hdcd_code(wbits, &ctx->state[i].control)) {
case HDCD_CODE_A:
*flag |= i+1;
ctx->state[i].code_counterA++;
break;
case HDCD_CODE_B:
*flag |= i+1;
ctx->state[i].code_counterB++;
break;
case HDCD_CODE_A_ALMOST:
ctx->state[i].code_counterA_almost++;
av_log(ctx->fctx, AV_LOG_VERBOSE,
"hdcd error: Control A almost: 0x%02x near %d\n", wbits & 0xff, ctx->sample_count);
break;
case HDCD_CODE_B_CHECKFAIL:
ctx->state[i].code_counterB_checkfails++;
av_log(ctx->fctx, AV_LOG_VERBOSE,
"hdcd error: Control B check failed: 0x%04x (0x%02x vs 0x%02x) near %d\n", wbits & 0xffff, (wbits & 0xff00) >> 8, ~wbits & 0xff, ctx->sample_count);
break;
case HDCD_CODE_NONE:
ctx->state[i].code_counterC_unmatched++;
av_log(ctx->fctx, AV_LOG_VERBOSE,
"hdcd error: Unmatched code: 0x%08x near %d\n", wbits, ctx->sample_count);
default:
av_log(ctx->fctx, AV_LOG_INFO,
"hdcd error: Unexpected return value from hdcd_code()\n");
av_assert0(0); /* die */
}
if (*flag&(i+1)) hdcd_update_info(&ctx->state[i]);
ctx->state[i].arg = 0;
}
if (wbits == 0x7e0fa005 || wbits == 0x7e0fa006) {
/* 0x7e0fa00[.]-> [0b0101 or 0b0110] */
ctx->state[i].readahead = (wbits & 3) * 8;
ctx->state[i].arg = 1;
ctx->state[i].code_counterC++;
} else {
if (wbits)
ctx->state[i].readahead = readaheadtab[wbits & 0xff];
else
ctx->state[i].readahead = 31; /* ffwd over digisilence */
}
}
}
return result;
}
static void hdcd_sustain_reset(hdcd_state_t *state) static void hdcd_sustain_reset(hdcd_state_t *state)
{ {
state->sustain = state->sustain_reset; state->sustain = state->sustain_reset;
@ -1048,9 +1131,9 @@ static void hdcd_sustain_reset(hdcd_state_t *state)
static int hdcd_scan(HDCDContext *ctx, hdcd_state_t *state, const int32_t *samples, int max, int stride) static int hdcd_scan(HDCDContext *ctx, hdcd_state_t *state, const int32_t *samples, int max, int stride)
{ {
int result;
int cdt_active = 0; int cdt_active = 0;
/* code detect timer */ /* code detect timer */
int result;
if (state->sustain > 0) { if (state->sustain > 0) {
cdt_active = 1; cdt_active = 1;
if (state->sustain <= max) { if (state->sustain <= max) {
@ -1059,6 +1142,7 @@ static int hdcd_scan(HDCDContext *ctx, hdcd_state_t *state, const int32_t *sampl
} }
state->sustain -= max; state->sustain -= max;
} }
result = 0; result = 0;
while (result < max) { while (result < max) {
int flag; int flag;
@ -1074,6 +1158,48 @@ static int hdcd_scan(HDCDContext *ctx, hdcd_state_t *state, const int32_t *sampl
/* code detect timer expired */ /* code detect timer expired */
if (cdt_active && state->sustain == 0) if (cdt_active && state->sustain == 0)
state->count_sustain_expired++; state->count_sustain_expired++;
return result;
}
static int hdcd_scan_stereo(HDCDContext *ctx, const int32_t *samples, int max)
{
int result;
int i;
int cdt_active[2] = {0, 0};
/* code detect timers for each channel */
for(i=0; i<2; i++) {
if (ctx->state[i].sustain > 0) {
cdt_active[i] = 1;
if (ctx->state[i].sustain <= max) {
ctx->state[i].control = 0;
max = ctx->state[i].sustain;
}
ctx->state[i].sustain -= max;
}
}
result = 0;
while (result < max) {
int flag;
int consumed = hdcd_integrate_stereo(ctx, &flag, samples, max - result);
result += consumed;
if (flag) {
/* reset timer if code detected in a channel */
if (flag & 1) hdcd_sustain_reset(&ctx->state[0]);
if (flag & 2) hdcd_sustain_reset(&ctx->state[1]);
break;
}
samples += consumed * 2;
}
for(i=0; i<2; i++) {
/* code detect timer expired */
if (cdt_active[i] && ctx->state[i].sustain == 0)
ctx->state[i].count_sustain_expired++;
}
return result; return result;
} }
@ -1143,6 +1269,30 @@ static void hdcd_control(HDCDContext *ctx, hdcd_state_t *state, int *peak_extend
*target_gain = (state->control & 15) << 7; *target_gain = (state->control & 15) << 7;
} }
typedef enum {
HDCD_OK=0,
HDCD_TG_MISMATCH
} hdcd_control_result_t;
static hdcd_control_result_t hdcd_control_stereo(HDCDContext *ctx, int *peak_extend0, int *peak_extend1)
{
int target_gain[2];
hdcd_control(ctx, &ctx->state[0], peak_extend0, &target_gain[0]);
hdcd_control(ctx, &ctx->state[1], peak_extend1, &target_gain[1]);
if (target_gain[0] == target_gain[1])
ctx->val_target_gain = target_gain[0];
else {
av_log(ctx->fctx, AV_LOG_VERBOSE,
"hdcd error: Unmatched target_gain near %d: tg0: %0.1f, tg1: %0.1f, lvg: %0.1f\n",
ctx->sample_count,
GAINTOFLOAT(target_gain[0] >>7),
GAINTOFLOAT(target_gain[1] >>7),
GAINTOFLOAT(ctx->val_target_gain >>7) );
return HDCD_TG_MISMATCH;
}
return HDCD_OK;
}
static void hdcd_process(HDCDContext *ctx, hdcd_state_t *state, int32_t *samples, int count, int stride) static void hdcd_process(HDCDContext *ctx, hdcd_state_t *state, int32_t *samples, int count, int stride)
{ {
int32_t *samples_end = samples + count * stride; int32_t *samples_end = samples + count * stride;
@ -1175,9 +1325,44 @@ static void hdcd_process(HDCDContext *ctx, hdcd_state_t *state, int32_t *samples
state->running_gain = gain; state->running_gain = gain;
} }
/* convert to float from 4-bit (3.1) fixed-point static void hdcd_process_stereo(HDCDContext *ctx, int32_t *samples, int count)
* the always-negative value is stored positive, so make it negative */ {
#define GAINTOFLOAT(g) (g) ? -(float)(g>>1) - ((g & 1) ? 0.5 : 0.0) : 0.0 const int stride = 2;
int32_t *samples_end = samples + count * stride;
int gain[2] = {ctx->state[0].running_gain, ctx->state[1].running_gain};
int peak_extend[2];
int lead = 0;
hdcd_control_stereo(ctx, &peak_extend[0], &peak_extend[1]);
while (count > lead) {
int envelope_run, run;
av_assert0(samples + lead * stride + stride * (count - lead) <= samples_end);
run = hdcd_scan_stereo(ctx, samples + lead * stride, count - lead) + lead;
envelope_run = run - 1;
av_assert0(samples + envelope_run * stride <= samples_end);
if (envelope_run) {
gain[0] = hdcd_envelope(samples, envelope_run, stride, gain[0], ctx->val_target_gain, peak_extend[0]);
gain[1] = hdcd_envelope(samples + 1, envelope_run, stride, gain[1], ctx->val_target_gain, peak_extend[1]);
}
samples += envelope_run * stride;
count -= envelope_run;
lead = run - envelope_run;
hdcd_control_stereo(ctx, &peak_extend[0], &peak_extend[1]);
}
if (lead > 0) {
av_assert0(samples + lead * stride <= samples_end);
gain[0] = hdcd_envelope(samples, lead, stride, gain[0], ctx->val_target_gain, peak_extend[0]);
gain[1] = hdcd_envelope(samples + 1, lead, stride, gain[1], ctx->val_target_gain, peak_extend[1]);
}
ctx->state[0].running_gain = gain[0];
ctx->state[1].running_gain = gain[1];
}
static int filter_frame(AVFilterLink *inlink, AVFrame *in) static int filter_frame(AVFilterLink *inlink, AVFrame *in)
{ {
@ -1188,7 +1373,6 @@ static int filter_frame(AVFilterLink *inlink, AVFrame *in)
const int16_t *in_data; const int16_t *in_data;
int32_t *out_data; int32_t *out_data;
int n, c; int n, c;
int detect, packets, pe_packets;
out = ff_get_audio_buffer(outlink, in->nb_samples); out = ff_get_audio_buffer(outlink, in->nb_samples);
if (!out) { if (!out) {
@ -1204,35 +1388,60 @@ static int filter_frame(AVFilterLink *inlink, AVFrame *in)
out_data[n] = in_data[n]; out_data[n] = in_data[n];
} }
detect = 0; s->det_errors = 0; /* re-sum every pass */
packets = 0; if (s->process_stereo && inlink->channels == 2) {
pe_packets = 0; float mga = 0.0;
s->det_errors = 0; hdcd_process_stereo(s, out_data, in->nb_samples);
for (c = 0; c < inlink->channels; c++) { /* HDCD is detected if a valid packet is active in both
hdcd_state_t *state = &s->state[c]; * channels at the same time. */
hdcd_process(s, state, out_data + c, in->nb_samples, out->channels); if (s->state[0].sustain && s->state[1].sustain) s->hdcd_detected = 1;
if (state->sustain) detect++; if (s->state[0].count_peak_extend || s->state[1].count_peak_extend) {
packets += state->code_counterA + state->code_counterB; int packets = s->state[0].code_counterA
pe_packets += state->count_peak_extend; + s->state[0].code_counterB
s->uses_transient_filter |= !!state->count_transient_filter; + s->state[1].code_counterA
s->max_gain_adjustment = FFMIN(s->max_gain_adjustment, GAINTOFLOAT(state->max_gain)); + s->state[1].code_counterB;
s->det_errors += state->code_counterA_almost /* if every valid packet has used PE, call it permanent */
+ state->code_counterB_checkfails if (packets == s->state[0].count_peak_extend + s->state[1].count_peak_extend)
+ state->code_counterC_unmatched; s->peak_extend = HDCD_PE_PERMANENT;
} else
if (pe_packets) { s->peak_extend = HDCD_PE_INTERMITTENT;
/* if every valid packet has used PE, call it permanent */ } else s->peak_extend = HDCD_PE_NEVER;
if (packets == pe_packets) s->uses_transient_filter = (s->state[0].count_transient_filter || s->state[1].count_transient_filter);
s->peak_extend = HDCD_PE_PERMANENT; mga = FFMIN(GAINTOFLOAT(s->state[0].max_gain), GAINTOFLOAT(s->state[1].max_gain));
else s->max_gain_adjustment = FFMIN(s->max_gain_adjustment, mga);
s->peak_extend = HDCD_PE_INTERMITTENT; s->det_errors += s->state[0].code_counterA_almost
+ s->state[0].code_counterB_checkfails
+ s->state[0].code_counterC_unmatched
+ s->state[1].code_counterA_almost
+ s->state[1].code_counterB_checkfails
+ s->state[1].code_counterC_unmatched;
} else { } else {
s->peak_extend = HDCD_PE_NEVER; int detect=0;
int packets=0;
int pe_packets=0;
for (c = 0; c < inlink->channels; c++) {
hdcd_state_t *state = &s->state[c];
hdcd_process(s, state, out_data + c, in->nb_samples, out->channels);
if (state->sustain) detect++;
packets += state->code_counterA + state->code_counterB;
pe_packets += state->count_peak_extend;
s->uses_transient_filter |= !!(state->count_transient_filter);
s->max_gain_adjustment = FFMIN(s->max_gain_adjustment, GAINTOFLOAT(state->max_gain));
s->det_errors += state->code_counterA_almost
+ state->code_counterB_checkfails
+ state->code_counterC_unmatched;
}
if (pe_packets) {
/* if every valid packet has used PE, call it permanent */
if (packets == pe_packets)
s->peak_extend = HDCD_PE_PERMANENT;
else
s->peak_extend = HDCD_PE_INTERMITTENT;
} else s->peak_extend = HDCD_PE_NEVER;
/* HDCD is detected if a valid packet is active in all
* channels at the same time. */
if (detect == inlink->channels) s->hdcd_detected = 1;
} }
/* HDCD is detected if a valid packet is active in all (both)
* channels at the same time. */
if (detect == inlink->channels) s->hdcd_detected = 1;
s->sample_count += in->nb_samples * in->channels; s->sample_count += in->nb_samples * in->channels;
av_frame_free(&in); av_frame_free(&in);
@ -1291,7 +1500,7 @@ static av_cold void uninit(AVFilterContext *ctx)
int i, j; int i, j;
/* dump the state for each channel for AV_LOG_VERBOSE */ /* dump the state for each channel for AV_LOG_VERBOSE */
for (i = 0; i < 2; i++) { for (i = 0; i < HDCD_MAX_CHANNELS; i++) {
hdcd_state_t *state = &s->state[i]; hdcd_state_t *state = &s->state[i];
av_log(ctx, AV_LOG_VERBOSE, "Channel %d: counter A: %d, B: %d, C: %d\n", i, av_log(ctx, AV_LOG_VERBOSE, "Channel %d: counter A: %d, B: %d, C: %d\n", i,
state->code_counterA, state->code_counterB, state->code_counterC); state->code_counterA, state->code_counterB, state->code_counterC);
@ -1330,10 +1539,12 @@ static av_cold int init(AVFilterContext *ctx)
s->sample_count = 0; s->sample_count = 0;
s->fctx = ctx; s->fctx = ctx;
for (c = 0; c < 2; c++) { for (c = 0; c < HDCD_MAX_CHANNELS; c++) {
hdcd_reset(&s->state[c], 44100); hdcd_reset(&s->state[c], 44100);
} }
av_log(ctx, AV_LOG_VERBOSE, "Process mode: %s\n",
(s->process_stereo) ? "process stereo channels together" : "process each channel separately");
av_log(ctx, AV_LOG_VERBOSE, "Force PE: %s\n", av_log(ctx, AV_LOG_VERBOSE, "Force PE: %s\n",
(s->force_pe) ? "on" : "off"); (s->force_pe) ? "on" : "off");