2017-01-24 16:34:29 +01:00
|
|
|
/*
|
|
|
|
* SCC subtitle demuxer
|
|
|
|
* Copyright (c) 2017 Paul B Mahol
|
|
|
|
*
|
|
|
|
* This file is part of FFmpeg.
|
|
|
|
*
|
|
|
|
* FFmpeg is free software; you can redistribute it and/or
|
|
|
|
* modify it under the terms of the GNU Lesser General Public
|
|
|
|
* License as published by the Free Software Foundation; either
|
|
|
|
* version 2.1 of the License, or (at your option) any later version.
|
|
|
|
*
|
|
|
|
* FFmpeg is distributed in the hope that it will be useful,
|
|
|
|
* but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
|
|
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
|
|
|
|
* Lesser General Public License for more details.
|
|
|
|
*
|
|
|
|
* You should have received a copy of the GNU Lesser General Public
|
|
|
|
* License along with FFmpeg; if not, write to the Free Software
|
|
|
|
* Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
|
|
|
|
*/
|
|
|
|
|
|
|
|
#include "avformat.h"
|
2024-02-10 15:50:43 +01:00
|
|
|
#include "demux.h"
|
2017-01-24 16:34:29 +01:00
|
|
|
#include "internal.h"
|
|
|
|
#include "subtitles.h"
|
2020-02-04 20:37:26 +01:00
|
|
|
#include "libavutil/avstring.h"
|
2017-01-24 16:34:29 +01:00
|
|
|
#include "libavutil/intreadwrite.h"
|
|
|
|
|
|
|
|
typedef struct SCCContext {
|
|
|
|
FFDemuxSubtitlesQueue q;
|
|
|
|
} SCCContext;
|
|
|
|
|
2019-03-21 01:18:37 +01:00
|
|
|
static int scc_probe(const AVProbeData *p)
|
2017-01-24 16:34:29 +01:00
|
|
|
{
|
2017-01-28 17:23:31 +01:00
|
|
|
char buf[18];
|
2017-01-24 16:34:29 +01:00
|
|
|
FFTextReader tr;
|
|
|
|
|
|
|
|
ff_text_init_buf(&tr, p->buf, p->buf_size);
|
|
|
|
|
|
|
|
while (ff_text_peek_r8(&tr) == '\r' || ff_text_peek_r8(&tr) == '\n')
|
|
|
|
ff_text_r8(&tr);
|
|
|
|
|
2017-01-28 17:23:31 +01:00
|
|
|
ff_text_read(&tr, buf, sizeof(buf));
|
2017-01-24 16:34:29 +01:00
|
|
|
|
|
|
|
if (!memcmp(buf, "Scenarist_SCC V1.0", 18))
|
|
|
|
return AVPROBE_SCORE_MAX;
|
|
|
|
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
|
|
|
/**
 * Turn one ASCII hexadecimal digit into its numeric value.
 *
 * Characters from 'a' upwards are treated as lowercase hex letters,
 * characters from 'A' upwards as uppercase hex letters, and everything
 * else as a decimal digit.  No validation is done: the subtraction is
 * carried out modulo 256, so non-hex input yields an arbitrary byte value.
 *
 * @param x ASCII character to decode
 * @return decoded value (0..15 for valid hex digits)
 */
static int convert(uint8_t x)
{
    uint8_t base;

    if (x >= 'a')
        base = 'a' - 10;
    else if (x >= 'A')
        base = 'A' - 10;
    else
        base = '0';

    /* Cast keeps the 8-bit wraparound of the in-place subtraction. */
    return (uint8_t)(x - base);
}
|
|
|
|
|
|
|
|
/**
 * Read the whole SCC file and queue one or more packets per caption line.
 *
 * A usable line starts with a timecode "HH:MM:SS:FF" (the last separator
 * may be ':' or ';') followed by space-separated groups of four hex digits.
 * Each group is decoded into two bytes and stored in the packet as the
 * triplet { 0xfc, byte1, byte2 }.
 *
 * The duration of a packet is fixed up once the timecode of the following
 * line is known; the last packet keeps its default duration.
 *
 * @param s demuxer context; s->priv_data is the SCCContext
 * @return 0 on success, AVERROR(ENOMEM) if the stream or a packet could
 *         not be allocated
 */
static int scc_read_header(AVFormatContext *s)
{
    SCCContext *scc = s->priv_data;
    AVStream *st = avformat_new_stream(s, NULL);
    AVPacket *sub = NULL;
    ptrdiff_t len;
    uint8_t out[4096];
    FFTextReader tr;

    ff_text_init_avio(s, &tr, s->pb);

    if (!st)
        return AVERROR(ENOMEM);
    avpriv_set_pts_info(st, 64, 1, 1000);
    st->codecpar->codec_type = AVMEDIA_TYPE_SUBTITLE;
    st->codecpar->codec_id   = AV_CODEC_ID_EIA_608;

    while (1) {
        char *saveptr = NULL, *lline;
        int hh, mm, ss, fs, i;
        char line[4096];
        int64_t pos, ts;

        /* Remember where this line starts before consuming it. */
        pos = ff_text_pos(&tr);
        len = ff_subtitles_read_line(&tr, line, sizeof(line));
        if (len <= 13) {
            /* Too short to hold a timecode plus data: stop at EOF, else skip. */
            if (ff_text_eof(&tr))
                break;
            continue;
        }
        if (av_sscanf(line, "%d:%d:%d%*[:;]%d", &hh, &mm, &ss, &fs) != 4)
            continue;

        /* Milliseconds; every frame is counted as 33 ms. */
        ts = (hh * 3600LL + mm * 60LL + ss) * 1000LL + fs * 33LL;
        /* The previous packet lasts until this line begins. */
        if (sub)
            sub->duration = ts - sub->pts;

        /* Skip the 12 bytes taken to be the timecode and its separator. */
        lline = line;
        lline += 12;

        for (i = 0; i < 4095; i += 3) {
            char *ptr = av_strtok(lline, " ", &saveptr);
            char c1, c2, c3, c4;
            uint8_t o1, o2;

            if (!ptr)
                break;

            if (av_sscanf(ptr, "%c%c%c%c", &c1, &c2, &c3, &c4) != 4)
                break;
            o1 = convert(c2) | (convert(c1) << 4);
            o2 = convert(c4) | (convert(c3) << 4);

            /* Subsequent av_strtok() calls continue from saveptr. */
            lline = NULL;

            /*
             * Split the line into several packets when a 0x9420 code
             * (Resume Caption Loading in CEA-608) shows up after the first
             * few codes, unless the token right after it is 0x942f (End Of
             * Caption).  The operator between the two comparisons must be
             * "||": with "&&" the "942f" comparison is dead code and the
             * split only happens when "942c" follows, which misses the
             * common doubled "9420 9420" sequence.
             */
            if (i > 12 && o1 == 0x94 && o2 == 0x20 && saveptr &&
                (av_strncasecmp(saveptr, "942f", 4) ||
                 !av_strncasecmp(saveptr, "942c", 4))) {

                sub = ff_subtitles_queue_insert(&scc->q, out, i, 0);
                if (!sub)
                    return AVERROR(ENOMEM);

                sub->pos = pos;
                pos += i;
                sub->pts = ts;
                /* Provisional timing: 11 ms per payload byte emitted. */
                sub->duration = i * 11;
                ts += sub->duration;
                /* Restart the output buffer; the current code opens it. */
                i = 0;
            }

            out[i+0] = 0xfc;
            out[i+1] = o1;
            out[i+2] = o2;
        }

        sub = ff_subtitles_queue_insert(&scc->q, out, i, 0);
        if (!sub)
            return AVERROR(ENOMEM);

        sub->pos = pos;
        sub->pts = ts;
    }

    ff_subtitles_queue_finalize(s, &scc->q);

    return 0;
}
|
|
|
|
|
2024-02-10 15:50:43 +01:00
|
|
|
const FFInputFormat ff_scc_demuxer = {
|
|
|
|
.p.name = "scc",
|
|
|
|
.p.long_name = NULL_IF_CONFIG_SMALL("Scenarist Closed Captions"),
|
|
|
|
.p.extensions = "scc",
|
2017-01-24 16:34:29 +01:00
|
|
|
.priv_data_size = sizeof(SCCContext),
|
2020-03-21 18:31:06 +01:00
|
|
|
.flags_internal = FF_FMT_INIT_CLEANUP,
|
2017-01-24 16:34:29 +01:00
|
|
|
.read_probe = scc_probe,
|
|
|
|
.read_header = scc_read_header,
|
2021-07-08 23:05:08 +02:00
|
|
|
.read_packet = ff_subtitles_read_packet,
|
|
|
|
.read_seek2 = ff_subtitles_read_seek,
|
|
|
|
.read_close = ff_subtitles_read_close,
|
2017-01-24 16:34:29 +01:00
|
|
|
};
|