On 01/03/2015 01:42 AM, Michael Niedermayer wrote:
> On Wed, Dec 31, 2014 at 07:09:33PM +0530, Anshul wrote:
> [...]
>
>> +static void build_parity_table(int *parity_table)
>> +{
>> + unsigned int byte;
>> + int parity_v;
>> + for (byte = 0; byte <= 127; byte++) {
>> + parity_v = av_popcount(byte) & 1;
>> + parity_table[byte] = parity_v;
>> + parity_table[byte | 0x80] = !parity_v;
>> + }
>> +}
> This should not be needed, av_popcount(byte) & 1 could be used
> directly or you could use something like this: (untested)
> (0x6996 >> ((byte ^ (byte>>4)) & 15)) & 1
>
> the code using the parity stuff does not seem speed critical
> but maybe I am missing something?
Parity is checked for each byte of closed caption data, so I thought
it would be speed critical. Only 7 bits of each byte carry data; 1 bit is
for parity.
> [...]
>
>> +static void handle_pac( CCaptionSubContext *ctx, uint8_t hi, uint8_t lo )
>> +{
>> + static const uint8_t row_map[] = {
>> + 11, -1, 1, 2, 3, 4, 12, 13, 14, 15, 5, 6, 7, 8, 9, 10
>> + };
> you are having negative values in a unsigned 8bit table
> i assume either of these is not intended
done, -1 was needed.
changed uint8_t to int8_t
>
> [...]
>> +static int process_cc608(CCaptionSubContext *ctx, int64_t pts, uint8_t hi,
>> uint8_t lo)
>> +{
>> + int ret = 0;
>> +#define COR3(var, with1, with2, with3) ( (var) == (with1) || (var) ==
>> (with2) || (var) == (with3) )
>> + if ( hi == ctx->prev_cmd[0] && lo == ctx->prev_cmd[1]) {
>> + /* ignore redundant command */
>> + } else if ( (hi == 0x10 && (lo >= 0x40 || lo <= 0x5f)) ||
>> + ( (hi >= 0x11 && hi <= 0x17) && (lo >= 0x40 && lo <= 0x7f) )
>> ) {
>> + handle_pac(ctx, hi, lo);
>> + } else if ( COR3(hi, 0x14, 0x15, 0x1C) && lo == 0x20 ) {
>> + /* resume caption loading */
>> + ctx->mode = CCMODE_POPON;
>> + } else if ( COR3(hi, 0x14, 0x15, 0x1C) && lo == 0x25 ) {
>> + ctx->rollup = 2;
>> + } else if ( COR3(hi, 0x14, 0x15, 0x1C) && lo == 0x26 ) {
>> + ctx->rollup = 3;
>> + } else if ( COR3(hi, 0x14, 0x15, 0x1C) && lo == 0x27 ) {
>> + ctx->rollup = 4;
>> + } else if ( COR3(hi, 0x14, 0x15, 0x1C) && lo == 0x29 ) {
>> + /* resume direct captioning */
>> + ctx->mode = CCMODE_PAINTON;
>> + } else if ( COR3(hi, 0x14, 0x15, 0x1C) && lo == 0x2C ) {
>> + /* erase display memory */
>> + ret = handle_edm(ctx, pts);
>> + } else if ( COR3(hi, 0x14, 0x15, 0x1C) && lo == 0x2D ) {
>> + /* carriage return */
>> + av_log(ctx, AV_LOG_DEBUG,"cdp (handle cr)\n");
>> + ctx->row_cnt++;
>> + if(ctx->row_cnt == ctx->rollup) {
>> + ctx->row_cnt = 0;
>> + ret = handle_edm(ctx, pts);
>> + ctx->active_screen = !ctx->active_screen;
>> + }
>> + } else if ( COR3(hi, 0x14, 0x15, 0x1C) && lo == 0x2F ) {
>> + /* end of caption */
>> + ret = handle_eoc(ctx, pts);
>> + } else if (hi>=0x20) {
>> + /* Standard characters (always in pairs) */
>> + handle_char(ctx, hi, lo, pts);
>> + } else {
>> + /* Ignoring all other non data code */
>> + }
>> +
>> + /* set prev command */
>> + ctx->prev_cmd[0] = hi;
>> + ctx->prev_cmd[1] = lo;
>> +
>> +#undef COR3
>> + return ret;
>> +
>> +}
>> +static int decode(AVCodecContext *avctx, void *data, int *got_sub, AVPacket
>> *avpkt)
>> +{
>> + CCaptionSubContext *ctx = avctx->priv_data;
>> + AVSubtitle *sub = data;
>> + uint8_t *bptr = avpkt->data;
> The input packets data is read only unless you do something
> (dup/memcpy/whatever) so this should be const
Copied the data into an AVBufferRef.
>
>> + int len = avpkt->size;
>> + int ret = 0;
>> + int i;
>> +
>> + for (i = 0; i < len; i += 3) {
>> + uint8_t cc_type = *(bptr + i) & 3;
>> + if (validate_cc_data_pair( bptr + i, ctx->parity_table ) )
>> + continue;
>> + /* ignoring data field 1 */
>> + if(cc_type == 1)
>> + continue;
>> + else
>> + process_cc608(ctx, avpkt->pts, *(bptr + i + 1), *(bptr + i +
>> 2));
>> + }
>> + if(ctx->erase_display_memory && *ctx->buffer.str)
>> + {
>> + int start_time = av_rescale_q(ctx->start_time, avctx->time_base,
>> (AVRational){ 1, 100 });
>> + int end_time = av_rescale_q(ctx->end_time, avctx->time_base,
>> (AVRational){ 1, 100 });
>> + av_log(ctx, AV_LOG_DEBUG,"cdp writing data (%s)\n",ctx->buffer.str);
> tabs; also there are a lot of debug av_logs in the code, it might make
> sense to remove or disable these before it's pushed
I have removed most of the logs and disabled the others.
I have attached 2 patches: the first is the improved version of this patch,
the other is info regarding the first one.
-Anshul
>From 17a564409b84fc18293833cc3f2151792209bb8b Mon Sep 17 00:00:00 2001
From: Anshul Maheshwari <[email protected]>
Date: Sat, 3 Jan 2015 12:40:35 +0530
Subject: [PATCH 1/2] Adding Closed caption Support
Signed-off-by: Anshul Maheshwari <[email protected]>
To test closed captions, use the following command:
./ffmpeg -f lavfi -i "movie=/home/a141982112/test_videos/Starship_Troopers.vob[out0+subcc]" -map s some.srt
---
libavcodec/Makefile | 1 +
libavcodec/allcodecs.c | 1 +
libavcodec/ccaption_dec.c | 361 ++++++++++++++++++++++++++++++++++++++++++++++
3 files changed, 363 insertions(+)
create mode 100644 libavcodec/ccaption_dec.c
diff --git a/libavcodec/Makefile b/libavcodec/Makefile
index 107661b..33051c4 100644
--- a/libavcodec/Makefile
+++ b/libavcodec/Makefile
@@ -173,6 +173,7 @@ OBJS-$(CONFIG_BRENDER_PIX_DECODER) += brenderpix.o
OBJS-$(CONFIG_C93_DECODER) += c93.o
OBJS-$(CONFIG_CAVS_DECODER) += cavs.o cavsdec.o cavsdsp.o \
cavsdata.o mpeg12data.o
+OBJS-$(CONFIG_CCAPTION_DECODER) += ccaption_dec.o
OBJS-$(CONFIG_CDGRAPHICS_DECODER) += cdgraphics.o
OBJS-$(CONFIG_CDXL_DECODER) += cdxl.o
OBJS-$(CONFIG_CINEPAK_DECODER) += cinepak.o
diff --git a/libavcodec/allcodecs.c b/libavcodec/allcodecs.c
index 8ceee2f..ef77dec 100644
--- a/libavcodec/allcodecs.c
+++ b/libavcodec/allcodecs.c
@@ -481,6 +481,7 @@ void avcodec_register_all(void)
/* subtitles */
REGISTER_ENCDEC (SSA, ssa);
REGISTER_ENCDEC (ASS, ass);
+ REGISTER_DECODER(CCAPTION, ccaption);
REGISTER_ENCDEC (DVBSUB, dvbsub);
REGISTER_ENCDEC (DVDSUB, dvdsub);
REGISTER_DECODER(JACOSUB, jacosub);
diff --git a/libavcodec/ccaption_dec.c b/libavcodec/ccaption_dec.c
new file mode 100644
index 0000000..d351efe
--- /dev/null
+++ b/libavcodec/ccaption_dec.c
@@ -0,0 +1,361 @@
+/*
+ * Closed Caption Decoding
+ * Copyright (c) 2014 Anshul Maheshwari
+ *
+ * This file is part of FFmpeg.
+ *
+ * FFmpeg is free software; you can redistribute it and/or
+ * modify it under the terms of the GNU Lesser General Public
+ * License as published by the Free Software Foundation; either
+ * version 2.1 of the License, or (at your option) any later version.
+ *
+ * FFmpeg is distributed in the hope that it will be useful,
+ * but WITHOUT ANY WARRANTY; without even the implied warranty of
+ * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
+ * Lesser General Public License for more details.
+ *
+ * You should have received a copy of the GNU Lesser General Public
+ * License along with FFmpeg; if not, write to the Free Software
+ * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
+ */
+
+#include "avcodec.h"
+#include "ass.h"
+#include "libavutil/opt.h"
+
+/* Define CHAR_DEBUG to log every decoded character pair and emitted text. */
+#undef CHAR_DEBUG
+/* Dimensions of one caption screen buffer (see struct Screen). */
+#define SCREEN_ROWS 15
+#define SCREEN_COLUMNS 32
+
+/*
+ * Single-bit helpers: val is a bit index. For SET_FLAG/UNSET_FLAG var must
+ * be a modifiable lvalue; every argument is parenthesized so that compound
+ * expressions expand safely.
+ */
+#define SET_FLAG(var, val)   ( (var) |=  ( 1 << (val) ) )
+#define UNSET_FLAG(var, val) ( (var) &= ~( 1 << (val) ) )
+#define CHECK_FLAG(var, val) ( (var) &   ( 1 << (val) ) )
+
+/*
+ * Caption presentation mode. It decides which of the two screens receives
+ * newly decoded characters (see get_writing_screen()).
+ */
+enum cc_mode {
+    CCMODE_POPON = 0,   /* characters go to the inactive screen */
+    CCMODE_PAINTON,     /* characters go to the active screen */
+    CCMODE_ROLLUP_2,    /* characters go to the active screen */
+    CCMODE_ROLLUP_3,    /* characters go to the active screen */
+    CCMODE_ROLLUP_4,    /* characters go to the active screen */
+    CCMODE_TEXT,        /* characters go to the active screen */
+};
+
+struct Screen { /* one caption screen: text rows plus a bitmask of rows in use */
+ /* +1 leaves room for the terminating null character of each row string */
+ uint8_t characters[SCREEN_ROWS][SCREEN_COLUMNS+1];
+ /*
+ * Bitmask of used rows; if a bit is not set, the
+ * corresponding row is not used.
+ * for setting row 1 use row | (1 << 0)
+ * for setting row 15 use row | (1 << 14)
+ */
+ int16_t row_used;
+};
+
+
+typedef struct CCaptionSubContext { /* private decoder state (avctx->priv_data) */
+ AVClass *class; /* NOTE(review): presumably must stay the first member for av_log()/AVOptions - confirm */
+ int parity_table[256]; /* 1 for byte values with an odd number of set bits; filled by build_parity_table() */
+ int row_cnt; /* carriage returns counted since the last roll-up flush */
+ struct Screen screen[2]; /* the two screen buffers, selected through active_screen */
+ int active_screen; /* index (0 or 1) of the screen that handle_edm() flushes */
+ uint8_t cursor_row; /* row that handle_char() writes to, set by handle_pac() */
+ uint8_t cursor_column; /* column of the next character in cursor_row */
+ AVBPrint buffer; /* text collected by handle_edm() for the next subtitle rect */
+ int erase_display_memory; /* set by handle_edm(); decode() emits buffer and clears it */
+ int rollup; /* carriage-return count that triggers a flush (2, 3 or 4) */
+ enum cc_mode mode; /* current caption mode, see get_writing_screen() */
+ int64_t start_time; /* start time of the text being emitted, in avctx->time_base units */
+ /* visible screen time */
+ int64_t startv_time;
+ int64_t end_time; /* pts of the most recent flush */
+ char prev_cmd[2]; /* last processed byte pair, used to drop repeated commands */
+ /* buffer to store pkt data */
+ AVBufferRef *pktbuf;
+}CCaptionSubContext;
+
+/**
+ * Fill a 256-entry lookup table indexed by byte value: an entry is 1 when
+ * the byte has an odd number of set bits (including bit 7) and 0 otherwise.
+ *
+ * @param parity_table destination array with room for 256 ints
+ */
+static void build_parity_table(int *parity_table)
+{
+    unsigned int value;
+
+    for (value = 0; value < 256; value++)
+        parity_table[value] = av_popcount(value) & 1;
+}
+
+/**
+ * Set up the decoder state: parity lookup table, output text buffer, default
+ * roll-up depth, the default ASS subtitle header and the packet copy buffer.
+ *
+ * The header result is checked before the packet buffer is allocated, so a
+ * header failure does not leave a freshly allocated buffer behind.
+ *
+ * @return the result of ff_ass_subtitle_header_default() on success,
+ *         a negative AVERROR code on failure
+ */
+static av_cold int init_decoder(AVCodecContext *avctx)
+{
+    CCaptionSubContext *ctx = avctx->priv_data;
+    int ret;
+
+    build_parity_table(ctx->parity_table);
+    av_bprint_init(&ctx->buffer, 0, AV_BPRINT_SIZE_UNLIMITED);
+    /* taking by default roll up to 2 */
+    ctx->rollup = 2;
+
+    ret = ff_ass_subtitle_header_default(avctx);
+    if (ret < 0)
+        return ret;
+
+    /* allocate pkt buffer; decode() enlarges it when a packet is bigger */
+    ctx->pktbuf = av_buffer_alloc(128);
+    if (!ctx->pktbuf)
+        return AVERROR(ENOMEM);
+
+    return ret;
+}
+
+/**
+ * Release the resources owned by the decoder context: the output text
+ * buffer and the packet copy buffer.
+ *
+ * @return always 0
+ */
+static av_cold int close_decoder(AVCodecContext *avctx)
+{
+    CCaptionSubContext *priv = avctx->priv_data;
+
+    av_bprint_finalize(&priv->buffer, NULL);
+    av_buffer_unref(&priv->pktbuf);
+
+    return 0;
+}
+
+/**
+ * Check one 3-byte cc_data triplet and strip the parity bits of its payload.
+ *
+ * Byte 0 holds cc_valid (bit 2) and cc_type (bits 0-1); bytes 1 and 2 are
+ * the payload. The triplet is modified in place: a first payload byte that
+ * fails parity is replaced by 0x7F, and on success bit 7 of both payload
+ * bytes is cleared.
+ *
+ * @param cc_data_pair pointer to the 3 bytes of the triplet (writable)
+ * @param parity_table table built by build_parity_table()
+ * @return 0 if the pair should be processed, AVERROR_INVALIDDATA if it is
+ *         flagged invalid or its second payload byte fails parity,
+ *         AVERROR_PATCHWELCOME for non-data pairs and for cc_type 2/3
+ */
+static int validate_cc_data_pair (uint8_t *cc_data_pair, int *parity_table)
+{
+    const uint8_t header  = cc_data_pair[0];
+    const int     is_608  = (header & 3) < 2;   /* cc_type 0 or 1 */
+
+    if (!(header & 4))
+        return AVERROR_INVALIDDATA;
+
+    /* only EIA-608 payload carries a parity bit to verify */
+    if (is_608) {
+        /* a broken second byte invalidates the whole pair */
+        if (!parity_table[cc_data_pair[2]])
+            return AVERROR_INVALIDDATA;
+        /* a broken first byte is replaced by a solid blank, the pair is kept */
+        if (!parity_table[cc_data_pair[1]])
+            cc_data_pair[1] = 0x7F;
+    }
+
+    /* skip non-data: known header byte with both payload bytes empty */
+    if ((header == 0xFA || header == 0xFC || header == 0xFD) &&
+        !((cc_data_pair[1] | cc_data_pair[2]) & 0x7F))
+        return AVERROR_PATCHWELCOME;
+
+    /* skip 708 data */
+    if (!is_608)
+        return AVERROR_PATCHWELCOME;
+
+    /* remove parity bit */
+    cc_data_pair[1] &= 0x7F;
+    cc_data_pair[2] &= 0x7F;
+
+    return 0;
+}
+/**
+ * Handle a preamble address code: move the cursor to the start of the row
+ * selected by the byte pair. Pairs that map to no row leave the cursor
+ * untouched.
+ *
+ * @param hi first byte of the pair (low three bits select the row group)
+ * @param lo second byte of the pair (bit 5 selects the row inside the group)
+ */
+static void handle_pac( CCaptionSubContext *ctx, uint8_t hi, uint8_t lo )
+{
+    /* 1-based row number per code; -1 marks a code without a row */
+    static const int8_t row_map[] = {
+        11, -1, 1, 2, 3, 4, 12, 13, 14, 15, 5, 6, 7, 8, 9, 10
+    };
+    const int8_t row = row_map[ ((hi << 1) & 0x0e) | ((lo >> 5) & 0x01) ];
+
+    if (row > 0) {
+        /* cursor_row is 0-based */
+        ctx->cursor_row    = row - 1;
+        ctx->cursor_column = 0;
+    }
+}
+
+/**
+ * Flush the active screen into the output text buffer.
+ *
+ * Every row flagged as used is appended to ctx->buffer, followed by the two
+ * characters backslash and 'N', and its used flag is cleared. The start time
+ * of the flushed text is the time of the previous flush; pts becomes both
+ * the end time and the start time for the next flush.
+ *
+ * @param pts it is required to set end time
+ * @return 0 on success, AVERROR(ENOMEM) if the text buffer was truncated
+ */
+static int handle_edm(CCaptionSubContext *ctx,int64_t pts)
+{
+    int i;
+    int ret = 0;
+    struct Screen *screen = ctx->screen + ctx->active_screen;
+
+    ctx->start_time = ctx->startv_time;
+    /* stop early once no used row is left */
+    for (i = 0; screen->row_used && i < SCREEN_ROWS; i++) {
+        if (!CHECK_FLAG(screen->row_used, i))
+            continue;
+
+        av_bprint_append_data(&ctx->buffer, screen->characters[i], strlen(screen->characters[i]));
+        av_bprint_append_data(&ctx->buffer, "\\N",2);
+        UNSET_FLAG(screen->row_used, i);
+        /*
+         * av_bprint_is_complete() is non-zero while nothing was truncated,
+         * so only a zero result signals an allocation failure.
+         */
+        if (!av_bprint_is_complete(&ctx->buffer)) {
+            ret = AVERROR(ENOMEM);
+            break;
+        }
+    }
+    ctx->startv_time = pts;
+    ctx->erase_display_memory = 1;
+    ctx->end_time = pts;
+    return ret;
+}
+/**
+ * Handle "end of caption": flush the active screen through handle_edm()
+ * and then swap the active and inactive screens.
+ *
+ * @param pts passed on to handle_edm()
+ * @return the result of handle_edm()
+ */
+static int handle_eoc(CCaptionSubContext *ctx, int64_t pts)
+{
+    const int flush_result = handle_edm(ctx, pts);
+
+    ctx->active_screen = !ctx->active_screen;
+
+    return flush_result;
+}
+/**
+ * Select the screen that receives new characters in the current mode:
+ * the inactive screen in pop-on mode, the active screen in all other modes.
+ *
+ * @return the screen to write to, or NULL if ctx->mode holds no known value
+ */
+static struct Screen *get_writing_screen(CCaptionSubContext *ctx)
+{
+    int index;
+
+    switch (ctx->mode) {
+    case CCMODE_POPON:
+        // use Inactive screen
+        index = !ctx->active_screen;
+        break;
+    case CCMODE_PAINTON:
+    case CCMODE_ROLLUP_2:
+    case CCMODE_ROLLUP_3:
+    case CCMODE_ROLLUP_4:
+    case CCMODE_TEXT:
+        // use active screen
+        index = ctx->active_screen;
+        break;
+    default:
+        /* It was never an option */
+        return NULL;
+    }
+
+    return &ctx->screen[index];
+}
+/**
+ * Store a pair of characters at the cursor position of the writing screen.
+ *
+ * The row is marked as used and kept null terminated. Characters that would
+ * not fit into the SCREEN_COLUMNS columns of the row are dropped instead of
+ * being written past the end of the row buffer.
+ *
+ * @param hi  first character of the pair
+ * @param lo  second character of the pair; 0 means there is none
+ * @param pts unused
+ */
+static void handle_char(CCaptionSubContext *ctx, char hi, char lo, int64_t pts)
+{
+    struct Screen *screen = get_writing_screen(ctx);
+    char *row;
+
+    /* no screen for the current mode: nothing to write to */
+    if (!screen)
+        return;
+
+    row = (char *)screen->characters[ctx->cursor_row];
+
+    SET_FLAG(screen->row_used,ctx->cursor_row);
+
+    if (ctx->cursor_column < SCREEN_COLUMNS)
+        row[ctx->cursor_column++] = hi;
+    if (lo && ctx->cursor_column < SCREEN_COLUMNS)
+        row[ctx->cursor_column++] = lo;
+    /* cursor_column is at most SCREEN_COLUMNS here; the row has one extra byte */
+    row[ctx->cursor_column] = 0;
+
+    /* reset prev command since character can repeat */
+    ctx->prev_cmd[0] = 0;
+    ctx->prev_cmd[1] = 0;
+#ifdef CHAR_DEBUG
+    av_log(ctx, AV_LOG_DEBUG,"(%c,%c)\n",hi,lo);
+#endif
+}
+/**
+ * Interpret one parity-stripped EIA-608 byte pair.
+ *
+ * A pair identical to the previously recorded one is ignored. Otherwise the
+ * pair is dispatched as a preamble address code, as one of the handled
+ * control codes (first byte 0x14, 0x15 or 0x1C), or as a pair of characters
+ * (first byte >= 0x20); everything else is ignored.
+ *
+ * @param pts timestamp handed to the flush handlers
+ * @param hi  first byte of the pair
+ * @param lo  second byte of the pair
+ * @return 0, or the result of the flush handler that was run
+ */
+static int process_cc608(CCaptionSubContext *ctx, int64_t pts, uint8_t hi, uint8_t lo)
+{
+    const int is_ctrl = hi == 0x14 || hi == 0x15 || hi == 0x1C;
+    int ret = 0;
+
+    if (hi == ctx->prev_cmd[0] && lo == ctx->prev_cmd[1]) {
+        /* ignore redundant command */
+        return 0;
+    }
+
+    /*
+     * set prev command; done before dispatching so that handle_char() can
+     * clear it again, which keeps repeated character pairs from being
+     * mistaken for redundant commands
+     */
+    ctx->prev_cmd[0] = hi;
+    ctx->prev_cmd[1] = lo;
+
+    if ((hi == 0x10 && (lo >= 0x40 && lo <= 0x5f)) ||
+        ((hi >= 0x11 && hi <= 0x17) && (lo >= 0x40 && lo <= 0x7f))) {
+        handle_pac(ctx, hi, lo);
+    } else if (is_ctrl) {
+        switch (lo) {
+        case 0x20:
+            /* resume caption loading */
+            ctx->mode = CCMODE_POPON;
+            break;
+        case 0x25:
+            ctx->rollup = 2;
+            break;
+        case 0x26:
+            ctx->rollup = 3;
+            break;
+        case 0x27:
+            ctx->rollup = 4;
+            break;
+        case 0x29:
+            /* resume direct captioning */
+            ctx->mode = CCMODE_PAINTON;
+            break;
+        case 0x2C:
+            /* erase display memory */
+            ret = handle_edm(ctx, pts);
+            break;
+        case 0x2D:
+            /* carriage return */
+            ctx->row_cnt++;
+            if (ctx->row_cnt == ctx->rollup) {
+                ctx->row_cnt = 0;
+                ret = handle_edm(ctx, pts);
+                ctx->active_screen = !ctx->active_screen;
+            }
+            break;
+        case 0x2F:
+            /* end of caption */
+            ret = handle_eoc(ctx, pts);
+            break;
+        default:
+            /* Ignoring all other non data code */
+            break;
+        }
+    } else if (hi >= 0x20) {
+        /* Standard characters (always in pairs) */
+        handle_char(ctx, hi, lo, pts);
+    } else {
+        /* Ignoring all other non data code */
+    }
+
+    return ret;
+}
+/**
+ * Decode one packet of 3-byte cc_data triplets.
+ *
+ * The packet is copied into ctx->pktbuf because validation modifies the
+ * bytes. Each complete triplet is validated; triplets of cc_type 1 are
+ * skipped and the remaining valid ones are passed to process_cc608().
+ * When a flush has left text in ctx->buffer, it is emitted as one ASS rect.
+ *
+ * @param data    AVSubtitle that receives the output
+ * @param got_sub set to non-zero if the subtitle contains at least one rect
+ * @return 0 on success, a negative AVERROR code if adding the rect failed
+ */
+static int decode(AVCodecContext *avctx, void *data, int *got_sub, AVPacket *avpkt)
+{
+    CCaptionSubContext *ctx = avctx->priv_data;
+    AVSubtitle *sub = data;
+    uint8_t *bptr = NULL;
+    int len = avpkt->size;
+    int ret = 0;
+    int i;
+
+    if (ctx->pktbuf->size < len) {
+        ret = av_buffer_realloc(&ctx->pktbuf, len);
+        /* best effort: if the buffer cannot grow, decode what fits */
+        if (ret < 0)
+            len = ctx->pktbuf->size;
+    }
+    if (len > 0)
+        memcpy(ctx->pktbuf->data, avpkt->data, len);
+    bptr = ctx->pktbuf->data;
+
+    /* only complete triplets are read; trailing 1 or 2 bytes are ignored */
+    for (i = 0; i + 2 < len; i += 3) {
+        uint8_t cc_type = bptr[i] & 3;
+
+        if (validate_cc_data_pair(bptr + i, ctx->parity_table))
+            continue;
+        /* ignoring data field 1 */
+        if (cc_type == 1)
+            continue;
+        process_cc608(ctx, avpkt->pts, bptr[i + 1], bptr[i + 2]);
+    }
+
+    if (ctx->erase_display_memory && *ctx->buffer.str) {
+        /* ff_ass_add_rect() is given times in 1/100 second units */
+        int start_time = av_rescale_q(ctx->start_time, avctx->time_base, (AVRational){ 1, 100 });
+        int end_time   = av_rescale_q(ctx->end_time, avctx->time_base, (AVRational){ 1, 100 });
+#ifdef CHAR_DEBUG
+        av_log(ctx, AV_LOG_DEBUG,"cdp writing data (%s)\n",ctx->buffer.str);
+#endif
+        ret = ff_ass_add_rect(sub, ctx->buffer.str, start_time, end_time - start_time , 0);
+        if (ret < 0)
+            return ret;
+        sub->pts = av_rescale_q(ctx->start_time, avctx->time_base, AV_TIME_BASE_Q);
+        ctx->erase_display_memory = 0;
+        av_bprint_clear(&ctx->buffer);
+    }
+
+    *got_sub = sub->num_rects > 0;
+    return 0;
+}
+/* The decoder has no private options; the table holds only the terminator. */
+static const AVOption options[] = {
+    { NULL },
+};
+/* AVClass describing the private context; referenced by the codec below. */
+static const AVClass ccaption_dec_class = {
+    .version    = LIBAVUTIL_VERSION_INT,
+    .class_name = "Closed caption Decoder",
+    .item_name  = av_default_item_name,
+    .option     = options,
+};
+
+/* Codec registration entry for the closed caption subtitle decoder. */
+AVCodec ff_ccaption_decoder = {
+    .type           = AVMEDIA_TYPE_SUBTITLE,
+    .id             = AV_CODEC_ID_EIA_608,
+    .name           = "cc_dec",
+    .long_name      = NULL_IF_CONFIG_SMALL("Closed Caption (EIA-608 / CEA-708) Decoder"),
+    .priv_class     = &ccaption_dec_class,
+    .priv_data_size = sizeof(CCaptionSubContext),
+    .init           = init_decoder,
+    .decode         = decode,
+    .close          = close_decoder,
+};
--
1.8.1.4
>From e0c5ebb592d33c05446dcab019e5a2cb14185569 Mon Sep 17 00:00:00 2001
From: Anshul Maheshwari <[email protected]>
Date: Sat, 3 Jan 2015 12:48:37 +0530
Subject: [PATCH 2/2] Adding Closed caption accessories
Signed-off-by: Anshul Maheshwari <[email protected]>
---
Changelog | 1 +
MAINTAINERS | 1 +
libavcodec/version.h | 2 +-
3 files changed, 3 insertions(+), 1 deletion(-)
diff --git a/Changelog b/Changelog
index 37ce0f0..d4efd74 100644
--- a/Changelog
+++ b/Changelog
@@ -9,6 +9,7 @@ version <next>:
- RTP/mpegts muxer
- non continuous cache protocol support
- tblend filter
+- Closed caption Decoder
version 2.5:
diff --git a/MAINTAINERS b/MAINTAINERS
index 6e46280..13b211e 100644
--- a/MAINTAINERS
+++ b/MAINTAINERS
@@ -156,6 +156,7 @@ Codecs:
celp_filters.* Vitor Sessak
cinepak.c Roberto Togni
cinepakenc.c Rl / Aetey G.T. AB
+ ccaption_dec.c Anshul Maheshwari
cljr Alex Beregszaszi
cllc.c Derek Buitenhuis
cook.c, cookdata.h Benjamin Larsson
diff --git a/libavcodec/version.h b/libavcodec/version.h
index d8c891d..7e51f3b 100644
--- a/libavcodec/version.h
+++ b/libavcodec/version.h
@@ -29,7 +29,7 @@
#include "libavutil/version.h"
#define LIBAVCODEC_VERSION_MAJOR 56
-#define LIBAVCODEC_VERSION_MINOR 19
+#define LIBAVCODEC_VERSION_MINOR 20
#define LIBAVCODEC_VERSION_MICRO 100
#define LIBAVCODEC_VERSION_INT AV_VERSION_INT(LIBAVCODEC_VERSION_MAJOR, \
--
1.8.1.4
_______________________________________________
ffmpeg-devel mailing list
[email protected]
http://ffmpeg.org/mailman/listinfo/ffmpeg-devel