FFmpeg
jacosubdec.c
Go to the documentation of this file.
1 /*
2  * Copyright (c) 2012 Clément Bœsch
3  *
4  * This file is part of FFmpeg.
5  *
6  * FFmpeg is free software; you can redistribute it and/or
7  * modify it under the terms of the GNU Lesser General Public
8  * License as published by the Free Software Foundation; either
9  * version 2.1 of the License, or (at your option) any later version.
10  *
11  * FFmpeg is distributed in the hope that it will be useful,
12  * but WITHOUT ANY WARRANTY; without even the implied warranty of
13  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
14  * Lesser General Public License for more details.
15  *
16  * You should have received a copy of the GNU Lesser General Public
17  * License along with FFmpeg; if not, write to the Free Software
18  * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
19  */
20 
21 /**
22  * @file
23  * JACOsub subtitle demuxer
24  * @see http://unicorn.us.com/jacosub/jscripts.html
25  * @todo Support P[ALETTE] directive.
26  */
27 
28 #include "avformat.h"
29 #include "demux.h"
30 #include "internal.h"
31 #include "subtitles.h"
32 #include "libavcodec/jacosub.h"
33 #include "libavutil/avstring.h"
34 #include "libavutil/bprint.h"
35 #include "libavutil/intreadwrite.h"
36 
/* Demuxer private state.
 * NOTE(review): this extract is missing the subtitle queue member (used
 * elsewhere in the file as jacosub->q) and the closing line of the typedef. */
37 typedef struct {
/* script-wide offset, in timeres units, added to every timestamp by read_ts();
 * set from the first SHIFT directive seen while reading the header */
39  int shift;
/* number of timestamp units per second: read_ts() multiplies whole seconds by
 * it and divides by it when rescaling; defaults to 30, replaced by TIMERES */
40  unsigned timeres;
42 
/**
 * Tell whether a line starts with a JACOsub timing prefix followed by text.
 *
 * Two notations are accepted:
 *  - "H:MM:SS.FF H:MM:SS.FF text" (clock times)
 *  - "@start @end text" (frame numbers, start strictly before end)
 *
 * @param ptr NUL-terminated line, leading whitespace already skipped
 * @return non-zero if the line is a timed line, 0 otherwise
 */
static int timed_line(const char *ptr)
{
    int frame_start, frame_end;
    char first;

    /* clock notation: all eight numbers are matched but discarded, only the
     * presence of at least one text character after them matters */
    if (sscanf(ptr, "%*u:%*u:%*u.%*u %*u:%*u:%*u.%*u %c", &first) == 1)
        return 1;

    /* frame notation: both frame numbers and a text character are required */
    if (sscanf(ptr, "@%u @%u %c", &frame_start, &frame_end, &first) != 3)
        return 0;

    return frame_start < frame_end;
}
50 
51 static int jacosub_probe(const AVProbeData *p)
52 {
53  const char *ptr = p->buf;
54  const char *ptr_end = p->buf + p->buf_size;
55 
56  if (AV_RB24(ptr) == 0xEFBBBF)
57  ptr += 3; /* skip UTF-8 BOM */
58 
59  while (ptr < ptr_end) {
60  while (jss_whitespace(*ptr))
61  ptr++;
62  if (*ptr != '#' && *ptr != '\n') {
63  if (timed_line(ptr))
64  return AVPROBE_SCORE_EXTENSION + 1;
65  return 0;
66  }
67  ptr += ff_subtitles_next_line(ptr);
68  }
69  return 0;
70 }
71 
/**
 * JACOsub compiler directives, in alphabetical order.
 * No two entries share a first letter, which is what allows get_jss_cmd()
 * to identify a directive from its initial alone.
 */
static const char * const cmds[] = {
    "CLOCKPAUSE",
    "DIRECTIVE",
    "FONT",
    "HRES",
    "INCLUDE",
    "PALETTE",
    "QUANTIZE",
    "RAMP",
    "SHIFT",
    "TIMERES",
};

/**
 * Look up a directive by its first letter, ignoring ASCII case.
 *
 * @param k first character of the directive name
 * @return index into cmds[], or -1 if no directive starts with that letter
 */
static int get_jss_cmd(char k)
{
    const int nb_cmds = (int)(sizeof(cmds) / sizeof(cmds[0]));
    int idx = 0;

    /* ASCII-only upper-casing, independent of the current locale */
    if (k >= 'a' && k <= 'z')
        k = (char)(k - 'a' + 'A');

    while (idx < nb_cmds) {
        if (cmds[idx][0] == k)
            return idx;
        idx++;
    }
    return -1;
}
95 
96 static const char *read_ts(JACOsubContext *jacosub, const char *buf,
97  int64_t *start, int64_t *duration)
98 {
99  int len;
100  unsigned hs, ms, ss, fs; // hours, minutes, seconds, frame start
101  unsigned he, me, se, fe; // hours, minutes, seconds, frame end
102  int ts_start, ts_end;
103  int64_t ts_start64, ts_end64;
104 
105  /* timed format */
106  if (sscanf(buf, "%u:%u:%u.%u %u:%u:%u.%u %n",
107  &hs, &ms, &ss, &fs,
108  &he, &me, &se, &fe, &len) == 8) {
109  ts_start = (hs*3600 + ms*60 + ss) * jacosub->timeres + fs;
110  ts_end = (he*3600 + me*60 + se) * jacosub->timeres + fe;
111  goto shift_and_ret;
112  }
113 
114  /* timestamps format */
115  if (sscanf(buf, "@%u @%u %n", &ts_start, &ts_end, &len) == 2)
116  goto shift_and_ret;
117 
118  return NULL;
119 
120 shift_and_ret:
121  ts_start64 = (ts_start + (int64_t)jacosub->shift) * 100LL / jacosub->timeres;
122  ts_end64 = (ts_end + (int64_t)jacosub->shift) * 100LL / jacosub->timeres;
123  *start = ts_start64;
124  *duration = ts_end64 - ts_start64;
125  return buf + len;
126 }
127 
/**
 * Parse the argument of a SHIFT directive into a signed count of timeres
 * units.
 *
 * Accepted forms are "h:m:s.f", "m:s.f" and "s.f"; '.' and ':' are
 * interchangeable as separators. A lone number, unparsable input, or a
 * value that does not fit in an int all yield 0.
 *
 * @param timeres units per second (must be non-zero)
 * @param buf     NUL-terminated directive argument
 * @return the shift in timeres units, or 0
 */
static int get_shift(unsigned timeres, const char *buf)
{
    int hours = 0, minutes = 0, seconds = 0, frames = 0;
    int negative, fields;
    int64_t total, total_abs, frames_abs;

#define SSEP "%*1[.:]"
    fields = sscanf(buf, "%d"SSEP"%d"SSEP"%d"SSEP"%d",
                    &hours, &minutes, &seconds, &frames);
#undef SSEP

    /* INT_MIN cannot be negated below */
    if (hours == INT_MIN)
        return 0;

    /* the explicit '-' test catches inputs such as "-0:00:01.00", where the
     * leading field parses as zero */
    negative = *buf == '-' || hours < 0;
    if (hours < 0)
        hours = -hours;

    /* fields are parsed left to right; realign them so that the last one
     * parsed is always the sub-second part */
    switch (fields) {
    case 4:
        break;
    case 3: /* minutes, seconds, sub-seconds */
        frames  = seconds;
        seconds = minutes;
        minutes = hours;
        hours   = 0;
        break;
    case 2: /* seconds, sub-seconds */
        frames  = minutes;
        seconds = hours;
        minutes = 0;
        hours   = 0;
        break;
    default: /* a single number or nothing parsable: no shift */
        hours = minutes = seconds = frames = 0;
        break;
    }

    total = (int64_t)hours * 3600 + (int64_t)minutes * 60 + seconds;

    /* refuse anything whose scaled magnitude would overflow int64_t */
    total_abs  = total >= 0 ? total : -total;
    frames_abs = (int64_t)frames >= 0 ? (int64_t)frames : -(int64_t)frames;
    if (total_abs > (INT64_MAX - frames_abs) / timeres)
        return 0;

    total = total * timeres + frames;
    if (negative)
        total = -total;

    /* the caller stores the shift in an int */
    if ((int)total != total)
        return 0;

    return (int)total;
}
162 
/*
 * NOTE(review): the signature line and several statements of this function
 * are absent from this extract (the declaration of st and the
 * initialisation/finalisation of header, among others); the comments below
 * describe only what the visible lines do.
 *
 * Visible flow:
 *  1. read the script line by line, queueing timed lines as packets and
 *     recording SHIFT / TIMERES directives;
 *  2. once everything is read, convert each queued line's timing prefix
 *     into pts/duration with read_ts();
 *  3. finalize the queue.
 * Returns 0 on success or a negative AVERROR code.
 */
164 {
165  AVBPrint header;
166  AVIOContext *pb = s->pb;
167  char line[JSS_MAX_LINESIZE];
168  JACOsubContext *jacosub = s->priv_data;
169  int shift_set = 0; // only the first shift matters
170  int merge_line = 0;
171  int i, ret;
172 
174  if (!st)
175  return AVERROR(ENOMEM);
    /* time base of 1/100 s, matching the "* 100 / timeres" rescaling done in read_ts() */
176  avpriv_set_pts_info(st, 64, 1, 100);
179 
    /* default resolution, kept unless a valid TIMERES directive replaces it */
180  jacosub->timeres = 30;
181 
183 
184  while (!avio_feof(pb)) {
185  int cmd_len;
186  const char *p = line;
    /* offset of the line start, stored as the packet position below */
187  int64_t pos = avio_tell(pb);
188  int len = ff_get_line(pb, line, sizeof(line));
189 
190  p = jss_skip_whitespace(p);
191 
192  /* queue timed line */
    /* merge_line is non-zero when the previously queued line asked to be continued */
193  if (merge_line || timed_line(p)) {
194  AVPacket *sub;
195 
196  sub = ff_subtitles_queue_insert(&jacosub->q, line, len, merge_line);
197  if (!sub) {
199  return AVERROR(ENOMEM);
200  }
201  sub->pos = pos;
    /* a line ending in a backslash followed by a newline continues on the next line */
202  merge_line = len > 1 && !strcmp(&line[len - 2], "\\\n");
203  continue;
204  }
205 
206  /* skip all non-compiler commands and focus on the command */
207  if (*p != '#')
208  continue;
209  p++;
    /* directives are identified by their first letter only */
210  i = get_jss_cmd(p[0]);
211  if (i == -1)
212  continue;
213 
214  /* trim command + spaces */
215  cmd_len = strlen(cmds[i]);
    /* skip the whole name when it is spelled out in full, otherwise just its initial */
216  if (av_strncasecmp(p, cmds[i], cmd_len) == 0)
217  p += cmd_len;
218  else
219  p++;
220  p = jss_skip_whitespace(p);
221 
222  /* handle commands which affect the whole script */
223  switch (cmds[i][0]) {
224  case 'S': // SHIFT command affect the whole script...
    /* the shift is converted with the timeres in effect at this point */
225  if (!shift_set) {
226  jacosub->shift = get_shift(jacosub->timeres, p);
227  shift_set = 1;
228  }
    /* every SHIFT line is copied to the header text, not only the first one */
229  av_bprintf(&header, "#S %s", p);
230  break;
231  case 'T': { // ...but must be placed after TIMERES
232  int64_t timeres = strtol(p, NULL, 10);
    /* non-positive or oversized values reset the default and are not copied to the header text */
233  if (timeres <= 0 || timeres > UINT32_MAX) {
234  jacosub->timeres = 30;
235  } else {
236  jacosub->timeres = timeres;
237  av_bprintf(&header, "#T %s", p);
238  }
239  break;
240  }
241  }
242  }
243 
244  /* general/essential directives in the extradata */
246  if (ret < 0)
247  return ret;
248 
249  /* SHIFT and TIMERES affect the whole script so packet timing can only be
250  * done in a second pass */
251  for (i = 0; i < jacosub->q.nb_subs; i++) {
252  AVPacket *sub = jacosub->q.subs[i];
    /* return value ignored: when no timing prefix parses, read_ts() leaves pts and duration untouched */
253  read_ts(jacosub, sub->data, &sub->pts, &sub->duration);
254  }
255  ff_subtitles_queue_finalize(s, &jacosub->q);
256 
257  return 0;
258 }
259 
/* NOTE(review): the opening line of this initializer and several members
 * are absent from this extract; only the visible members are annotated. */
261  .p.name = "jacosub",
262  .p.long_name = NULL_IF_CONFIG_SMALL("JACOsub subtitle format"),
/* per-instance private data is a JACOsubContext */
263  .priv_data_size = sizeof(JACOsubContext),
/* presumably makes the caller invoke read_close() when read_header fails,
 * which would explain the bare error returns there -- confirm in demux.h */
264  .flags_internal = FF_INFMT_FLAG_INIT_CLEANUP,
268  .read_seek2 = ff_subtitles_read_seek,
270 };
AVMEDIA_TYPE_SUBTITLE
@ AVMEDIA_TYPE_SUBTITLE
Definition: avutil.h:204
ff_subtitles_read_close
int ff_subtitles_read_close(AVFormatContext *s)
Definition: subtitles.c:345
AVERROR
Filter design: in this document, the word “frame” indicates either a video frame or a group of audio samples, as stored in an AVFrame structure. Format negotiation: for each input and each output, the list of supported formats. For video that means pixel format. For audio that means channel layout, sample format and sample rate. The lists are not just lists, they are references to shared objects. When the negotiation mechanism computes the intersection of the formats supported at each end of a link, all references to both lists are replaced with a reference to the intersection. And when a single format is eventually chosen for a link amongst the remaining list, all references to the list are updated. That means that if a filter requires that its input and output have the same format amongst a supported list, all it has to do is use a reference to the same list of formats. query_formats can leave some formats unset and return AVERROR(EAGAIN) to cause the negotiation mechanism to try again later. That can be used by filters with complex requirements to use the format negotiated on one link to set the formats supported on another. Frame references ownership and permissions
AVCodecParameters::codec_type
enum AVMediaType codec_type
General type of the encoded data.
Definition: codec_par.h:51
av_bprint_init
void av_bprint_init(AVBPrint *buf, unsigned size_init, unsigned size_max)
Definition: bprint.c:69
get_jss_cmd
static int get_jss_cmd(char k)
Definition: jacosubdec.c:85
avformat_new_stream
AVStream * avformat_new_stream(AVFormatContext *s, const struct AVCodec *c)
Add a new stream to a media file.
FFDemuxSubtitlesQueue::nb_subs
int nb_subs
number of subtitles packets
Definition: subtitles.h:105
int64_t
long long int64_t
Definition: coverity.c:34
se
#define se(name, range_min, range_max)
Definition: cbs_h2645.c:260
AVPacket::data
uint8_t * data
Definition: packet.h:539
AVPacket::duration
int64_t duration
Duration of this packet in AVStream->time_base units, 0 if unknown.
Definition: packet.h:557
AVProbeData::buf_size
int buf_size
Size of buf except extra allocated bytes.
Definition: avformat.h:454
ff_bprint_to_codecpar_extradata
int ff_bprint_to_codecpar_extradata(AVCodecParameters *par, struct AVBPrint *buf)
Finalize buf into extradata and set its size appropriately.
Definition: utils.c:577
get_shift
static int get_shift(unsigned timeres, const char *buf)
Definition: jacosubdec.c:128
avpriv_set_pts_info
void avpriv_set_pts_info(AVStream *st, int pts_wrap_bits, unsigned int pts_num, unsigned int pts_den)
Set the time base and wrapping info for a given stream.
Definition: avformat.c:867
read_close
static av_cold int read_close(AVFormatContext *ctx)
Definition: libcdio.c:143
avio_tell
static av_always_inline int64_t avio_tell(AVIOContext *s)
ftell() equivalent for AVIOContext.
Definition: avio.h:494
JSS_MAX_LINESIZE
#define JSS_MAX_LINESIZE
Definition: jacosub.h:31
AV_CODEC_ID_JACOSUB
@ AV_CODEC_ID_JACOSUB
Definition: codec_id.h:569
ss
#define ss(width, name, subs,...)
Definition: cbs_vp9.c:202
FF_ARRAY_ELEMS
#define FF_ARRAY_ELEMS(a)
Definition: sinewin_tablegen.c:29
jacosub_read_header
static int jacosub_read_header(AVFormatContext *s)
Definition: jacosubdec.c:163
ff_subtitles_read_packet
int ff_subtitles_read_packet(AVFormatContext *s, AVPacket *pkt)
Definition: subtitles.c:331
duration
int64_t duration
Definition: movenc.c:65
read_packet
static int read_packet(void *opaque, uint8_t *buf, int buf_size)
Definition: avio_read_callback.c:42
intreadwrite.h
s
#define s(width, name)
Definition: cbs_vp9.c:198
AVInputFormat::name
const char * name
A comma separated list of short names for the format.
Definition: avformat.h:553
AVProbeData::buf
unsigned char * buf
Buffer must have AVPROBE_PADDING_SIZE of extra allocated bytes filled with zero.
Definition: avformat.h:453
FFABS
#define FFABS(a)
Absolute value, Note, INT_MIN / INT64_MIN result in undefined behavior as they are not representable ...
Definition: common.h:74
FF_INFMT_FLAG_INIT_CLEANUP
#define FF_INFMT_FLAG_INIT_CLEANUP
For an FFInputFormat with this flag set read_close() needs to be called by the caller upon read_heade...
Definition: demux.h:35
JACOsubContext
Definition: jacosubdec.c:37
AVFormatContext
Format I/O context.
Definition: avformat.h:1300
internal.h
AVStream::codecpar
AVCodecParameters * codecpar
Codec parameters associated with this stream.
Definition: avformat.h:771
read_header
static int read_header(FFV1Context *f)
Definition: ffv1dec.c:540
NULL
#define NULL
Definition: coverity.c:32
fs
#define fs(width, name, subs,...)
Definition: cbs_vp9.c:200
cmds
static const char *const cmds[]
Definition: jacosubdec.c:72
me
#define me
Definition: vf_colormatrix.c:102
AVProbeData
This structure contains the data a format has to probe a file.
Definition: avformat.h:451
ff_subtitles_queue_insert
AVPacket * ff_subtitles_queue_insert(FFDemuxSubtitlesQueue *q, const uint8_t *event, size_t len, int merge)
Insert a new subtitle event.
Definition: subtitles.c:111
c
Undefined Behavior: in the C language, some operations are undefined, like signed integer overflow, dereferencing freed pointers, accessing outside allocated space. Undefined Behavior must not occur in a C program; it is not safe even if the output of undefined operations is unused. The unsafety may seem nit picking, but optimizing compilers have in fact optimized code on the assumption that no undefined Behavior occurs. Optimizing code based on wrong assumptions can and has in some cases lead to effects beyond the output of computations. The signed integer overflow problem in speed critical code: code which is highly optimized and works with signed integers sometimes has the problem that often the output of the computation does not c
Definition: undefined.txt:32
AVPROBE_SCORE_EXTENSION
#define AVPROBE_SCORE_EXTENSION
score for file extension
Definition: avformat.h:461
jacosub_probe
static int jacosub_probe(const AVProbeData *p)
Definition: jacosubdec.c:51
jacosub.h
av_strncasecmp
int av_strncasecmp(const char *a, const char *b, size_t n)
Locale-independent case-insensitive compare.
Definition: avstring.c:217
AVIOContext
Bytestream IO Context.
Definition: avio.h:160
NULL_IF_CONFIG_SMALL
#define NULL_IF_CONFIG_SMALL(x)
Return NULL if CONFIG_SMALL is true, otherwise the argument without modification.
Definition: internal.h:94
av_bprint_finalize
int av_bprint_finalize(AVBPrint *buf, char **ret_str)
Finalize a print buffer.
Definition: bprint.c:240
jss_whitespace
static av_always_inline int jss_whitespace(char c)
Definition: jacosub.h:33
ff_subtitles_queue_finalize
void ff_subtitles_queue_finalize(void *log_ctx, FFDemuxSubtitlesQueue *q)
Set missing durations, sort subtitles by PTS (and then byte position), and drop duplicated events.
Definition: subtitles.c:212
FFDemuxSubtitlesQueue
Definition: subtitles.h:103
FFInputFormat::p
AVInputFormat p
The public AVInputFormat.
Definition: demux.h:46
header
static const uint8_t header[24]
Definition: sdr2.c:68
JACOsubContext::shift
int shift
Definition: jacosubdec.c:39
line
Definition: graph2dot.c:48
jss_skip_whitespace
static const av_always_inline char * jss_skip_whitespace(const char *p)
Definition: jacosub.h:38
SSEP
#define SSEP
bprint.h
i
#define i(width, name, range_min, range_max)
Definition: cbs_h2645.c:256
AVPacket::pts
int64_t pts
Presentation timestamp in AVStream->time_base units; the time at which the decompressed packet will b...
Definition: packet.h:532
FFDemuxSubtitlesQueue::subs
AVPacket ** subs
array of subtitles packets
Definition: subtitles.h:104
JACOsubContext::q
FFDemuxSubtitlesQueue q
Definition: jacosubdec.c:38
av_toupper
static av_const int av_toupper(int c)
Locale-independent conversion of ASCII characters to uppercase.
Definition: avstring.h:227
ff_subtitles_read_seek
int ff_subtitles_read_seek(AVFormatContext *s, int stream_index, int64_t min_ts, int64_t ts, int64_t max_ts, int flags)
Definition: subtitles.c:337
ff_get_line
int ff_get_line(AVIOContext *s, char *buf, int maxlen)
Read a whole line of text from AVIOContext.
Definition: aviobuf.c:769
demux.h
len
int len
Definition: vorbis_enc_data.h:426
ret
ret
Definition: filter_design.txt:187
AVStream
Stream structure.
Definition: avformat.h:748
pos
unsigned int pos
Definition: spdifenc.c:414
avformat.h
av_bprintf
void av_bprintf(AVBPrint *buf, const char *fmt,...)
Definition: bprint.c:99
AV_INPUT_BUFFER_PADDING_SIZE
#define AV_INPUT_BUFFER_PADDING_SIZE
Definition: defs.h:40
subtitles.h
read_ts
static const char * read_ts(JACOsubContext *jacosub, const char *buf, int64_t *start, int64_t *duration)
Definition: jacosubdec.c:96
read_probe
static int read_probe(const AVProbeData *p)
Definition: cdg.c:30
AVCodecParameters::codec_id
enum AVCodecID codec_id
Specific type of the encoded data (the codec used).
Definition: codec_par.h:55
AVPacket
This structure stores compressed data.
Definition: packet.h:516
JACOsubContext::timeres
unsigned timeres
Definition: jacosubdec.c:40
AVPacket::pos
int64_t pos
byte position in stream, -1 if unknown
Definition: packet.h:559
FFInputFormat
Definition: demux.h:42
h
h
Definition: vp9dsp_template.c:2070
ff_subtitles_next_line
static av_always_inline int ff_subtitles_next_line(const char *ptr)
Get the number of characters to increment to jump to the next line, or to the end of the string.
Definition: subtitles.h:205
avstring.h
ff_jacosub_demuxer
const FFInputFormat ff_jacosub_demuxer
Definition: jacosubdec.c:260
AV_RB24
uint64_t_TMPL AV_WL64 unsigned int_TMPL AV_WL32 unsigned int_TMPL AV_WL24 unsigned int_TMPL AV_WL16 uint64_t_TMPL AV_WB64 unsigned int_TMPL AV_WB32 unsigned int_TMPL AV_RB24
Definition: bytestream.h:97
line
The official guide to swscale for confused that consecutive non overlapping rectangles of slice_bottom special converter These generally are unscaled converters of common like for each output line the vertical scaler pulls lines from a ring buffer When the ring buffer does not contain the wanted line
Definition: swscale.txt:40
timed_line
static int timed_line(const char *ptr)
Definition: jacosubdec.c:43
avio_feof
int avio_feof(AVIOContext *s)
Similar to feof() but also returns nonzero on read errors.
Definition: aviobuf.c:346