You can not select more than 25 topics Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.

209 lines
6.5KB

  1. /*
  2. * Copyright (c) 2012 Clément Bœsch
  3. *
  4. * This file is part of FFmpeg.
  5. *
  6. * FFmpeg is free software; you can redistribute it and/or
  7. * modify it under the terms of the GNU Lesser General Public
  8. * License as published by the Free Software Foundation; either
  9. * version 2.1 of the License, or (at your option) any later version.
  10. *
  11. * FFmpeg is distributed in the hope that it will be useful,
  12. * but WITHOUT ANY WARRANTY; without even the implied warranty of
  13. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
  14. * Lesser General Public License for more details.
  15. *
  16. * You should have received a copy of the GNU Lesser General Public
  17. * License along with FFmpeg; if not, write to the Free Software
  18. * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
  19. */
  20. #ifndef AVFORMAT_SUBTITLES_H
  21. #define AVFORMAT_SUBTITLES_H
#include <stdint.h>
#include <stddef.h>
#include <string.h>

#include "avformat.h"
#include "libavutil/bprint.h"
  26. enum sub_sort {
  27. SUB_SORT_TS_POS = 0, ///< sort by timestamps, then position
  28. SUB_SORT_POS_TS, ///< sort by position, then timestamps
  29. };
  30. enum ff_utf_type {
  31. FF_UTF_8, // or other 8 bit encodings
  32. FF_UTF16LE,
  33. FF_UTF16BE,
  34. };
  35. typedef struct {
  36. int type;
  37. AVIOContext *pb;
  38. unsigned char buf[8];
  39. int buf_pos, buf_len;
  40. AVIOContext buf_pb;
  41. } FFTextReader;
  42. /**
  43. * Initialize the FFTextReader from the given AVIOContext. This function will
  44. * read some bytes from pb, and test for UTF-8 or UTF-16 BOMs. Further accesses
  45. * to FFTextReader will read more data from pb.
  46. *
  47. * The purpose of FFTextReader is to transparently convert read data to UTF-8
  48. * if the stream had a UTF-16 BOM.
  49. *
  50. * @param r object which will be initialized
  51. * @param pb stream to read from (referenced as long as FFTextReader is in use)
  52. */
  53. void ff_text_init_avio(FFTextReader *r, AVIOContext *pb);
  54. /**
  55. * Similar to ff_text_init_avio(), but sets it up to read from a bounded buffer.
  56. *
  57. * @param r object which will be initialized
  58. * @param buf buffer to read from (referenced as long as FFTextReader is in use)
  59. * @param size size of buf
  60. */
  61. void ff_text_init_buf(FFTextReader *r, void *buf, size_t size);
  62. /**
  63. * Return the byte position of the next byte returned by ff_text_r8(). For
  64. * UTF-16 source streams, this will return the original position, but it will
  65. * be incorrect if a codepoint was only partially read with ff_text_r8().
  66. */
  67. int64_t ff_text_pos(FFTextReader *r);
  68. /**
  69. * Return the next byte. The return value is always 0 - 255. Returns 0 on EOF.
  70. * If the source stream is UTF-16, this reads from the stream converted to
  71. * UTF-8. On invalid UTF-16, 0 is returned.
  72. */
  73. int ff_text_r8(FFTextReader *r);
  74. /**
  75. * Return non-zero if EOF was reached.
  76. */
  77. int ff_text_eof(FFTextReader *r);
  78. /**
  79. * Like ff_text_r8(), but don't remove the byte from the buffer.
  80. */
  81. int ff_text_peek_r8(FFTextReader *r);
  82. /**
  83. * Read the given number of bytes (in UTF-8). On error or EOF, \0 bytes are
  84. * written.
  85. */
  86. void ff_text_read(FFTextReader *r, char *buf, size_t size);
  87. typedef struct {
  88. AVPacket *subs; ///< array of subtitles packets
  89. int nb_subs; ///< number of subtitles packets
  90. int allocated_size; ///< allocated size for subs
  91. int current_sub_idx; ///< current position for the read packet callback
  92. enum sub_sort sort; ///< sort method to use when finalizing subtitles
  93. } FFDemuxSubtitlesQueue;
  94. /**
  95. * Insert a new subtitle event.
  96. *
  97. * @param event the subtitle line, may not be zero terminated
  98. * @param len the length of the event (in strlen() sense, so without '\0')
  99. * @param merge set to 1 if the current event should be concatenated with the
  100. * previous one instead of adding a new entry, 0 otherwise
  101. */
  102. AVPacket *ff_subtitles_queue_insert(FFDemuxSubtitlesQueue *q,
  103. const uint8_t *event, int len, int merge);
  104. /**
  105. * Set missing durations and sort subtitles by PTS, and then byte position.
  106. */
  107. void ff_subtitles_queue_finalize(FFDemuxSubtitlesQueue *q);
  108. /**
  109. * Generic read_packet() callback for subtitles demuxers using this queue
  110. * system.
  111. */
  112. int ff_subtitles_queue_read_packet(FFDemuxSubtitlesQueue *q, AVPacket *pkt);
  113. /**
  114. * Update current_sub_idx to emulate a seek. Except the first parameter, it
  115. * matches AVInputFormat->read_seek2 prototypes.
  116. */
  117. int ff_subtitles_queue_seek(FFDemuxSubtitlesQueue *q, AVFormatContext *s, int stream_index,
  118. int64_t min_ts, int64_t ts, int64_t max_ts, int flags);
  119. /**
  120. * Remove and destroy all the subtitles packets.
  121. */
  122. void ff_subtitles_queue_clean(FFDemuxSubtitlesQueue *q);
  123. /**
  124. * SMIL helper to load next chunk ("<...>" or untagged content) in buf.
  125. *
  126. * @param c cached character, to avoid a backward seek
  127. */
  128. int ff_smil_extract_next_text_chunk(FFTextReader *tr, AVBPrint *buf, char *c);
  129. /**
  130. * SMIL helper to point on the value of an attribute in the given tag.
  131. *
  132. * @param s SMIL tag ("<...>")
  133. * @param attr the attribute to look for
  134. */
  135. const char *ff_smil_get_attr_ptr(const char *s, const char *attr);
  136. /**
  137. * @brief Same as ff_subtitles_read_text_chunk(), but read from an AVIOContext.
  138. */
  139. void ff_subtitles_read_chunk(AVIOContext *pb, AVBPrint *buf);
  140. /**
  141. * @brief Read a subtitles chunk from FFTextReader.
  142. *
  143. * A chunk is defined by a multiline "event", ending with a second line break.
  144. * The trailing line breaks are trimmed. CRLF are supported.
  145. * Example: "foo\r\nbar\r\n\r\nnext" will print "foo\r\nbar" into buf, and pb
  146. * will focus on the 'n' of the "next" string.
  147. *
  148. * @param tr I/O context
  149. * @param buf an initialized buf where the chunk is written
  150. *
  151. * @note buf is cleared before writing into it.
  152. */
  153. void ff_subtitles_read_text_chunk(FFTextReader *tr, AVBPrint *buf);
  154. /**
  155. * Get the number of characters to increment to jump to the next line, or to
  156. * the end of the string.
  157. * The function handles the following line breaks schemes:
  158. * LF, CRLF (MS), or standalone CR (old MacOS).
  159. */
  160. static av_always_inline int ff_subtitles_next_line(const char *ptr)
  161. {
  162. int n = strcspn(ptr, "\r\n");
  163. ptr += n;
  164. if (*ptr == '\r') {
  165. ptr++;
  166. n++;
  167. }
  168. if (*ptr == '\n')
  169. n++;
  170. return n;
  171. }
  172. /**
  173. * Read a line of text. Discards line ending characters.
  174. * The function handles the following line breaks schemes:
  175. * LF, CRLF (MS), or standalone CR (old MacOS).
  176. *
  177. * Returns the number of bytes written to buf. Always writes a terminating 0,
  178. * similar as with snprintf.
  179. *
  180. * @note returns a negative error code if a \0 byte is found
  181. */
  182. ptrdiff_t ff_subtitles_read_line(FFTextReader *tr, char *buf, size_t size);
  183. #endif /* AVFORMAT_SUBTITLES_H */