You can not select more than 25 topics Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.

211 lines
6.7KB

  1. /*
  2. * Copyright (c) 2012 Clément Bœsch
  3. *
  4. * This file is part of FFmpeg.
  5. *
  6. * FFmpeg is free software; you can redistribute it and/or
  7. * modify it under the terms of the GNU Lesser General Public
  8. * License as published by the Free Software Foundation; either
  9. * version 2.1 of the License, or (at your option) any later version.
  10. *
  11. * FFmpeg is distributed in the hope that it will be useful,
  12. * but WITHOUT ANY WARRANTY; without even the implied warranty of
  13. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
  14. * Lesser General Public License for more details.
  15. *
  16. * You should have received a copy of the GNU Lesser General Public
  17. * License along with FFmpeg; if not, write to the Free Software
  18. * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
  19. */
  20. #ifndef AVFORMAT_SUBTITLES_H
  21. #define AVFORMAT_SUBTITLES_H
  22. #include <stdint.h>
  23. #include <stddef.h>
  24. #include "avformat.h"
  25. #include "libavutil/bprint.h"
/**
 * Ordering criteria selectable for a subtitles queue
 * (see FFDemuxSubtitlesQueue.sort).
 */
enum sub_sort {
    SUB_SORT_TS_POS = 0,    ///< sort by timestamps, then position
    SUB_SORT_POS_TS,        ///< sort by position, then timestamps
};
/**
 * Character encoding of a text source.
 *
 * NOTE(review): presumably the value stored in FFTextReader.type; this header
 * does not say so explicitly -- confirm against the implementation.
 */
enum ff_utf_type {
    FF_UTF_8,       // or other 8 bit encodings
    FF_UTF16LE,
    FF_UTF16BE,
};
/**
 * State of a text reader, set up with ff_text_init_avio() or
 * ff_text_init_buf() and consumed with the ff_text_*() accessors.
 *
 * NOTE(review): the field descriptions below are inferred from the field
 * names and from the documentation of the ff_text_*() functions; this header
 * does not define them -- confirm against the implementation.
 */
typedef struct {
    int type;               ///< presumably one of enum ff_utf_type
    AVIOContext *pb;        ///< presumably the stream the reader pulls data from
    unsigned char buf[8];   ///< presumably converted bytes not yet handed out
    int buf_pos, buf_len;   ///< presumably read offset into buf / number of valid bytes in buf
    AVIOContext buf_pb;     ///< presumably backs readers created with ff_text_init_buf()
} FFTextReader;
/**
 * Initialize the FFTextReader from the given AVIOContext. This function will
 * read some bytes from pb, and test for UTF-8 or UTF-16 BOMs. Further accesses
 * to FFTextReader will read more data from pb.
 * If s is not NULL, the user will be warned if a UTF-16 conversion takes place.
 *
 * The purpose of FFTextReader is to transparently convert read data to UTF-8
 * if the stream had a UTF-16 BOM.
 *
 * @param s  Pointer to provide av_log context (may be NULL, in which case no
 *           UTF-16 conversion warning is emitted)
 * @param r  object which will be initialized
 * @param pb stream to read from (referenced as long as FFTextReader is in use)
 */
void ff_text_init_avio(void *s, FFTextReader *r, AVIOContext *pb);
/**
 * Similar to ff_text_init_avio(), but sets it up to read from a bounded buffer.
 *
 * @param r    object which will be initialized
 * @param buf  buffer to read from (referenced as long as FFTextReader is in use)
 * @param size size of buf
 */
void ff_text_init_buf(FFTextReader *r, void *buf, size_t size);
/**
 * Return the byte position of the next byte returned by ff_text_r8(). For
 * UTF-16 source streams, this will return the original position, but it will
 * be incorrect if a codepoint was only partially read with ff_text_r8().
 *
 * @param r reader to query
 */
int64_t ff_text_pos(FFTextReader *r);
/**
 * Return the next byte. The return value is always 0 - 255. Returns 0 on EOF.
 * If the source stream is UTF-16, this reads from the stream converted to
 * UTF-8. On invalid UTF-16, 0 is returned.
 *
 * Since 0 is returned both on EOF and on invalid UTF-16, use ff_text_eof()
 * to find out whether the end of the input was reached.
 *
 * @param r reader to read from
 */
int ff_text_r8(FFTextReader *r);
/**
 * Return non-zero if EOF was reached.
 *
 * @param r reader to query
 */
int ff_text_eof(FFTextReader *r);
/**
 * Like ff_text_r8(), but don't remove the byte from the buffer.
 *
 * @param r reader to peek into
 */
int ff_text_peek_r8(FFTextReader *r);
/**
 * Read the given number of bytes (in UTF-8). On error or EOF, \0 bytes are
 * written.
 *
 * @param r    reader to read from
 * @param buf  destination for the bytes read
 * @param size number of bytes to read into buf
 */
void ff_text_read(FFTextReader *r, char *buf, size_t size);
/**
 * Queue of subtitles packets shared by the ff_subtitles_queue_*() helpers.
 */
typedef struct {
    AVPacket *subs;         ///< array of subtitles packets
    int nb_subs;            ///< number of subtitles packets
    int allocated_size;     ///< allocated size for subs
    int current_sub_idx;    ///< current position for the read packet callback
    enum sub_sort sort;     ///< sort method to use when finalizing subtitles
} FFDemuxSubtitlesQueue;
/**
 * Insert a new subtitle event.
 *
 * @param q     queue receiving the event
 * @param event the subtitle line; it is not required to be zero terminated,
 *              its extent is given by len
 * @param len   the length of the event (in strlen() sense, so without '\0')
 * @param merge set to 1 if the current event should be concatenated with the
 *              previous one instead of adding a new entry, 0 otherwise
 * @return NOTE(review): presumably the packet holding the event, or NULL on
 *         failure -- not stated in this header, confirm against the
 *         implementation
 */
AVPacket *ff_subtitles_queue_insert(FFDemuxSubtitlesQueue *q,
                                    const uint8_t *event, int len, int merge);
/**
 * Set missing durations and sort subtitles using the method selected in
 * q->sort: by timestamps then position (SUB_SORT_TS_POS), or by position
 * then timestamps (SUB_SORT_POS_TS).
 *
 * @param q queue to finalize
 */
void ff_subtitles_queue_finalize(FFDemuxSubtitlesQueue *q);
/**
 * Generic read_packet() callback for subtitles demuxers using this queue
 * system.
 *
 * @param q   queue to read from; FFDemuxSubtitlesQueue.current_sub_idx is the
 *            position used by this callback
 * @param pkt packet to fill
 */
int ff_subtitles_queue_read_packet(FFDemuxSubtitlesQueue *q, AVPacket *pkt);
/**
 * Update current_sub_idx to emulate a seek. Except for the first parameter,
 * the prototype matches that of AVInputFormat->read_seek2.
 *
 * @param q queue whose current_sub_idx is updated
 */
int ff_subtitles_queue_seek(FFDemuxSubtitlesQueue *q, AVFormatContext *s, int stream_index,
                            int64_t min_ts, int64_t ts, int64_t max_ts, int flags);
/**
 * Remove and destroy all the subtitles packets.
 *
 * @param q queue to empty
 */
void ff_subtitles_queue_clean(FFDemuxSubtitlesQueue *q);
/**
 * SMIL helper to load next chunk ("<...>" or untagged content) in buf.
 *
 * @param tr  reader to load the chunk from
 * @param buf buffer receiving the chunk
 * @param c   cached character, to avoid a backward seek
 */
int ff_smil_extract_next_text_chunk(FFTextReader *tr, AVBPrint *buf, char *c);
/**
 * SMIL helper to point to the value of an attribute in the given tag.
 *
 * @param s    SMIL tag ("<...>")
 * @param attr the attribute to look for
 */
const char *ff_smil_get_attr_ptr(const char *s, const char *attr);
/**
 * @brief Same as ff_subtitles_read_text_chunk(), but read from an AVIOContext.
 *
 * @param pb  I/O context to read from
 * @param buf an initialized buf where the chunk is written
 */
void ff_subtitles_read_chunk(AVIOContext *pb, AVBPrint *buf);
/**
 * @brief Read a subtitles chunk from FFTextReader.
 *
 * A chunk is defined by a multiline "event", ending with a second line break.
 * The trailing line breaks are trimmed. CRLF are supported.
 * Example: "foo\r\nbar\r\n\r\nnext" will print "foo\r\nbar" into buf, and tr
 * will be positioned on the 'n' of the "next" string.
 *
 * @param tr  I/O context
 * @param buf an initialized buf where the chunk is written
 *
 * @note buf is cleared before writing into it.
 */
void ff_subtitles_read_text_chunk(FFTextReader *tr, AVBPrint *buf);
  156. /**
  157. * Get the number of characters to increment to jump to the next line, or to
  158. * the end of the string.
  159. * The function handles the following line breaks schemes:
  160. * LF, CRLF (MS), or standalone CR (old MacOS).
  161. */
  162. static av_always_inline int ff_subtitles_next_line(const char *ptr)
  163. {
  164. int n = strcspn(ptr, "\r\n");
  165. ptr += n;
  166. if (*ptr == '\r') {
  167. ptr++;
  168. n++;
  169. }
  170. if (*ptr == '\n')
  171. n++;
  172. return n;
  173. }
/**
 * Read a line of text. Discards line ending characters.
 * The function handles the following line breaks schemes:
 * LF, CRLF (MS), or standalone CR (old MacOS).
 *
 * Returns the number of bytes written to buf. Always writes a terminating 0,
 * as snprintf does.
 *
 * @param tr   reader to read the line from
 * @param buf  destination for the line
 * @param size size of buf (NOTE(review): presumably including room for the
 *             terminating 0, as with snprintf -- confirm)
 *
 * @note returns a negative error code if a \0 byte is found
 */
ptrdiff_t ff_subtitles_read_line(FFTextReader *tr, char *buf, size_t size);
  185. #endif /* AVFORMAT_SUBTITLES_H */