You cannot select more than 25 topics. Topics must start with a letter or number, can include dashes ('-'), and can be up to 35 characters long.

451 lines
13KB

  1. /*
  2. * Sony OpenMG (OMA) demuxer
  3. *
  4. * Copyright (c) 2008 Maxim Poliakovski
  5. * 2008 Benjamin Larsson
  6. * 2011 David Goldwich
  7. *
  8. * This file is part of FFmpeg.
  9. *
  10. * FFmpeg is free software; you can redistribute it and/or
  11. * modify it under the terms of the GNU Lesser General Public
  12. * License as published by the Free Software Foundation; either
  13. * version 2.1 of the License, or (at your option) any later version.
  14. *
  15. * FFmpeg is distributed in the hope that it will be useful,
  16. * but WITHOUT ANY WARRANTY; without even the implied warranty of
  17. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
  18. * Lesser General Public License for more details.
  19. *
  20. * You should have received a copy of the GNU Lesser General Public
  21. * License along with FFmpeg; if not, write to the Free Software
  22. * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
  23. */
  24. /**
  25. * @file
  26. * This is a demuxer for Sony OpenMG Music files
  27. *
  28. * Known file extensions: ".oma", ".omg", ".aa3"
  29. * The format of such files consists of three parts:
  30. * - "ea3" header carrying overall info and metadata. Except for starting with
  31. * "ea" instead of "ID", it's an ID3v2 header.
  32. * - "EA3" header is a Sony-specific header containing information about
  33. * the OpenMG file: codec type (usually ATRAC, can also be MP3 or WMA),
  34. * codec specific info (packet size, sample rate, channels and so on)
  35. * and DRM related info (file encryption, content id).
  36. * - Sound data organized in packets follows the EA3 header
  37. * (can be encrypted using the Sony DRM!).
  38. *
  39. * CODEC SUPPORT: Only ATRAC3 codec is currently supported!
  40. */
  41. #include "avformat.h"
  42. #include "internal.h"
  43. #include "libavutil/intreadwrite.h"
  44. #include "libavutil/des.h"
  45. #include "pcm.h"
  46. #include "riff.h"
  47. #include "id3v2.h"
  /* Number of bytes read as the "EA3" header; also the value expected in its byte 5. */
  #define EA3_HEADER_SIZE     96
  /* Magic handed to the ID3v2 helpers in place of the usual "ID3". */
  #define ID3v2_EA3_MAGIC     "ea3"
  /* Offset of the key ring section inside the GEOB encryption data. */
  #define OMA_ENC_HEADER_SIZE 16
  /* Codec identifiers as found in byte 32 of the EA3 header. */
  enum {
      OMA_CODECID_ATRAC3  = 0,
      OMA_CODECID_ATRAC3P = 1,
      /* value 2 is not assigned here */
      OMA_CODECID_MP3     = 3,
      OMA_CODECID_LPCM    = 4,
      OMA_CODECID_WMA     = 5,
  };
  58. static const AVCodecTag codec_oma_tags[] = {
  59. { CODEC_ID_ATRAC3, OMA_CODECID_ATRAC3 },
  60. { CODEC_ID_ATRAC3P, OMA_CODECID_ATRAC3P },
  61. { CODEC_ID_MP3, OMA_CODECID_MP3 },
  62. };
  /*
   * Built-in fallback keys.  decrypt_init() consumes the entries two at a
   * time, turning each pair into one 16-byte candidate key.
   */
  static const uint64_t leaf_table[] = {
      0xd79e8283acea4620ULL, 0x7a9762f445afd0d8ULL,
      0x354d60a60b8c79f1ULL, 0x584e1cde00b07aeeULL,
      0x1573cd93da7df623ULL, 0x47f98d79620dd535ULL,
  };
  68. typedef struct OMAContext {
  69. uint64_t content_start;
  70. int encrypted;
  71. uint16_t k_size;
  72. uint16_t e_size;
  73. uint16_t i_size;
  74. uint16_t s_size;
  75. uint32_t rid;
  76. uint8_t r_val[24];
  77. uint8_t n_val[24];
  78. uint8_t m_val[8];
  79. uint8_t s_val[8];
  80. uint8_t sm_val[8];
  81. uint8_t e_val[8];
  82. uint8_t iv[8];
  83. struct AVDES av_des;
  84. } OMAContext;
  85. static void hex_log(AVFormatContext *s, int level, const char *name, const uint8_t *value, int len)
  86. {
  87. char buf[33];
  88. len = FFMIN(len, 16);
  89. if (av_log_get_level() < level)
  90. return;
  91. ff_data_to_hex(buf, value, len, 1);
  92. buf[len<<1] = '\0';
  93. av_log(s, level, "%s: %s\n", name, buf);
  94. }
  95. static int kset(AVFormatContext *s, const uint8_t *r_val, const uint8_t *n_val, int len)
  96. {
  97. OMAContext *oc = s->priv_data;
  98. if (!r_val && !n_val)
  99. return -1;
  100. len = FFMIN(len, 16);
  101. /* use first 64 bits in the third round again */
  102. if (r_val) {
  103. if (r_val != oc->r_val) {
  104. memset(oc->r_val, 0, 24);
  105. memcpy(oc->r_val, r_val, len);
  106. }
  107. memcpy(&oc->r_val[16], r_val, 8);
  108. }
  109. if (n_val) {
  110. if (n_val != oc->n_val) {
  111. memset(oc->n_val, 0, 24);
  112. memcpy(oc->n_val, n_val, len);
  113. }
  114. memcpy(&oc->n_val[16], n_val, 8);
  115. }
  116. return 0;
  117. }
  118. static int rprobe(AVFormatContext *s, uint8_t *enc_header, const uint8_t *r_val)
  119. {
  120. OMAContext *oc = s->priv_data;
  121. unsigned int pos;
  122. struct AVDES av_des;
  123. if (!enc_header || !r_val)
  124. return -1;
  125. /* m_val */
  126. av_des_init(&av_des, r_val, 192, 1);
  127. av_des_crypt(&av_des, oc->m_val, &enc_header[48], 1, NULL, 1);
  128. /* s_val */
  129. av_des_init(&av_des, oc->m_val, 64, 0);
  130. av_des_crypt(&av_des, oc->s_val, NULL, 1, NULL, 0);
  131. /* sm_val */
  132. pos = OMA_ENC_HEADER_SIZE + oc->k_size + oc->e_size;
  133. av_des_init(&av_des, oc->s_val, 64, 0);
  134. av_des_mac(&av_des, oc->sm_val, &enc_header[pos], (oc->i_size >> 3));
  135. pos += oc->i_size;
  136. return memcmp(&enc_header[pos], oc->sm_val, 8) ? -1 : 0;
  137. }
  138. static int nprobe(AVFormatContext *s, uint8_t *enc_header, int size, const uint8_t *n_val)
  139. {
  140. OMAContext *oc = s->priv_data;
  141. uint32_t pos, taglen, datalen;
  142. struct AVDES av_des;
  143. if (!enc_header || !n_val)
  144. return -1;
  145. pos = OMA_ENC_HEADER_SIZE + oc->k_size;
  146. if (!memcmp(&enc_header[pos], "EKB ", 4))
  147. pos += 32;
  148. if (AV_RB32(&enc_header[pos]) != oc->rid)
  149. av_log(s, AV_LOG_DEBUG, "Mismatching RID\n");
  150. taglen = AV_RB32(&enc_header[pos+32]);
  151. datalen = AV_RB32(&enc_header[pos+36]) >> 4;
  152. if(taglen + (((uint64_t)datalen)<<4) + 44 > size)
  153. return -1;
  154. pos += 44 + taglen;
  155. av_des_init(&av_des, n_val, 192, 1);
  156. while (datalen-- > 0) {
  157. av_des_crypt(&av_des, oc->r_val, &enc_header[pos], 2, NULL, 1);
  158. kset(s, oc->r_val, NULL, 16);
  159. if (!rprobe(s, enc_header, oc->r_val))
  160. return 0;
  161. pos += 16;
  162. }
  163. return -1;
  164. }
  165. static int decrypt_init(AVFormatContext *s, ID3v2ExtraMeta *em, uint8_t *header)
  166. {
  167. OMAContext *oc = s->priv_data;
  168. ID3v2ExtraMetaGEOB *geob = NULL;
  169. uint8_t *gdata;
  170. oc->encrypted = 1;
  171. av_log(s, AV_LOG_INFO, "File is encrypted\n");
  172. /* find GEOB metadata */
  173. while (em) {
  174. if (!strcmp(em->tag, "GEOB") &&
  175. (geob = em->data) &&
  176. !strcmp(geob->description, "OMG_LSI") ||
  177. !strcmp(geob->description, "OMG_BKLSI")) {
  178. break;
  179. }
  180. em = em->next;
  181. }
  182. if (!em) {
  183. av_log(s, AV_LOG_ERROR, "No encryption header found\n");
  184. return -1;
  185. }
  186. if (geob->datasize < 64) {
  187. av_log(s, AV_LOG_ERROR, "Invalid GEOB data size: %u\n", geob->datasize);
  188. return -1;
  189. }
  190. gdata = geob->data;
  191. if (AV_RB16(gdata) != 1)
  192. av_log(s, AV_LOG_WARNING, "Unknown version in encryption header\n");
  193. oc->k_size = AV_RB16(&gdata[2]);
  194. oc->e_size = AV_RB16(&gdata[4]);
  195. oc->i_size = AV_RB16(&gdata[6]);
  196. oc->s_size = AV_RB16(&gdata[8]);
  197. if (memcmp(&gdata[OMA_ENC_HEADER_SIZE], "KEYRING ", 12)) {
  198. av_log(s, AV_LOG_ERROR, "Invalid encryption header\n");
  199. return -1;
  200. }
  201. oc->rid = AV_RB32(&gdata[OMA_ENC_HEADER_SIZE + 28]);
  202. av_log(s, AV_LOG_DEBUG, "RID: %.8x\n", oc->rid);
  203. memcpy(oc->iv, &header[0x58], 8);
  204. hex_log(s, AV_LOG_DEBUG, "IV", oc->iv, 8);
  205. hex_log(s, AV_LOG_DEBUG, "CBC-MAC", &gdata[OMA_ENC_HEADER_SIZE+oc->k_size+oc->e_size+oc->i_size], 8);
  206. if (s->keylen > 0) {
  207. kset(s, s->key, s->key, s->keylen);
  208. }
  209. if (!memcmp(oc->r_val, (const uint8_t[8]){0}, 8) ||
  210. rprobe(s, gdata, oc->r_val) < 0 &&
  211. nprobe(s, gdata, geob->datasize, oc->n_val) < 0) {
  212. int i;
  213. for (i = 0; i < sizeof(leaf_table); i += 2) {
  214. uint8_t buf[16];
  215. AV_WL64(buf, leaf_table[i]);
  216. AV_WL64(&buf[8], leaf_table[i+1]);
  217. kset(s, buf, buf, 16);
  218. if (!rprobe(s, gdata, oc->r_val) || !nprobe(s, gdata, geob->datasize, oc->n_val))
  219. break;
  220. }
  221. if (i >= sizeof(leaf_table)) {
  222. av_log(s, AV_LOG_ERROR, "Invalid key\n");
  223. return -1;
  224. }
  225. }
  226. /* e_val */
  227. av_des_init(&oc->av_des, oc->m_val, 64, 0);
  228. av_des_crypt(&oc->av_des, oc->e_val, &gdata[OMA_ENC_HEADER_SIZE + 40], 1, NULL, 0);
  229. hex_log(s, AV_LOG_DEBUG, "EK", oc->e_val, 8);
  230. /* init e_val */
  231. av_des_init(&oc->av_des, oc->e_val, 64, 1);
  232. return 0;
  233. }
  234. static int oma_read_header(AVFormatContext *s,
  235. AVFormatParameters *ap)
  236. {
  237. static const uint16_t srate_tab[6] = {320,441,480,882,960,0};
  238. int ret, framesize, jsflag, samplerate;
  239. uint32_t codec_params;
  240. int16_t eid;
  241. uint8_t buf[EA3_HEADER_SIZE];
  242. uint8_t *edata;
  243. AVStream *st;
  244. ID3v2ExtraMeta *extra_meta = NULL;
  245. OMAContext *oc = s->priv_data;
  246. ff_id3v2_read_all(s, ID3v2_EA3_MAGIC, &extra_meta);
  247. ret = avio_read(s->pb, buf, EA3_HEADER_SIZE);
  248. if (ret < EA3_HEADER_SIZE)
  249. return -1;
  250. if (memcmp(buf, ((const uint8_t[]){'E', 'A', '3'}),3) || buf[4] != 0 || buf[5] != EA3_HEADER_SIZE) {
  251. av_log(s, AV_LOG_ERROR, "Couldn't find the EA3 header !\n");
  252. return -1;
  253. }
  254. oc->content_start = avio_tell(s->pb);
  255. /* encrypted file */
  256. eid = AV_RB16(&buf[6]);
  257. if (eid != -1 && eid != -128 && decrypt_init(s, extra_meta, buf) < 0) {
  258. ff_id3v2_free_extra_meta(&extra_meta);
  259. return -1;
  260. }
  261. ff_id3v2_free_extra_meta(&extra_meta);
  262. codec_params = AV_RB24(&buf[33]);
  263. st = avformat_new_stream(s, NULL);
  264. if (!st)
  265. return AVERROR(ENOMEM);
  266. st->start_time = 0;
  267. st->codec->codec_type = AVMEDIA_TYPE_AUDIO;
  268. st->codec->codec_tag = buf[32];
  269. st->codec->codec_id = ff_codec_get_id(codec_oma_tags, st->codec->codec_tag);
  270. switch (buf[32]) {
  271. case OMA_CODECID_ATRAC3:
  272. samplerate = srate_tab[(codec_params >> 13) & 7]*100;
  273. if (samplerate != 44100)
  274. av_log_ask_for_sample(s, "Unsupported sample rate: %d\n",
  275. samplerate);
  276. framesize = (codec_params & 0x3FF) * 8;
  277. jsflag = (codec_params >> 17) & 1; /* get stereo coding mode, 1 for joint-stereo */
  278. st->codec->channels = 2;
  279. st->codec->sample_rate = samplerate;
  280. st->codec->bit_rate = st->codec->sample_rate * framesize * 8 / 1024;
  281. /* fake the atrac3 extradata (wav format, makes stream copy to wav work) */
  282. st->codec->extradata_size = 14;
  283. edata = av_mallocz(14 + FF_INPUT_BUFFER_PADDING_SIZE);
  284. if (!edata)
  285. return AVERROR(ENOMEM);
  286. st->codec->extradata = edata;
  287. AV_WL16(&edata[0], 1); // always 1
  288. AV_WL32(&edata[2], samplerate); // samples rate
  289. AV_WL16(&edata[6], jsflag); // coding mode
  290. AV_WL16(&edata[8], jsflag); // coding mode
  291. AV_WL16(&edata[10], 1); // always 1
  292. // AV_WL16(&edata[12], 0); // always 0
  293. avpriv_set_pts_info(st, 64, 1, st->codec->sample_rate);
  294. break;
  295. case OMA_CODECID_ATRAC3P:
  296. st->codec->channels = (codec_params >> 10) & 7;
  297. framesize = ((codec_params & 0x3FF) * 8) + 8;
  298. st->codec->sample_rate = srate_tab[(codec_params >> 13) & 7]*100;
  299. st->codec->bit_rate = st->codec->sample_rate * framesize * 8 / 1024;
  300. avpriv_set_pts_info(st, 64, 1, st->codec->sample_rate);
  301. av_log(s, AV_LOG_ERROR, "Unsupported codec ATRAC3+!\n");
  302. break;
  303. case OMA_CODECID_MP3:
  304. st->need_parsing = AVSTREAM_PARSE_FULL;
  305. framesize = 1024;
  306. break;
  307. default:
  308. av_log(s, AV_LOG_ERROR, "Unsupported codec %d!\n",buf[32]);
  309. return -1;
  310. }
  311. st->codec->block_align = framesize;
  312. return 0;
  313. }
  314. static int oma_read_packet(AVFormatContext *s, AVPacket *pkt)
  315. {
  316. OMAContext *oc = s->priv_data;
  317. int packet_size = s->streams[0]->codec->block_align;
  318. int ret = av_get_packet(s->pb, pkt, packet_size);
  319. if (ret <= 0)
  320. return AVERROR(EIO);
  321. pkt->stream_index = 0;
  322. if (oc->encrypted) {
  323. /* previous unencrypted block saved in IV for the next packet (CBC mode) */
  324. av_des_crypt(&oc->av_des, pkt->data, pkt->data, (packet_size >> 3), oc->iv, 1);
  325. }
  326. return ret;
  327. }
  328. static int oma_read_probe(AVProbeData *p)
  329. {
  330. const uint8_t *buf;
  331. unsigned tag_len = 0;
  332. buf = p->buf;
  333. /* version must be 3 and flags byte zero */
  334. if (ff_id3v2_match(buf, ID3v2_EA3_MAGIC) && buf[3] == 3 && !buf[4])
  335. tag_len = ff_id3v2_tag_len(buf);
  336. // This check cannot overflow as tag_len has at most 28 bits
  337. if (p->buf_size < tag_len + 5)
  338. return 0;
  339. buf += tag_len;
  340. if (!memcmp(buf, "EA3", 3) && !buf[4] && buf[5] == EA3_HEADER_SIZE)
  341. return AVPROBE_SCORE_MAX;
  342. else
  343. return 0;
  344. }
  345. static int oma_read_seek(struct AVFormatContext *s, int stream_index, int64_t timestamp, int flags)
  346. {
  347. OMAContext *oc = s->priv_data;
  348. pcm_read_seek(s, stream_index, timestamp, flags);
  349. if (oc->encrypted) {
  350. /* readjust IV for CBC */
  351. int64_t pos = avio_tell(s->pb);
  352. if (pos < oc->content_start)
  353. memset(oc->iv, 0, 8);
  354. else {
  355. if (avio_seek(s->pb, -8, SEEK_CUR) < 0 || avio_read(s->pb, oc->iv, 8) < 8) {
  356. memset(oc->iv, 0, 8);
  357. return -1;
  358. }
  359. }
  360. }
  361. return 0;
  362. }
  363. AVInputFormat ff_oma_demuxer = {
  364. .name = "oma",
  365. .long_name = NULL_IF_CONFIG_SMALL("Sony OpenMG audio"),
  366. .priv_data_size = sizeof(OMAContext),
  367. .read_probe = oma_read_probe,
  368. .read_header = oma_read_header,
  369. .read_packet = oma_read_packet,
  370. .read_seek = oma_read_seek,
  371. .flags = AVFMT_GENERIC_INDEX,
  372. .extensions = "oma,omg,aa3",
  373. .codec_tag = (const AVCodecTag* const []){codec_oma_tags, 0},
  374. };