You can not select more than 25 topics Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.

542 lines
16KB

  1. /*
  2. * Sony OpenMG (OMA) demuxer
  3. *
  4. * Copyright (c) 2008, 2013 Maxim Poliakovski
  5. * 2008 Benjamin Larsson
  6. * 2011 David Goldwich
  7. *
  8. * This file is part of Libav.
  9. *
  10. * Libav is free software; you can redistribute it and/or
  11. * modify it under the terms of the GNU Lesser General Public
  12. * License as published by the Free Software Foundation; either
  13. * version 2.1 of the License, or (at your option) any later version.
  14. *
  15. * Libav is distributed in the hope that it will be useful,
  16. * but WITHOUT ANY WARRANTY; without even the implied warranty of
  17. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
  18. * Lesser General Public License for more details.
  19. *
  20. * You should have received a copy of the GNU Lesser General Public
  21. * License along with Libav; if not, write to the Free Software
  22. * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
  23. */
  24. /**
  25. * @file
  26. * This is a demuxer for Sony OpenMG Music files
  27. *
  28. * Known file extensions: ".oma", ".omg", ".aa3"
  29. * The format of such files consists of three parts:
  30. * - "ea3" header carrying overall info and metadata. Except for starting with
  31. * "ea" instead of "ID", it's an ID3v2 header.
  32. * - "EA3" header is a Sony-specific header containing information about
  33. * the OpenMG file: codec type (usually ATRAC, can also be MP3 or WMA),
  34. * codec specific info (packet size, sample rate, channels and so on)
  35. * and DRM related info (file encryption, content id).
  36. * - Sound data organized in packets follow the EA3 header
  37. * (can be encrypted using the Sony DRM!).
  38. *
  39. * Supported decoders: ATRAC3, ATRAC3+, MP3, LPCM
  40. */
  41. #include <inttypes.h>
  42. #include "libavutil/channel_layout.h"
  43. #include "avformat.h"
  44. #include "internal.h"
  45. #include "libavutil/intreadwrite.h"
  46. #include "libavutil/des.h"
  47. #include "libavutil/mathematics.h"
  48. #include "oma.h"
  49. #include "pcm.h"
  50. #include "id3v2.h"
  /**
   * Built-in fallback keys tried by decrypt_init() when no user-supplied key
   * validates. Entries are consumed in pairs: two consecutive 64-bit words
   * are serialized into one 16-byte candidate key.
   */
  static const uint64_t leaf_table[] = {
      UINT64_C(0xd79e8283acea4620), UINT64_C(0x7a9762f445afd0d8),
      UINT64_C(0x354d60a60b8c79f1), UINT64_C(0x584e1cde00b07aee),
      UINT64_C(0x1573cd93da7df623), UINT64_C(0x47f98d79620dd535),
  };
  /**
   * Private demuxer state for one OpenMG file.
   */
  typedef struct OMAContext {
      /* File offset right after the EA3 header, i.e. where packet data starts. */
      uint64_t content_start;
      /* Non-zero once decrypt_init() has been entered for this file. */
      int encrypted;

      /* Section sizes read as big-endian 16-bit values from GEOB bytes 2..9. */
      uint16_t k_size;
      uint16_t e_size;
      uint16_t i_size;
      uint16_t s_size;

      /* 32-bit id read from the encryption header; compared in nprobe(). */
      uint32_t rid;

      /* 24-byte key buffers filled by kset(): up to 16 key bytes, then the
       * first 8 bytes repeated at offset 16 (used as 192-bit DES keys). */
      uint8_t r_val[24];
      uint8_t n_val[24];

      /* 8-byte intermediate values derived in rprobe(). */
      uint8_t m_val[8];
      uint8_t s_val[8];
      uint8_t sm_val[8];   /* computed MAC, checked against the stored one */

      /* 8-byte content key derived in decrypt_init(). */
      uint8_t e_val[8];
      /* CBC chaining value handed to av_des_crypt() for packet data. */
      uint8_t iv[8];

      /* DES context used on packet payloads; released in oma_read_close(). */
      struct AVDES *av_des;
  } OMAContext;
  73. static void hex_log(AVFormatContext *s, int level,
  74. const char *name, const uint8_t *value, int len)
  75. {
  76. char buf[33];
  77. len = FFMIN(len, 16);
  78. if (av_log_get_level() < level)
  79. return;
  80. ff_data_to_hex(buf, value, len, 1);
  81. buf[len << 1] = '\0';
  82. av_log(s, level, "%s: %s\n", name, buf);
  83. }
  84. static int kset(AVFormatContext *s, const uint8_t *r_val, const uint8_t *n_val,
  85. int len)
  86. {
  87. OMAContext *oc = s->priv_data;
  88. if (!r_val && !n_val)
  89. return -1;
  90. len = FFMIN(len, 16);
  91. /* use first 64 bits in the third round again */
  92. if (r_val) {
  93. if (r_val != oc->r_val) {
  94. memset(oc->r_val, 0, 24);
  95. memcpy(oc->r_val, r_val, len);
  96. }
  97. memcpy(&oc->r_val[16], r_val, 8);
  98. }
  99. if (n_val) {
  100. if (n_val != oc->n_val) {
  101. memset(oc->n_val, 0, 24);
  102. memcpy(oc->n_val, n_val, len);
  103. }
  104. memcpy(&oc->n_val[16], n_val, 8);
  105. }
  106. return 0;
  107. }
  108. #define OMA_RPROBE_M_VAL 48 + 1
  109. static int rprobe(AVFormatContext *s, uint8_t *enc_header, unsigned size,
  110. const uint8_t *r_val)
  111. {
  112. OMAContext *oc = s->priv_data;
  113. unsigned int pos;
  114. struct AVDES *av_des;
  115. if (!enc_header || !r_val ||
  116. size < OMA_ENC_HEADER_SIZE + oc->k_size + oc->e_size + oc->i_size ||
  117. size < OMA_RPROBE_M_VAL)
  118. return -1;
  119. av_des = av_des_alloc();
  120. if (!av_des)
  121. return AVERROR(ENOMEM);
  122. /* m_val */
  123. av_des_init(av_des, r_val, 192, 1);
  124. av_des_crypt(av_des, oc->m_val, &enc_header[48], 1, NULL, 1);
  125. /* s_val */
  126. av_des_init(av_des, oc->m_val, 64, 0);
  127. av_des_crypt(av_des, oc->s_val, NULL, 1, NULL, 0);
  128. /* sm_val */
  129. pos = OMA_ENC_HEADER_SIZE + oc->k_size + oc->e_size;
  130. av_des_init(av_des, oc->s_val, 64, 0);
  131. av_des_mac(av_des, oc->sm_val, &enc_header[pos], (oc->i_size >> 3));
  132. pos += oc->i_size;
  133. av_free(av_des);
  134. return memcmp(&enc_header[pos], oc->sm_val, 8) ? -1 : 0;
  135. }
  136. static int nprobe(AVFormatContext *s, uint8_t *enc_header, unsigned size,
  137. const uint8_t *n_val)
  138. {
  139. OMAContext *oc = s->priv_data;
  140. uint64_t pos;
  141. uint32_t taglen, datalen;
  142. struct AVDES *av_des;
  143. if (!enc_header || !n_val ||
  144. size < OMA_ENC_HEADER_SIZE + oc->k_size + 4)
  145. return -1;
  146. pos = OMA_ENC_HEADER_SIZE + oc->k_size;
  147. if (!memcmp(&enc_header[pos], "EKB ", 4))
  148. pos += 32;
  149. if (size < pos + 44)
  150. return -1;
  151. if (AV_RB32(&enc_header[pos]) != oc->rid)
  152. av_log(s, AV_LOG_DEBUG, "Mismatching RID\n");
  153. taglen = AV_RB32(&enc_header[pos + 32]);
  154. datalen = AV_RB32(&enc_header[pos + 36]) >> 4;
  155. pos += 44;
  156. if (size - pos < taglen)
  157. return -1;
  158. pos += taglen;
  159. if (datalen << 4 > size - pos)
  160. return -1;
  161. av_des = av_des_alloc();
  162. if (!av_des)
  163. return AVERROR(ENOMEM);
  164. av_des_init(av_des, n_val, 192, 1);
  165. while (datalen-- > 0) {
  166. av_des_crypt(av_des, oc->r_val, &enc_header[pos], 2, NULL, 1);
  167. kset(s, oc->r_val, NULL, 16);
  168. if (!rprobe(s, enc_header, size, oc->r_val)) {
  169. av_free(av_des);
  170. return 0;
  171. }
  172. pos += 16;
  173. }
  174. av_free(av_des);
  175. return -1;
  176. }
  177. static int decrypt_init(AVFormatContext *s, ID3v2ExtraMeta *em, uint8_t *header)
  178. {
  179. OMAContext *oc = s->priv_data;
  180. ID3v2ExtraMetaGEOB *geob = NULL;
  181. uint8_t *gdata;
  182. oc->encrypted = 1;
  183. av_log(s, AV_LOG_INFO, "File is encrypted\n");
  184. /* find GEOB metadata */
  185. while (em) {
  186. if (!strcmp(em->tag, "GEOB") &&
  187. (geob = em->data) &&
  188. (!strcmp(geob->description, "OMG_LSI") ||
  189. !strcmp(geob->description, "OMG_BKLSI"))) {
  190. break;
  191. }
  192. em = em->next;
  193. }
  194. if (!em) {
  195. av_log(s, AV_LOG_ERROR, "No encryption header found\n");
  196. return AVERROR_INVALIDDATA;
  197. }
  198. if (geob->datasize < 64) {
  199. av_log(s, AV_LOG_ERROR,
  200. "Invalid GEOB data size: %"PRIu32"\n", geob->datasize);
  201. return AVERROR_INVALIDDATA;
  202. }
  203. gdata = geob->data;
  204. if (AV_RB16(gdata) != 1)
  205. av_log(s, AV_LOG_WARNING, "Unknown version in encryption header\n");
  206. oc->k_size = AV_RB16(&gdata[2]);
  207. oc->e_size = AV_RB16(&gdata[4]);
  208. oc->i_size = AV_RB16(&gdata[6]);
  209. oc->s_size = AV_RB16(&gdata[8]);
  210. if (memcmp(&gdata[OMA_ENC_HEADER_SIZE], "KEYRING ", 12)) {
  211. av_log(s, AV_LOG_ERROR, "Invalid encryption header\n");
  212. return AVERROR_INVALIDDATA;
  213. }
  214. if (OMA_ENC_HEADER_SIZE + oc->k_size + oc->e_size + oc->i_size + 8 > geob->datasize ||
  215. OMA_ENC_HEADER_SIZE + 48 > geob->datasize) {
  216. av_log(s, AV_LOG_ERROR, "Too little GEOB data\n");
  217. return AVERROR_INVALIDDATA;
  218. }
  219. oc->rid = AV_RB32(&gdata[OMA_ENC_HEADER_SIZE + 28]);
  220. av_log(s, AV_LOG_DEBUG, "RID: %.8"PRIx32"\n", oc->rid);
  221. memcpy(oc->iv, &header[0x58], 8);
  222. hex_log(s, AV_LOG_DEBUG, "IV", oc->iv, 8);
  223. hex_log(s, AV_LOG_DEBUG, "CBC-MAC",
  224. &gdata[OMA_ENC_HEADER_SIZE + oc->k_size + oc->e_size + oc->i_size],
  225. 8);
  226. if (s->keylen > 0) {
  227. kset(s, s->key, s->key, s->keylen);
  228. }
  229. if (!memcmp(oc->r_val, (const uint8_t[8]){0}, 8) ||
  230. rprobe(s, gdata, geob->datasize, oc->r_val) < 0 &&
  231. nprobe(s, gdata, geob->datasize, oc->n_val) < 0) {
  232. int i;
  233. for (i = 0; i < FF_ARRAY_ELEMS(leaf_table); i += 2) {
  234. uint8_t buf[16];
  235. AV_WL64(buf, leaf_table[i]);
  236. AV_WL64(&buf[8], leaf_table[i + 1]);
  237. kset(s, buf, buf, 16);
  238. if (!rprobe(s, gdata, geob->datasize, oc->r_val) ||
  239. !nprobe(s, gdata, geob->datasize, oc->n_val))
  240. break;
  241. }
  242. if (i >= FF_ARRAY_ELEMS(leaf_table)) {
  243. av_log(s, AV_LOG_ERROR, "Invalid key\n");
  244. return AVERROR_INVALIDDATA;
  245. }
  246. }
  247. oc->av_des = av_des_alloc();
  248. if (!oc->av_des)
  249. return AVERROR(ENOMEM);
  250. /* e_val */
  251. av_des_init(oc->av_des, oc->m_val, 64, 0);
  252. av_des_crypt(oc->av_des, oc->e_val,
  253. &gdata[OMA_ENC_HEADER_SIZE + 40], 1, NULL, 0);
  254. hex_log(s, AV_LOG_DEBUG, "EK", oc->e_val, 8);
  255. /* init e_val */
  256. av_des_init(oc->av_des, oc->e_val, 64, 1);
  257. return 0;
  258. }
  259. static int oma_read_header(AVFormatContext *s)
  260. {
  261. int ret, framesize, jsflag, samplerate;
  262. uint32_t codec_params, channel_id;
  263. int16_t eid;
  264. uint8_t buf[EA3_HEADER_SIZE];
  265. uint8_t *edata;
  266. AVStream *st;
  267. ID3v2ExtraMeta *extra_meta = NULL;
  268. OMAContext *oc = s->priv_data;
  269. ff_id3v2_read(s, ID3v2_EA3_MAGIC, &extra_meta);
  270. ret = avio_read(s->pb, buf, EA3_HEADER_SIZE);
  271. if (ret < EA3_HEADER_SIZE)
  272. return -1;
  273. if (memcmp(buf, ((const uint8_t[]){'E', 'A', '3'}), 3) ||
  274. buf[4] != 0 || buf[5] != EA3_HEADER_SIZE) {
  275. av_log(s, AV_LOG_ERROR, "Couldn't find the EA3 header !\n");
  276. return AVERROR_INVALIDDATA;
  277. }
  278. oc->content_start = avio_tell(s->pb);
  279. /* encrypted file */
  280. eid = AV_RB16(&buf[6]);
  281. if (eid != -1 && eid != -128 && decrypt_init(s, extra_meta, buf) < 0) {
  282. ff_id3v2_free_extra_meta(&extra_meta);
  283. return -1;
  284. }
  285. ff_id3v2_free_extra_meta(&extra_meta);
  286. codec_params = AV_RB24(&buf[33]);
  287. st = avformat_new_stream(s, NULL);
  288. if (!st)
  289. return AVERROR(ENOMEM);
  290. st->start_time = 0;
  291. st->codecpar->codec_type = AVMEDIA_TYPE_AUDIO;
  292. st->codecpar->codec_tag = buf[32];
  293. st->codecpar->codec_id = ff_codec_get_id(ff_oma_codec_tags,
  294. st->codecpar->codec_tag);
  295. switch (buf[32]) {
  296. case OMA_CODECID_ATRAC3:
  297. samplerate = ff_oma_srate_tab[(codec_params >> 13) & 7] * 100;
  298. if (!samplerate) {
  299. av_log(s, AV_LOG_ERROR, "Unsupported sample rate\n");
  300. return AVERROR_INVALIDDATA;
  301. }
  302. if (samplerate != 44100)
  303. avpriv_request_sample(s, "Sample rate %d", samplerate);
  304. framesize = (codec_params & 0x3FF) * 8;
  305. /* get stereo coding mode, 1 for joint-stereo */
  306. jsflag = (codec_params >> 17) & 1;
  307. st->codecpar->channels = 2;
  308. st->codecpar->channel_layout = AV_CH_LAYOUT_STEREO;
  309. st->codecpar->sample_rate = samplerate;
  310. st->codecpar->bit_rate = st->codecpar->sample_rate * framesize * 8 / 1024;
  311. /* fake the ATRAC3 extradata
  312. * (wav format, makes stream copy to wav work) */
  313. st->codecpar->extradata_size = 14;
  314. edata = av_mallocz(14 + AV_INPUT_BUFFER_PADDING_SIZE);
  315. if (!edata)
  316. return AVERROR(ENOMEM);
  317. st->codecpar->extradata = edata;
  318. AV_WL16(&edata[0], 1); // always 1
  319. AV_WL32(&edata[2], samplerate); // samples rate
  320. AV_WL16(&edata[6], jsflag); // coding mode
  321. AV_WL16(&edata[8], jsflag); // coding mode
  322. AV_WL16(&edata[10], 1); // always 1
  323. // AV_WL16(&edata[12], 0); // always 0
  324. avpriv_set_pts_info(st, 64, 1, st->codecpar->sample_rate);
  325. break;
  326. case OMA_CODECID_ATRAC3P:
  327. channel_id = (codec_params >> 10) & 7;
  328. if (!channel_id) {
  329. av_log(s, AV_LOG_ERROR,
  330. "Invalid ATRAC-X channel id: %"PRIu32"\n", channel_id);
  331. return AVERROR_INVALIDDATA;
  332. }
  333. st->codecpar->channel_layout = ff_oma_chid_to_native_layout[channel_id - 1];
  334. st->codecpar->channels = ff_oma_chid_to_num_channels[channel_id - 1];
  335. framesize = ((codec_params & 0x3FF) * 8) + 8;
  336. samplerate = ff_oma_srate_tab[(codec_params >> 13) & 7] * 100;
  337. if (!samplerate) {
  338. av_log(s, AV_LOG_ERROR, "Unsupported sample rate\n");
  339. return AVERROR_INVALIDDATA;
  340. }
  341. st->codecpar->sample_rate = samplerate;
  342. st->codecpar->bit_rate = samplerate * framesize * 8 / 2048;
  343. avpriv_set_pts_info(st, 64, 1, samplerate);
  344. break;
  345. case OMA_CODECID_MP3:
  346. st->need_parsing = AVSTREAM_PARSE_FULL;
  347. framesize = 1024;
  348. break;
  349. case OMA_CODECID_LPCM:
  350. /* PCM 44.1 kHz 16 bit stereo big-endian */
  351. st->codecpar->channels = 2;
  352. st->codecpar->channel_layout = AV_CH_LAYOUT_STEREO;
  353. st->codecpar->sample_rate = 44100;
  354. framesize = 1024;
  355. /* bit rate = sample rate x PCM block align (= 4) x 8 */
  356. st->codecpar->bit_rate = st->codecpar->sample_rate * 32;
  357. st->codecpar->bits_per_coded_sample =
  358. av_get_bits_per_sample(st->codecpar->codec_id);
  359. avpriv_set_pts_info(st, 64, 1, st->codecpar->sample_rate);
  360. break;
  361. default:
  362. av_log(s, AV_LOG_ERROR, "Unsupported codec %d!\n", buf[32]);
  363. return AVERROR(ENOSYS);
  364. }
  365. st->codecpar->block_align = framesize;
  366. return 0;
  367. }
  368. static int oma_read_packet(AVFormatContext *s, AVPacket *pkt)
  369. {
  370. OMAContext *oc = s->priv_data;
  371. AVStream *st = s->streams[0];
  372. int packet_size = st->codecpar->block_align;
  373. int byte_rate = st->codecpar->bit_rate >> 3;
  374. int64_t pos = avio_tell(s->pb);
  375. int ret = av_get_packet(s->pb, pkt, packet_size);
  376. if (ret < packet_size)
  377. pkt->flags |= AV_PKT_FLAG_CORRUPT;
  378. if (ret < 0)
  379. return ret;
  380. if (!ret)
  381. return AVERROR_EOF;
  382. pkt->stream_index = 0;
  383. if (pos > 0) {
  384. pkt->pts =
  385. pkt->dts = av_rescale(pos, st->time_base.den,
  386. byte_rate * (int64_t)st->time_base.num);
  387. }
  388. if (oc->encrypted) {
  389. /* previous unencrypted block saved in IV for
  390. * the next packet (CBC mode) */
  391. if (ret == packet_size)
  392. av_des_crypt(oc->av_des, pkt->data, pkt->data,
  393. (packet_size >> 3), oc->iv, 1);
  394. else
  395. memset(oc->iv, 0, 8);
  396. }
  397. return ret;
  398. }
  399. static int oma_read_probe(AVProbeData *p)
  400. {
  401. const uint8_t *buf = p->buf;
  402. unsigned tag_len = 0;
  403. if (p->buf_size >= ID3v2_HEADER_SIZE && ff_id3v2_match(buf, ID3v2_EA3_MAGIC))
  404. tag_len = ff_id3v2_tag_len(buf);
  405. /* This check cannot overflow as tag_len has at most 28 bits */
  406. if (p->buf_size < tag_len + 5)
  407. /* EA3 header comes late, might be outside of the probe buffer */
  408. return tag_len ? AVPROBE_SCORE_EXTENSION : 0;
  409. buf += tag_len;
  410. if (!memcmp(buf, "EA3", 3) && !buf[4] && buf[5] == EA3_HEADER_SIZE)
  411. return AVPROBE_SCORE_MAX;
  412. else
  413. return 0;
  414. }
  415. static int oma_read_seek(struct AVFormatContext *s,
  416. int stream_index, int64_t timestamp, int flags)
  417. {
  418. OMAContext *oc = s->priv_data;
  419. int err = ff_pcm_read_seek(s, stream_index, timestamp, flags);
  420. if (!oc->encrypted)
  421. return err;
  422. /* readjust IV for CBC */
  423. if (err || avio_tell(s->pb) < oc->content_start)
  424. goto wipe;
  425. if ((err = avio_seek(s->pb, -8, SEEK_CUR)) < 0)
  426. goto wipe;
  427. if ((err = avio_read(s->pb, oc->iv, 8)) < 8) {
  428. if (err >= 0)
  429. err = AVERROR_EOF;
  430. goto wipe;
  431. }
  432. return 0;
  433. wipe:
  434. memset(oc->iv, 0, 8);
  435. return err;
  436. }
  437. static int oma_read_close(AVFormatContext *s)
  438. {
  439. OMAContext *oc = s->priv_data;
  440. av_free(oc->av_des);
  441. return 0;
  442. }
  443. AVInputFormat ff_oma_demuxer = {
  444. .name = "oma",
  445. .long_name = NULL_IF_CONFIG_SMALL("Sony OpenMG audio"),
  446. .priv_data_size = sizeof(OMAContext),
  447. .read_probe = oma_read_probe,
  448. .read_header = oma_read_header,
  449. .read_packet = oma_read_packet,
  450. .read_seek = oma_read_seek,
  451. .read_close = oma_read_close,
  452. .flags = AVFMT_GENERIC_INDEX,
  453. .extensions = "oma,omg,aa3",
  454. .codec_tag = (const AVCodecTag* const []){ff_oma_codec_tags, 0},
  455. };