MP4音频解码信息

文章转载自:http://blog.csdn.net/flyingqr/archive/2010/02/02/5282600.aspx 版权归原作者,编辑:小乙哥

MP4文件格式分为头部和数据两部分,头部是由许多被称作Atom的结构单元嵌套或排列而成,数据部分则完全为实际数据不包含元信息,因此具体解码时音视频帧的位置和大小都要在头部获取。详细内容见以下链接:
http://wqyuwss.52rd.net
这里总结下音频解码信息获取的一些经验,当然详细内容需要查看quick time file format的文档。
MP4的音频解码信息保存在如下嵌套的Atom中,{moov{mdia{minf{smhd{stbl{stsd}}}}}}
stsd可能包括多个音频信息的描述,结构如下:

typedef struct stsdtable
{
    unsigned int size;//Atom大小
    char format[4];//音频编码格式
    int res1;
    int ref;
    short version;//版本
    short pad1;
    int pad2;
    short channels;//声道
    short bitspersample;
    short compress_id;
    short res2;
    short samplerate1;//采样率
    short samplerate2;
    //{if(version==1)

        int sampleperpacket;
        int bytesperpacket;
        int bytesperframe;
        int bytespersample;
    //}

} stsdtable;

其中format对应音频编码格式:
PCM_S32BE,  in32
PCM_S32LE,  in32
PCM_S24BE,  in24
PCM_S24LE,  in24
PCM_S16BE,  twos // 16 bits //
PCM_S16LE,  sowt // 
PCM_S16LE,  lpcm
PCM_F32BE,  fl32
PCM_F64BE,  fl64
PCM_S8,     sowt
PCM_U8,     raw  // 8 bits unsigned
PCM_U8,     NONE // uncompressed
PCM_MULAW,  ulaw //
PCM_ALAW,   alaw //
ADPCM_IMA_QT, ima4 // IMA-4 ADPCM //
MACE3,      MAC3 // Macintosh Audio Compression and Expansion 3:1 ///
MACE6,      MAC6 // Macintosh Audio Compression and Expansion 6:1 //
MP3,        .mp3 // MPEG layer 3 */
uint8_t moov[] = "moov";
uint8_t trak[] = "trak";
uint8_t mdia[] = "mdia";
uint8_t minf[] = "minf";
uint8_t stbl[] = "stbl";
uint8_t stsd[] = "stsd";
uint8_t stsc[] = "stsc";
uint8_t stsz[] = "stsz";
uint8_t stco[] = "stco";
uint8_t ftyp[] = "ftyp";
uint8_t mdat[] = "mdat";

typedef struct Atom
{
    unsigned int size;
    uint8_t tag[4];
    int ver_flag;
    unsigned int num_of_entries;
    unsigned int pos;
    uint8_t *data;
} Atom;



uint8_t kmp3[] = {0x6D,0x73,0x00,0x55};
uint8_t fmp3[] = ".mp3";
uint8_t raw[] = "raw ";

uint8_t wave[] = "wave";
uint8_t mp4a[] = "mp4a";
uint8_t enca[] = "enca";//encrypted to ISO/IEC 14496-12 or 3GPP standards

uint8_t smar[] = "smar";//encoded to 3GPP GSM 6.10 AMR narrowband standards

uint8_t sawb[] = "sawb";//encoded to 3GPP GSM 6.10 AMR wideband standards

uint8_t m4ds[] = "m4ds";//encoded to ISO/IEC 14496-10 AVC standards

uint8_t esds[] = "esds";
uint8_t fram[] = "fram";


#define MKTAG(a,b,c,d) (a | (b << 8) | (c << 16) | (d << 24))
typedef struct AVCodecTag {
    int id;
    unsigned int tag;
} AVCodecTag;


typedef struct stsdtable
{
    unsigned int size;
    char format[4];
    int res1;
    int ref;
    short version;
    short pad1;
    int pad2;
    short channels;
    short bitspersample;
    short compress_id;
    short res2;
    short samplerate1;
    short samplerate2;
    //{if(version==1)

        int sampleperpacket;
        int bytesperpacket;
        int bytesperframe;
        int bytespersample;
    //}

} stsdtable;


typedef struct sampletable
{
    unsigned int size;
    unsigned int id_of_sd;
} sampletable;
//MP4Analyze.cpp
#include "MP4Analyze.h"
#include <vector>
#include <map>
#include <iostream>
#include <string>
#ifdef WIN32
#include <winsock2.h>
#pragma comment(lib, "Ws2_32.lib")
#pragma warning (disable:4786)
#endif

#ifdef __GNUG__
#include <netinet/in.h>
#endif
using namespace std;




int check_format(uint8_t *data, int size)
{
    if(strncmp((char*)moov,(char*)(data+4),4)==0 ||
        strncmp((char*)ftyp,(char*)(data+4),4)==0 ||strncmp((char*)mdat,(char*)(data+4),4)==0 )
        return 0;
    return -1;
}

unsigned int get_size(const uint8_t *data,int size)
{
    unsigned int tmp = 0;
    for(int i=0; i<size; ++i)
    {
        tmp <<= 8;
        tmp += *data++;
    }
    return tmp;
}

int seek_tag(uint8_t tag[],uint8_t *data, unsigned int size1,uint8_t **pos,unsigned int *size2)
{
    if(data == NULL || size1 == 0)
        return -1;
    unsigned int tag_size = get_size(data,4);
    if(tag_size >size1 + 8)
        return -1;
    unsigned int tmp = 0;
    while(strncmp((char*)data+4,(char*)tag,4) != 0)
    {
    //    printf("%s/n",data+4);

        if(tag_size==0)
            return -1;
        if(tag_size < size1 + 8)
        {
            data += tag_size;
            tmp += tag_size;
        }
        else
            return -1;
        tag_size = get_size(data,4);
    }
    printf("find :%c%c%c%c/n",tag[0],tag[1],tag[2],tag[3]);
    if(tmp + tag_size > size1 )
     printf("warning: the atom may be not complete!/n");
    *pos = data+8;
    *size2 = tag_size -8;
    return tmp;
}

v文章转载自:http://blog.csdn.net/flyingqr/archive/2010/02/02/5282600.aspx 版权归原作者,编辑:小乙哥

vector<stsdtable>& get_audio_info(uint8_t *data, unsigned int size, vector<stsdtable>& stable)//stsd

{
    uint8_t * datapos = data;
    Atom *stsd_audio =(Atom *)data;
    int tmp_size = 16;

    printf("size : %u/n",ntohl(stsd_audio->size));
    printf("num_entr: %u/n",ntohl(stsd_audio->num_of_entries));

    for(int i=0; i < ntohl(stsd_audio->num_of_entries); ++i)
    {
        if(tmp_size > size)//注意

            return stable;
        datapos += tmp_size;
        stsdtable * audio_entry = (stsdtable *)(datapos);
        stable.push_back(*audio_entry);//这里存入的是网络序的数据,使用时需进行转换

        tmp_size += ntohl(audio_entry->size);

    
        printf("--tablesize: %d/n",ntohl(audio_entry->size));
        printf("--format : %s/n",audio_entry->format);
        printf("--version : %d/n",ntohs(audio_entry->version));
        printf("--channels: %d/n",ntohs(audio_entry->channels));
        printf("--bitpersam: %d/n",ntohs(audio_entry->bitspersample));
        printf("--IDcompress: %d/n",ntohs(audio_entry->compress_id));    
        printf("--samplerate: %d.%d/n",ntohs(audio_entry->samplerate1),ntohs(audio_entry->samplerate2));
        

     tmp_size = sizeof(stsdtable);
        if(ntohs(audio_entry->version)==0)
        {
            tmp_size -= 16;
        }
        datapos += tmp_size;
        //if(ntohs(audio_entry->compress_id)==-2)//此处尚需考证

        if(ntohl(audio_entry->size) > sizeof(stsdtable))
        {
            printf("----atom size:%d/n",get_size(datapos,4));
            printf("----atom name:%c%c%c%c/n",datapos[4],datapos[5],datapos[6],datapos[7]);
            if(strncmp((char*)datapos,(char*)esds,4)==0)
            {
                //handle esds

            }
        }
    }
    return stable;
}

map<unsigned int,sampletable> & get_packet_offset(uint8_t *STBL[], map<unsigned int,sampletable>& table)
{
    //table.insert(pair<long,sampletable>(1,sample));

    unsigned int num_sam_to_chunk = get_size(STBL[0]-4,4);//stsc

    unsigned int num_sample = get_size(STBL[1]-4,4);//stsz

    unsigned int num_chunk = get_size(STBL[2]-4,4);//stco

    unsigned int chunk_index = 0;
    unsigned int next_chunk_index = 0;
    uint8_t *cur_sam_to_chunk = STBL[0];
    uint8_t *cur_sam_size = STBL[1];
    uint8_t *cur_chunk_offset = STBL[2];
    sampletable sample;
    printf("number of stsc entries:%d /nnumber of sample size:%d /nnumber of chunk offset:%d/n",num_sam_to_chunk,num_sample,num_chunk);
    for(unsigned int i = 0; i < num_sam_to_chunk; ++i)//对所有的entries

    {
        chunk_index = get_size(cur_sam_to_chunk,4);
        next_chunk_index = get_size(cur_sam_to_chunk+12,4);
        sample.id_of_sd = get_size(cur_sam_to_chunk+8,4);
        if(i == num_sam_to_chunk -1)//最后一个

        {
            next_chunk_index = num_chunk+1;
        }
        printf("chunk_index:(%d---%d)/n",chunk_index,next_chunk_index);
        for(unsigned int k=chunk_index; k < next_chunk_index; ++k)//当前chunk序号到下一个chunk序号之间的chunk

        {//处理所有重复的chunk

            printf("chunk_index:%d sample num:%d/n",chunk_index,get_size(cur_sam_to_chunk+4,4));
            unsigned int offset = get_size(cur_chunk_offset+(chunk_index-1)*4,4);
            for(unsigned int j=0; j < get_size(cur_sam_to_chunk+4,4); ++j)//chunk内地sample数目

            {//处理该chunk中的sample

                sample.size = get_size(cur_sam_size,4);    
                printf("--sample offset:%d %x size:%d/n",offset,offset,sample.size);
                table.insert(pair<unsigned int,sampletable>(offset,sample));
                offset = offset + sample.size;
                cur_sam_size += 4;
            }
            system("pause");
            chunk_index++;
        }
        cur_sam_to_chunk += 12;
    }
    return table;
}
文章转载自:http://blog.csdn.net/flyingqr/archive/2010/02/02/5282600.aspx 版权归原作者,编辑:小乙哥

int
seek_audio_atom( uint8_t *data1, unsigned int size1)
{
    uint8_t tag[] = "mdiaminfsmhd";
    uint8_t *datapos;
    unsigned int tag_size;
    uint8_t *data;
    unsigned int size;
    int offset_of_atom = 0;
    if((offset_of_atom = seek_tag(moov, data1, size1, &data, &size)) == -1)
        return -1;
    if(offset_of_atom + size >size1)
    {
//some handles

        printf("moov atom is not complete,need more data");
    }
    data1 = data;
    size1 = size;
    uint8_t *nexttrak = data;
    unsigned int traksize = size;
    int i=0;
    while(1)
    {
        printf("-----/n");
        if(seek_tag(trak, nexttrak, traksize, &datapos, &tag_size) != -1)
        {
            nexttrak = datapos + tag_size;
            if(size1 < (nexttrak - data1))
                return -1;
            traksize = size1 - (nexttrak - data1);
            data = datapos;
            size = tag_size;
        }
        else
        {
            return -1;
        }
        i=0;
        while(i<3)
        {
            if(seek_tag(tag+i*4, data, size, &datapos, &tag_size) != -1)
            {
                if(i==2)
                 break;
                data = datapos;
                size = tag_size;
                ++i;
            }
            else
            {
                break;
            }
        }
        if(strncmp("smhd",(char*)(datapos-4),4) == 0)
        {
            if(seek_tag(stbl, data, size, &datapos, &tag_size)!= -1)
            {
                printf("—find audio stbl—!/n");
                data = datapos;
                size = tag_size;

                if(seek_tag(stsd, data, size, &datapos, &tag_size) != -1)
                {
                    vector<stsdtable> stable;
//音频信息

                    get_audio_info(datapos-8, tag_size,stable);
                }

                uint8_t *STBL[3] ={NULL,NULL,NULL};
//

                uint8_t *datapos1;
                unsigned int tag_size1;
//

                if(seek_tag(stsc, data, size, &datapos1, &tag_size1) != -1)
                {
                    STBL[0] = datapos1 + 8;
                }
                uint8_t *datapos2;
                unsigned int tag_size2;
                if(seek_tag(stsz, data, size, &datapos2, &tag_size2) != -1)
                {
                    STBL[1] = datapos2 + 12;
                }
                uint8_t *datapos3;
                unsigned int tag_size3;
                if(seek_tag(stco, data, size, &datapos3, &tag_size3) != -1)
                {
                    STBL[2] = datapos3 + 8;
                }
                if(STBL[0] && STBL[1] && STBL[2] )
                {
                    map<unsigned int,sampletable> postable;
//音频帧信息

                    get_packet_offset(STBL,postable);
                }
            }
            return 0;
        }
    }
    return -1;
}
int main(char arg, char *argv[])
{
    FILE *mp4;
    cout<<"please input the file name :"<<endl;
    string filename;
    cin>>filename;
    mp4 = fopen(filename.c_str(),"rb");
    uint8_t buffer[300000];
    fread(buffer,1,300000,mp4);

    seek_audio_atom((uint8_t*)buffer,300000);

    fclose(mp4);
    return 0;
}

本文来自互联网用户投稿,该文观点仅代表作者本人,不代表本站立场。本站仅提供信息存储空间服务,不拥有所有权,不承担相关法律责任。如若转载,请注明出处:http://www.mzph.cn/news/455335.shtml

如若内容造成侵权/违法违规/事实不符,请联系多彩编程网进行投诉反馈email:809451989@qq.com,一经查实,立即删除!

相关文章

时序图 分支_UML用例图

UML用例图用例图有以下东东:用例参与者关联系统边界用例使用椭圆来表示&#xff0c;椭圆里边写上用例的名称:这里的用例可以理解为一个动作或行为,或者一个对象。参与者用一个小人儿,在小人儿下面写上参与者名称,例如学生:关联用一条线表示:把很多个用例放到一个大的矩形框里。…

Python脚本实现汉子转拼音

起步 中华文化博大精深&#xff0c;是中华民族的财富&#xff0c;吸收和继承发扬中 华文化&#xff0c;是现代每个炎黄子孙无可推卸的天职。 今天小编就交大家用python写一个脚本,实现汉子和拼音之间的转换 pinyin.py 汉字转拼音,With Python Example: from pinyin impor…

MySQL innodb_table_stats表不存在的解决方法

在做实验时&#xff0c;使用mysqldump命令报错[rootlinux-mysql02 3306]# mysqldump -uroot -p123456 -S /u02/data/3306/mysql.sock -A -B --events | gzip > /opt/rep.sql.gzmysqldump: Got error: 1146: Table mysql.innodb_index_stats doesnt exist when using LOCK TA…

自定义封装 banner 组件

1. 效果图预览 2.基本功能 一个简单方便的轮播图组件&#xff0c;基于viewpager 基础上进行的封装。可设置 项目中图片&#xff0c;网络图片&#xff0c; View&#xff1b;支持循环自动播放&#xff0c;手势滑动切换&#xff0c;item点击事件,可设置 点点的样式宽高、颜色、大小…

vb.net服务器启动后cpu占用了70_记一次服务器被异常程序占用的解决过程(怀疑黑客攻击)...

最近在跑实验&#xff0c;但是突然发现程序运行变慢&#xff0c;然后top命令查看程序运行情况&#xff0c;发现有异常进程&#xff0c;名字叫 bash&#xff0c;占用 2400% CPU计算资源。刚开始怀疑是挖矿程序&#xff0c;因实验室网络IP为教育网公网&#xff0c;怀疑被攻击&…

3gp文件格式研究 (转windcao的专栏)

序言 06我开始做3gp文件的播放器,但是关于3gp的文档太少了也很难找,在网友luxh的帮助下,我终于有了第一份关于3gp文件格式的文档《ISO/IEC 14496-12&#xff0c;ISO媒体文件格式》.在此真心感谢luxh的贡献.当然了是英文版的,有文档就不错了.为了便于查阅和理解,我把之后陆续找…

Android开发必用工具及其进阶途径

三百六十行&#xff0c;行行出状元&#xff0c;怎么样才能在Android行业中当个状元了&#xff0c;开发过程中的高效、自我能力的提升显得至关重要&#xff0c;步入IT行业更是要时时刻刻学习&#xff0c;新技术更新快&#xff0c;今天将介绍一下Android开发中必用工具及其进阶途…

MySQL遇到check the manual that corresponds to your MySQL server version for the right syntax错误

原来是MySQL表中不能包含关键字 转载于:https://www.cnblogs.com/flycoding/p/7088465.html

Python脚本实现图片加水印

起步 图片是指由图形、图像等构成的平面媒体,有形式的事物&#xff0c;我们看到的&#xff0c;是图画、照片、拓片等的统称。 为了保护一些原创图片的版权,某些时候我们需要在图片上面,加上水印,当然你可以用Photoshop来做,只不过如果图片数量过多,亦或者图片的动态生成的时候…

yarn 怎么查看有多个job在跑_flink on yarn 模式下提示yarn资源不足问题分析

背景在实时计算平台上通过YarnClient向yarn上提交flink任务时一直卡在那里&#xff0c;并在client端一直输出如下日志&#xff1a;(YarnClusterDescriptor.java:1036)- Deployment took more than 60 seconds. Please check if the requested resources are available in the Y…

MPEG-2TS码流编辑的原理及其应用(转载

[作者&#xff1a;辽宁电视台 赵季伟] 在当今数字媒体不断发展、新媒体业务不断涌现 的前提下&#xff0c;实践证明襁褓中的新媒体只有两种经营方略可供选择&#xff1a;或是购买并集成整套节目&#xff0c;或是低成本深加工新节目&#xff0c;再不可能去按照传统生产模式…

Python中的yield详解

阅读别人的python源码时碰到了这个yield这个关键字&#xff0c;各种搜索终于搞懂了&#xff0c;在此做一下总结&#xff1a; 通常的for…in…循环中&#xff0c;in后面是一个数组&#xff0c;这个数组就是一个可迭代对象&#xff0c;类似的还有链表&#xff0c;字符串&#xf…

shell循环结构之while循环

while循环 1) while CONDITION; dostatementstatement<改变循环条件真假的语句>done 编写脚本&#xff0c;计算1---100的和 #!/bin/bash#sum0i1while [ $i -le 100 ]; dolet sum$sum$ilet i$i1doneecho $sum2) while true; do statementstatementdone #!/bin/bash#while …

python 管道队列_关于python:Multiprocessing-管道与队列

Python的多处理程序包中的队列和管道之间的根本区别是什么&#xff1f;在什么情况下应该选择一种&#xff1f; 什么时候使用Pipe()有优势&#xff1f; 什么时候使用Queue()有优势&#xff1f;Pipe()只能有两个端点。Queue()可以有多个生产者和消费者。何时使用它们如果需要两个…

pip默认使用国内镜像地址

很多小伙伴在ubuntu系统下,使用pip安装会很慢 以为安装源在国外服务器上面 今天小编就教大家配置成让pip默认从国内源中寻找安装包 首先CtrlAltT打开终端 进入家目录 cd ~在家目录中创建一个文件夹,命名为.pip mkdir .pip进入目录,并创建一个名为pip.conf的文件 cd .pip…

“大型票务系统”和“实物电商系统”的数据库选型

讨论请移步至&#xff1a;http://www.zhiliaotech.com/ideajam/idea/detail/423 相关文章&#xff1a; 《今天你买到票了吗&#xff1f;——从铁道部12306.cn站点漫谈电子商务站点的“海量事务快速处理”系统》 不能简单套用“实物电商系统”对“大型票务系统”做需求分析 “大…

FLV文件格式(Z)(转载)

刚才在看一些关于demux的东西&#xff0c;在处理flv格式的文件的时候&#xff0c;由于自己对flv文件的格式不了解&#xff0c;所以就比较云头转向&#xff0c;正好看到了一篇讲述flv文件格式的文章&#xff0c;写的比较明白&#xff0c;所以就转过来了。O(∩_∩)O~flv头文件比较…

mysql-5.7中的innodb_buffer_pool_prefetching(read-ahead)详解

一、innodb的read-ahead是什么&#xff1a; 所谓的read-ahead就是innodb根据你现在访问的数据&#xff0c;推测出你接下来可能要访问的数据&#xff0c;并把它们(可能要访问的数据)读入 内存。 二、read-ahead是怎么做到的&#xff1a; 1、总的来说read-ahead利用的是程序的局部…

python compare excel_python简单操作excle的方法

Python操作Excle文件&#xff1a;使用xlwt库将数据写入Excel表格&#xff0c;使用xlrd 库从Excel读取数据。从excle读取数据存入数据库1、导入模块&#xff1a;import xlrd2、打开excle文件&#xff1a;data xlrd.open_workbook(excel.xls)3、获取表、行/列值、行/列数、单元值…

collections系列

class Counter(dict):  Counter类继承dict类、继承了dict的所有功能计数器&#xff1a; 例&#xff1a;import collections obj collections.Counter(sdkasdioasdjoasjdoasd) print(obj)得&#xff1a;Counter({s: 5, d: 5, a: 4, o: 3, j: 2, k: 1, i: 1}) 拿到前几位&…