FFMPEG + SDL音频播放分析
2016-09
睿丰德RFID软件系统集成商
目录 [hide]
抽象流程:
设置SDL的音频参数 —-> 打开声音设备,播放静音 —-> ffmpeg读取音频流中数据放入队列 —-> SDL调用用户设置的函数来获取音频数据 —-> 播放音频
SDL内部维护了一个buffer来存放解码后的数据,这个buffer中的数据来源是我们注册的回调函数(audio_callback),audio_callback调用audio_decode_frame来做具体的音频解码工作,需要引起注意的是:从流中读取出的一个音频包(avpacket)可能含有多个音频桢(avframe),所以需要多次调用avcodec_decode_audio4来完成整个包的解码,解码出来的数据存放在我们自己的缓冲中(audio_buf2)。SDL每一次回调都会引起数据从audio_buf2拷贝到SDL内部缓冲区,当audio_buf2中的数据大于SDL的缓冲区大小时,需要分多次拷贝。
关键实现:
main()函数
1int main(int argc, char **argv){2 SDL_Event event; //SDL事件变量3 VideoState *is; // 纪录视频及解码器等信息的大结构体4 is = (VideoState*) av_mallocz(sizeof(VideoState));5 if(argc < 2){6 fprintf(stderr, "Usage: play <file>\n");7 exit(1);8 }9 av_register_all(); //注册所有ffmpeg的解码器10 /* 初始化SDL,这里只实用了AUDIO,如果有视频,好需要SDL_INIT_VIDEO等等 */11 if(SDL_Init(SDL_INIT_AUDIO)){12 fprintf(stderr, "Count not initialize SDL - %s\n", SDL_GetError());13 exit(1);14 }15 is_strlcpy(is->filename, argv[1], sizeof(is->filename));16 /* 创建一个SDL线程来做视频解码工作,主线程进入SDL事件循环 */17 is->parse_tid = SDL_CreateThread(decode_thread, is);18 if(!is->parse_tid){19 SDL_WaitEvent(&event);20 switch(event.type){21 case FF_QUIT_EVENT:22 case SDL_QUIT:23 is->quit = 1;24 SDL_Quit();25 exit(0);26 break;27 default:28 break;29 }30 }31 return 0;32}decode_thread()读取文件信息和音频包
1static int decode_thread(void *arg){2 VideoState *is = (VideoState*)arg;3 AVFormatContext *ic = NULL;4 AVPacket pkt1, *packet = &pkt1;5 int ret, i, audio_index = -1;67 is->audioStream = -1;8 global_video_state = is; 9 /* 使用ffmpeg打开视频,解码器等 常规工作 */10 if(avFormat_open_input(&ic, is->filename, NULL, NULL) != 0) {11 fprintf(stderr, "open file error: %s\n", is->filename);12 return -1;13 }14 is->ic = ic;15 if(avformat_find_stream_info(ic, NULL) < 0){16 fprintf(stderr, "find stream info error\n");17 return -1;18 }19 av_dump_format(ic, 0, is->filename, 0);20 for(i = 0; i < ic->nb_streams; i++){21 if(ic->streams[i])->codec->codec_type == AVMEDIA_TYPE_AUDIO && audio_index == -1){22 audio_index = i;23 break;24 }25 }26 if(audio_index >= 0) {27 /* 所有设置SDL音频流信息的步骤都在这个函数里完成 */28 stream_component_open(is, audio_index);29 }30 if(is->audioStream < 0){31 fprintf(stderr, "could not open codecs for file: %s\n", is->filename);32 goto fail;33 }34 /* 读包的主循环, av_read_frame不停的从文件中读取数据包(这里只取音频包)*/35 for(;;){36 if(is->quit) break;37 /* 这里audioq.size是指队列中的所有数据包带的音频数据的总量,并不是包的数量 */38 if(is->audioq.size > MAX_AUDIO_SIZE){39 SDL_Delay(10); // 毫秒40 continue;41 }42 ret = av_read_frame(is->ic, packet);43 if(ret < 0){44 if(ret == AVERROR_EOF || url_feof(is->ic->pb)) break;45 if(is->ic->pb && is->ic->pb->error) break;46 contiue; 47 } 48 if(packet->stream_index == is->audioStream){49 packet_queue_put(&is->audioq, packet);50 } else{51 av_free_packet(packet);52 }53 }54 while(!is->quit) SDL_Delay(100);55fail: {56 SDL_Event event;57 event.type = FF_QUIT_EVENT;58 event.user.data1 = is;59 SDL_PushEvent(&event);60 }61 return 0;62}stream_component_open():设置音频参数和打开设备
1int stream_component_open(videoState *is, int stream_index){2 AVFormatContext *ic = is->ic;3 AVCodecContext *codecCtx;4 AVCodec *codec;5 /* 在用SDL_OpenAudio()打开音频设备的时候需要这两个参数*/6 /* wanted_spec是我们期望设置的属性,spec是系统最终接受的参数 */7 /* 我们需要检查系统接受的参数是否正确 */8 SDL_AudioSpec wanted_spec, spec;9 int64_t wanted_channel_layout = 0; // 声道布局(SDL中的具体定义见“FFMPEG结构体”部分) 10 int wanted_nb_channels; // 声道数11 /* SDL支持的声道数为 1, 2, 4, 6 */12 /* 后面我们会使用这个数组来纠正不支持的声道数目 */13 const int next_nb_channels[] = { 0, 0, 1, 6, 2, 6, 4, 6 }; 1415 if(stream_index < 0 || stream_index >= ic->nb_streams) return -1;16 codecCtx = ic->streams[stream_index]->codec;17 wanted_nb_channels = codecCtx->channels;18 if(!wanted_channel_layout || wanted_nb_channels != av_get_channel_layout_nb_channels(wanted_channel_layout)) {19 wanted_channel_layout = av_get_default_channel_lauout(wanted_channel_nb_channels);20 wanted_channel_layout &= ~AV_CH_LAYOUT_STEREO_DOWNMIX;21 }22 wanted_spec.channels = av_get_channels_layout_nb_channels(wanted_channel_layout);23 wanted_spec.freq = codecCtx->sample_rate;24 if(wanted_spec.freq <= 0 || wanted_spec.channels <=0){25 fprintf(stderr, "Invaild sample rate or channel count!\n");26 return -1;27 }28 wanted_spec.format = AUDIO_S16SYS; // 具体含义请查看“SDL宏定义”部分29 wanted_spec.silence = 0; // 0指示静音30 wanted_spec.samples = SDL_AUDIO_BUFFER_SIZE; // 自定义SDL缓冲区大小31 wanted_spec.callback = audio_callback; // 音频解码的关键回调函数32 wanted_spec.userdata = is; // 传给上面回调函数的外带数据3334 /* 打开音频设备,这里使用一个while来循环尝试打开不同的声道数(由上面 */35 /* next_nb_channels数组指定)直到成功打开,或者全部失败 */36 while(SDL_OpenAudio(&wanted_spec, &spec) < 0){37 fprintf(stderr, "SDL_OpenAudio(%d channels): %s\n", wanted_spec.channels, SDL_GetError());38 wanted_spec.channels = next_nb_channels[FFMIN(7, wanted_spec.channels)]; // FFMIN()由ffmpeg定义的宏,返回较小的数39 if(!wanted_spec.channels){40 fprintf(stderr, "No more channel to try\n");41 return -1;42 }43 wanted_channel_layout = av_get_default_channel_layout(wanted_spec.channels);44 }45 /* 检查实际使用的配置(保存在spec,由SDL_OpenAudio()填充) */46 if(spec.format != AUDIO_S16SYS){47 fprintf(stderr, "SDL advised audio format %d is not supported\n", spec.format);48 return -1;49 }50 if(spec.channels != wanted_spec.channels) {51 wanted_channel_layout = av_get_default_channel_layout(spec.channels);52 if(!wanted_channel_layout){53 fprintf(stderr, "SDL advised channel count %d is not support\n", spec.channels);54 return -1;55 }56 }57 /* 把设置好的参数保存到大结构中 */58 is->audio_src_fmt = is->audio_tgt_fmt = AV_SAMPLE_FMT_S16;59 is->audio_src_freq = is->audio_tgt_freq = spec.freq;60 is->audio_src_channel_layout = is->audio_tgt_layout = wanted_channel_layout;61 is->audio_src_channels = is->audio_tat_channels = spec.channels;6263 codec = avcodec_find_decoder(codecCtx>codec_id);64 if(!codec || (avcodec_open2(codecCtx, codec, NULL) < 0)){65 fprintf(stderr, "Unsupported codec!\n");66 return -1;67 }68 ic->streams[stream_index]->discard = AVDISCARD_DEFAULT; //具体含义请查看“FFMPEG宏定义”部分69 is->audioStream = stream_index;70 is->audio_st = ic->streams[stream_index];71 is->audio_buf_size = 0;72 is->audio_buf_index = 0;73 memset(&is->audio_pkt, 0, sizeof(is->audio_pkt));74 packet_queue_init(&is->audioq);75 SDL_PauseAudio(0); // 开始播放静音76}audio_callback(): 回调函数,向SDL缓冲区填充数据
1void audio_callback(void *userdata, Uint8 *stream, int len){2 VideoState *is = (VideoState*)userdata;3 int len1, audio_data_size;45 /* len是由SDL传入的SDL缓冲区的大小,如果这个缓冲未满,我们就一直往里填充数据 */6 while(len > 0){7 /* audio_buf_index 和 audio_buf_size 标示我们自己用来放置解码出来的数据的缓冲区,*/8 /* 这些数据待copy到SDL缓冲区, 当audio_buf_index >= audio_buf_size的时候意味着我*/9 /* 们的缓冲为空,没有数据可供copy,这时候需要调用audio_decode_frame来解码出更10 /* 多的桢数据 */11 if(is->audio_buf_index >= is->audio_buf_size){12 audio_data_size = audio_decode_frame(is);13 /* audio_data_size < 0 标示没能解码出数据,我们默认播放静音 */14 is(audio_data_size < 0){15 is->audio_buf_size = 1024;16 /* 清零,静音 */17 memset(is->audio_buf, 0, is->audio_buf_size);18 } else{19 is->audio_buf_size = audio_data_size;20 }21 is->audio_buf_index = 0;22 }23 /* 查看stream可用空间,决定一次copy多少数据,剩下的下次继续copy */24 len1 = is->audio_buf_size - is->audio_buf_index;25 if(len1 > len) len1 = len;2627 memcpy(stream, (uint8_t*)is->audio_buf + is->audio_buf_index, len1);28 len -= len1;29 stream += len1;30 is->audio_buf_index += len1;31 }32}audio_decode_frame():解码音频
1int audio_decode_frame(VideoState *is){2 int len1, len2, decoded_data_size;3 AVPacket *pkt = &is->audio_pkt;4 int got_frame = 0;5 int64_t dec_channel_layout;6 int wanted_nb_samples, resampled_data_size;78 for(;;){9 while(is->audio_pkt_size > 0){10 if(!is->audio_frame){11 if(!(is->audio_frame = avacodec_alloc_frame())){12 return AVERROR(ENOMEM);13 }14 } else15 avcodec_get_frame_defaults(is->audio_frame);1617 len1 = avcodec_decode_audio4(is->audio_st_codec, is->audio_frame, got_frame, pkt);18 /* 解码错误,跳过整个包 */19 if(len1 < 0){20 is->audio_pkt_size = 0;21 break;22 }23 is->audio_pkt_data += len1;24 is->audio_pkt_size -= len1;25 if(!got_frame) continue;26 /* 计算解码出来的桢需要的缓冲大小 */27 decoded_data_size = av_samples_get_buffer_size(NULL,28 is->audio_frame_channels,29 is->audio_frame_nb_samples,30 is->audio_frame_format, 1);31 dec_channel_layout = (is->audio_frame->channel_layout && is->audio_frame->channels32 == av_get_channel_layout_nb_channels(is->audio_frame->channel_layout))33 ? is->audio_frame->channel_layout : av_get_default_channel_layout(is->audio_frame->channels); 34 wanted_nb_samples = is->audio_frame->nb_samples;35 if (is->audio_frame->format != is->audio_src_fmt || 36 dec_channel_layout != is->audio_src_channel_layout ||37 is->audio_frame->sample_rate != is->audio_src_freq || 38 (wanted_nb_samples != is->audio_frame->nb_samples && !is->swr_ctx)) {39 if (is->swr_ctx) swr_free(&is->swr_ctx);40 is->swr_ctx = swr_alloc_set_opts(NULL,41 is->audio_tgt_channel_layout,42 is->audio_tgt_fmt,43 is->audio_tgt_freq,44 dec_channel_layout,45 is->audio_frame->format,46 is->audio_frame->sample_rate,47 0, NULL);48 if (!is->swr_ctx || swr_init(is->swr_ctx) < 0) {49 fprintf(stderr, "swr_init() failed\n");50 break;51 }52 is->audio_src_channel_layout = dec_channel_layout;53 is->audio_src_channels = is->audio_st->codec->channels;54 is->audio_src_freq = is->audio_st->codec->sample_rate;55 is->audio_src_fmt = is->audio_st->codec->sample_fmt;56 }57 /* 这里我们可以对采样数进行调整,增加或者减少,一般可以用来做声画同步 */58 if (is->swr_ctx) {59 const uint8_t **in = (const uint8_t **)is->audio_frame->extended_data;60 uint8_t *out[] = { is->audio_buf2 };61 if (wanted_nb_samples != is->audio_frame->nb_samples) {62 if(swr_set_compensation(is->swr_ctx, 63 (wanted_nb_samples - is->audio_frame->nb_samples)*is->audio_tgt_freq/is->audio_frame->sample_rate,64 wanted_nb_samples * is->audio_tgt_freq/is->audio_frame->sample_rate) < 0) {65 fprintf(stderr, "swr_set_compensation() failed\n");66 break;67 }68 }69 len2 = swr_convert(is->swr_ctx, out, 70 sizeof(is->audio_buf2)/is->audio_tgt_channels/av_get_bytes_per_sample(is->audio_tgt_fmt), 71 in, is->audio_frame->nb_samples);72 if (len2 < 0) {73 fprintf(stderr, "swr_convert() failed\n");74 break;75 }76 if(len2 == sizeof(is->audio_buf2)/is->audio_tgt_channels/av_get_bytes_per_sample(is->audio_tgt_fmt)) {77 fprintf(stderr, "warning: audio buffer is probably too small\n");78 swr_init(is->swr_ctx);79 }80 is->audio_buf = is->audio_buf2;81 resampled_data_size = len2*is->audio_tgt_channels*av_get_bytes_per_sample(is->audio_tgt_fmt);82 } else {83 resampled_data_size = decoded_data_size;84 is->audio_buf = is->audio_frame->data[0];85 }86 /* 返回得到的数据 */87 return resampled_data_size;88 }89 if (pkt->data) av_free_packet(pkt);90 memset(pkt, 0, sizeof(*pkt));91 if (is->quit) return -1;92 if (packet_queue_get(&is->audioq, pkt, 1) < 0) return -1;93 is->audio_pkt_data = pkt->data;94 is->audio_pkt_size = pkt->size;9596 }97}FFMPEG结构体
channel_layout_map
1static const struct {2const char *name;3int nb_channels;4uint64_t layout;5} channel_layout_map[] = {6{ "mono", 1, AV_CH_LAYOUT_MONO },7{ "stereo", 2, AV_CH_LAYOUT_STEREO },8{ "2.1", 3, AV_CH_LAYOUT_2POINT1 },9{ "3.0", 3, AV_CH_LAYOUT_SURROUND },10{ "3.0(back)", 3, AV_CH_LAYOUT_2_1 },11{ "4.0", 4, AV_CH_LAYOUT_4POINT0 },12{ "quad", 4, AV_CH_LAYOUT_QUAD },13{ "quad(side)", 4, AV_CH_LAYOUT_2_2 },14{ "3.1", 4, AV_CH_LAYOUT_3POINT1 },15{ "5.0", 5, AV_CH_LAYOUT_5POINT0_BACK },16{ "5.0(side)", 5, AV_CH_LAYOUT_5POINT0 },17{ "4.1", 5, AV_CH_LAYOUT_4POINT1 },18{ "5.1", 6, AV_CH_LAYOUT_5POINT1_BACK },19{ "5.1(side)", 6, AV_CH_LAYOUT_5POINT1 },20{ "6.0", 6, AV_CH_LAYOUT_6POINT0 },21{ "6.0(front)", 6, AV_CH_LAYOUT_6POINT0_FRONT },22{ "hexagonal", 6, AV_CH_LAYOUT_HEXAGONAL },23{ "6.1", 7, AV_CH_LAYOUT_6POINT1 },24{ "6.1", 7, AV_CH_LAYOUT_6POINT1_BACK },25{ "6.1(front)", 7, AV_CH_LAYOUT_6POINT1_FRONT },26{ "7.0", 7, AV_CH_LAYOUT_7POINT0 },27{ "7.0(front)", 7, AV_CH_LAYOUT_7POINT0_FRONT },28{ "7.1", 8, AV_CH_LAYOUT_7POINT1 },29{ "7.1(wide)", 8, AV_CH_LAYOUT_7POINT1_WIDE },30{ "octagonal", 8, AV_CH_LAYOUT_OCTAGONAL },31{ "downmix", 2, AV_CH_LAYOUT_STEREO_DOWNMIX, },32};FFMPEG宏定义
Audio channel convenience macros
1#define AV_CH_LAYOUT_MONO (AV_CH_FRONT_CENTER)2 #define AV_CH_LAYOUT_STEREO (AV_CH_FRONT_LEFT|AV_CH_FRONT_RIGHT)3 #define AV_CH_LAYOUT_2POINT1 (AV_CH_LAYOUT_STEREO|AV_CH_LOW_FREQUENCY)4 #define AV_CH_LAYOUT_2_1 (AV_CH_LAYOUT_STEREO|AV_CH_BACK_CENTER)5 #define AV_CH_LAYOUT_SURROUND (AV_CH_LAYOUT_STEREO|AV_CH_FRONT_CENTER)6 #define AV_CH_LAYOUT_3POINT1 (AV_CH_LAYOUT_SURROUND|AV_CH_LOW_FREQUENCY)7 #define AV_CH_LAYOUT_4POINT0 (AV_CH_LAYOUT_SURROUND|AV_CH_BACK_CENTER)8 #define AV_CH_LAYOUT_4POINT1 (AV_CH_LAYOUT_4POINT0|AV_CH_LOW_FREQUENCY)9 #define AV_CH_LAYOUT_2_2 (AV_CH_LAYOUT_STEREO|AV_CH_SIDE_LEFT|AV_CH_SIDE_RIGHT)10 #define AV_CH_LAYOUT_QUAD (AV_CH_LAYOUT_STEREO|AV_CH_BACK_LEFT|AV_CH_BACK_RIGHT)11 #define AV_CH_LAYOUT_5POINT0 (AV_CH_LAYOUT_SURROUND|AV_CH_SIDE_LEFT|AV_CH_SIDE_RIGHT)12 #define AV_CH_LAYOUT_5POINT1 (AV_CH_LAYOUT_5POINT0|AV_CH_LOW_FREQUENCY)13 #define AV_CH_LAYOUT_5POINT0_BACK (AV_CH_LAYOUT_SURROUND|AV_CH_BACK_LEFT|AV_CH_BACK_RIGHT)14 #define AV_CH_LAYOUT_5POINT1_BACK (AV_CH_LAYOUT_5POINT0_BACK|AV_CH_LOW_FREQUENCY)15 #define AV_CH_LAYOUT_6POINT0 (AV_CH_LAYOUT_5POINT0|AV_CH_BACK_CENTER)16 #define AV_CH_LAYOUT_6POINT0_FRONT (AV_CH_LAYOUT_2_2|AV_CH_FRONT_LEFT_OF_CENTER|AV_CH_FRONT_RIGHT_OF_CENTER)17 #define AV_CH_LAYOUT_HEXAGONAL (AV_CH_LAYOUT_5POINT0_BACK|AV_CH_BACK_CENTER)18 #define AV_CH_LAYOUT_6POINT1 (AV_CH_LAYOUT_5POINT1|AV_CH_BACK_CENTER)19 #define AV_CH_LAYOUT_6POINT1_BACK (AV_CH_LAYOUT_5POINT1_BACK|AV_CH_BACK_CENTER)20 #define AV_CH_LAYOUT_6POINT1_FRONT (AV_CH_LAYOUT_6POINT0_FRONT|AV_CH_LOW_FREQUENCY)21 #define AV_CH_LAYOUT_7POINT0 (AV_CH_LAYOUT_5POINT0|AV_CH_BACK_LEFT|AV_CH_BACK_RIGHT)22 #define AV_CH_LAYOUT_7POINT0_FRONT (AV_CH_LAYOUT_5POINT0|AV_CH_FRONT_LEFT_OF_CENTER|AV_CH_FRONT_RIGHT_OF_CENTER)23 #define AV_CH_LAYOUT_7POINT1 (AV_CH_LAYOUT_5POINT1|AV_CH_BACK_LEFT|AV_CH_BACK_RIGHT)24#define AV_CH_LAYOUT_7POINT1_WIDE (AV_CH_LAYOUT_5POINT1|AV_CH_FRONT_LEFT_OF_CENTER|AV_CH_FRONT_RIGHT_OF_CENTER)25#define AV_CH_LAYOUT_7POINT1_WIDE_BACK (AV_CH_LAYOUT_5POINT1_BACK|AV_CH_FRONT_LEFT_OF_CENTER|AV_CH_FRONT_RIGHT_OF_CENTER)26#define AV_CH_LAYOUT_OCTAGONAL (AV_CH_LAYOUT_5POINT0|AV_CH_BACK_LEFT|AV_CH_BACK_CENTER|AV_CH_BACK_RIGHT)27#define AV_CH_LAYOUT_STEREO_DOWNMIX (AV_CH_STEREO_LEFT|AV_CH_STEREO_RIGHT)SDL宏定义
SDL_AudioSpec format
查看源代码 打印帮助1AUDIO_U8 Unsigned 8-bit samples2AUDIO_S8 Signed 8-bit samples3AUDIO_U16LSB Unsigned 16-bit samples, in little-endian byte order4AUDIO_S16LSB Signed 16-bit samples, in little-endian byte order5AUDIO_U16MSB Unsigned 16-bit samples, in big-endian byte order6AUDIO_S16MSB Signed 16-bit samples, in big-endian byte order7AUDIO_U16 same as AUDIO_U16LSB (for backwards compatability probably)8AUDIO_S16 same as AUDIO_S16LSB (for backwards compatability probably)9AUDIO_U16SYS Unsigned 16-bit samples, in system byte order10AUDIO_S16SYS Signed 16-bit samples, in system byte ordergit clone https://github.com/lnmcc/musicPlayer.git
RFID管理系统集成商 RFID中间件 条码系统中间层 物联网软件集成