ffmpeg_sample解讀_filter_audio

title: ffmpeg_sample解讀_filter_audio
date: 2020-10-28 10:15:02
tags: [讀書筆記]
typora-copy-images-to: ./imgs
typora-root-url: ./imgs

總結

本示例將生成一段正弦波的音頻PCM數據，然後把PCM數據經過如下filterchain的處理：(input) -> abuffer -> volume -> aformat -> abuffersink -> (output)，並把輸出的每一幀PCM數據的MD5值打印出來。

這裡就涉及了過濾器（libavfilter）相關的API。

流程圖

graph TB
 afa[av_frame_alloc]
 -->ama[av_md5_alloc]
 -->ifg[init_filter_graph]
 -->afga[avfilter_graph_alloc]
 -->afgbn[avfilter_get_by_name]
 -->afaf[avfilter_graph_alloc_filter]
 -->afis[avfilter_init_str]
 -->afl[avfilter_link]
 -->afgc[avfilter_graph_config]
 -->gi[get_input]
 -->abaf[av_buffersrc_add_frame]
 -->abgf[av_buffersink_get_frame]
 -->free[free_all]

image-20201028162609381

其實相對好理解。這裡先拿到四個過濾器，為每個過濾器創建過濾器上下文並設置參數（設置參數用了三種不同的方式），然後把四個過濾器上下文連接起來，最後把合成的正弦波幀送入第一個過濾器，再從最後一個過濾器中取出數據，打印MD5。

代碼



/**
 * @file
 * libavfilter API usage example.
 *
 * @example filter_audio.c
 * This example will generate a sine wave audio,
 * pass it through a simple filter chain, and then compute the MD5 checksum of
 * the output data.
 *
 * The filter chain it uses is:
 * (input) -> abuffer -> volume -> aformat -> abuffersink -> (output)
 *
 * abuffer: This provides the endpoint where you can feed the decoded samples.
 * volume: In this example we hardcode it to 0.90.
 * aformat: This converts the samples to the samplefreq, channel layout,
 *          and sample format required by the audio device.
 * abuffersink: This provides the endpoint where you can read the samples after
 *              they have passed through the filter chain.
 */

#include <inttypes.h>
#include <math.h>
#include <stdio.h>
#include <stdlib.h>

#include "libavutil/channel_layout.h"
#include "libavutil/md5.h"
#include "libavutil/mem.h"
#include "libavutil/opt.h"
#include "libavutil/samplefmt.h"

#include "libavfilter/avfilter.h"
#include "libavfilter/buffersink.h"
#include "libavfilter/buffersrc.h"

#define INPUT_SAMPLERATE     48000
#define INPUT_FORMAT         AV_SAMPLE_FMT_FLTP
#define INPUT_CHANNEL_LAYOUT AV_CH_LAYOUT_5POINT0

#define VOLUME_VAL 0.90

/**
 * Build and configure the linear filter chain
 *     abuffer ("src") -> volume -> aformat -> abuffersink ("sink").
 *
 * An AVFilter is the filter definition looked up by name; an AVFilterContext
 * is an instance of that filter created inside a graph. Each of the four
 * instances is allocated in the graph, given its options, initialized and
 * finally linked to its neighbour.
 *
 * @param graph  receives the configured filter graph on success; the caller
 *               releases it with avfilter_graph_free()
 * @param src    receives the abuffer instance that frames are pushed into
 * @param sink   receives the abuffersink instance that frames are pulled from
 * @return 0 on success, a negative AVERROR code on failure. On failure the
 *         partially built graph is freed and the output parameters are left
 *         untouched.
 */
static int init_filter_graph(AVFilterGraph **graph, AVFilterContext **src,
                             AVFilterContext **sink) {
    AVFilterGraph *filter_graph;
    AVFilterContext *abuffer_ctx;
    const AVFilter *abuffer;
    AVFilterContext *volume_ctx;
    const AVFilter *volume;
    AVFilterContext *aformat_ctx;
    const AVFilter *aformat;
    AVFilterContext *abuffersink_ctx;
    const AVFilter *abuffersink;

    AVDictionary *options_dict = NULL;
    /* Plain char buffers: they are handed to APIs that take char pointers. */
    char options_str[1024];
    char ch_layout[64];

    int err;

    /* Create a new filtergraph, which will contain all the filters. */
    filter_graph = avfilter_graph_alloc();
    if (!filter_graph) {
        fprintf(stderr, "Unable to create filter graph.\n");
        return AVERROR(ENOMEM);
    }

    /* ---- 1: abuffer ----
     * Create the abuffer filter;
     * it will be used for feeding the data into the graph. */
    abuffer = avfilter_get_by_name("abuffer");
    if (!abuffer) {
        fprintf(stderr, "Could not find the abuffer filter.\n");
        err = AVERROR_FILTER_NOT_FOUND;
        goto fail;
    }

    /* Instantiate it inside the graph under the name "src". */
    abuffer_ctx = avfilter_graph_alloc_filter(filter_graph, abuffer, "src");
    if (!abuffer_ctx) {
        fprintf(stderr, "Could not allocate the abuffer instance.\n");
        err = AVERROR(ENOMEM);
        goto fail;
    }

    /* Set the filter options through the AVOptions API: channel layout,
     * sample format, time base and sample rate. The time base is the
     * reciprocal of the sample rate. */
    av_get_channel_layout_string(ch_layout, sizeof(ch_layout), 0, INPUT_CHANNEL_LAYOUT);
    av_opt_set(abuffer_ctx, "channel_layout", ch_layout, AV_OPT_SEARCH_CHILDREN);
    av_opt_set(abuffer_ctx, "sample_fmt", av_get_sample_fmt_name(INPUT_FORMAT),
               AV_OPT_SEARCH_CHILDREN);
    av_opt_set_q(abuffer_ctx, "time_base", (AVRational) {1, INPUT_SAMPLERATE},
                 AV_OPT_SEARCH_CHILDREN);
    av_opt_set_int(abuffer_ctx, "sample_rate", INPUT_SAMPLERATE, AV_OPT_SEARCH_CHILDREN);

    /* Now initialize the filter; we pass NULL options, since we have already
     * set all the options above. */
    err = avfilter_init_str(abuffer_ctx, NULL);
    if (err < 0) {
        fprintf(stderr, "Could not initialize the abuffer filter.\n");
        goto fail;
    }

    /* ---- 2: volume ----
     * Create volume filter. */
    volume = avfilter_get_by_name("volume");
    if (!volume) {
        fprintf(stderr, "Could not find the volume filter.\n");
        err = AVERROR_FILTER_NOT_FOUND;
        goto fail;
    }

    /* Instantiate it inside the graph under the name "volume". */
    volume_ctx = avfilter_graph_alloc_filter(filter_graph, volume, "volume");
    if (!volume_ctx) {
        fprintf(stderr, "Could not allocate the volume instance.\n");
        err = AVERROR(ENOMEM);
        goto fail;
    }

    /* A different way of passing the options is as key/value pairs in a
     * dictionary. The dictionary is freed right after the init call,
     * whether or not the call succeeded. */
    av_dict_set(&options_dict, "volume", AV_STRINGIFY(VOLUME_VAL), 0);
    err = avfilter_init_dict(volume_ctx, &options_dict);
    av_dict_free(&options_dict);
    if (err < 0) {
        fprintf(stderr, "Could not initialize the volume filter.\n");
        goto fail;
    }

    /* ---- 3: aformat ----
     * Create the aformat filter;
     * it ensures that the output is of the format we want. */
    aformat = avfilter_get_by_name("aformat");
    if (!aformat) {
        fprintf(stderr, "Could not find the aformat filter.\n");
        err = AVERROR_FILTER_NOT_FOUND;
        goto fail;
    }

    /* Instantiate it inside the graph under the name "aformat". */
    aformat_ctx = avfilter_graph_alloc_filter(filter_graph, aformat, "aformat");
    if (!aformat_ctx) {
        fprintf(stderr, "Could not allocate the aformat instance.\n");
        err = AVERROR(ENOMEM);
        goto fail;
    }

    /* A third way of passing the options is in a string of the form
     * key1=value1:key2=value2.... */
    snprintf(options_str, sizeof(options_str),
             "sample_fmts=%s:sample_rates=%d:channel_layouts=0x%"PRIx64,
             av_get_sample_fmt_name(AV_SAMPLE_FMT_S16), 44100,
             (uint64_t) AV_CH_LAYOUT_STEREO);
    err = avfilter_init_str(aformat_ctx, options_str);
    if (err < 0) {
        av_log(NULL, AV_LOG_ERROR, "Could not initialize the aformat filter.\n");
        goto fail;
    }

    /* ---- 4: abuffersink ----
     * Finally create the abuffersink filter;
     * it will be used to get the filtered data out of the graph. */
    abuffersink = avfilter_get_by_name("abuffersink");
    if (!abuffersink) {
        fprintf(stderr, "Could not find the abuffersink filter.\n");
        err = AVERROR_FILTER_NOT_FOUND;
        goto fail;
    }

    /* Instantiate it inside the graph under the name "sink". */
    abuffersink_ctx = avfilter_graph_alloc_filter(filter_graph, abuffersink, "sink");
    if (!abuffersink_ctx) {
        fprintf(stderr, "Could not allocate the abuffersink instance.\n");
        err = AVERROR(ENOMEM);
        goto fail;
    }

    /* This filter takes no options. */
    err = avfilter_init_str(abuffersink_ctx, NULL);
    if (err < 0) {
        fprintf(stderr, "Could not initialize the abuffersink instance.\n");
        goto fail;
    }

    /* Connect the filters;
     * in this simple case the filters just form a linear chain, so the
     * output pad 0 of each filter feeds input pad 0 of the next one. */
    err = avfilter_link(abuffer_ctx, 0, volume_ctx, 0);
    if (err >= 0)
        err = avfilter_link(volume_ctx, 0, aformat_ctx, 0);
    if (err >= 0)
        err = avfilter_link(aformat_ctx, 0, abuffersink_ctx, 0);
    if (err < 0) {
        fprintf(stderr, "Error connecting filters\n");
        goto fail;
    }

    /* Configure the graph. */
    err = avfilter_graph_config(filter_graph, NULL);
    if (err < 0) {
        av_log(NULL, AV_LOG_ERROR, "Error configuring the filter graph\n");
        goto fail;
    }

    *graph = filter_graph;
    /* The input and output endpoints of the chain. */
    *src = abuffer_ctx;
    *sink = abuffersink_ctx;

    return 0;

fail:
    /* Releases the graph together with the filter instances allocated in it. */
    avfilter_graph_free(&filter_graph);
    return err;
}

/* Consume one filtered frame: print the MD5 checksum of each of its data
 * planes to stdout, one "plane N: 0x<hex>" line per plane, followed by an
 * empty line. A planar frame has one plane per channel; a packed frame has a
 * single plane holding all channels interleaved. Always returns 0. */
static int process_output(struct AVMD5 *md5, AVFrame *frame) {
    const int is_planar = av_sample_fmt_is_planar(frame->format);
    const int nb_channels = av_get_channel_layout_nb_channels(frame->channel_layout);
    const int sample_size = av_get_bytes_per_sample(frame->format);
    int nb_planes;
    int bytes_per_plane;
    int plane;

    if (is_planar) {
        nb_planes = nb_channels;
        bytes_per_plane = sample_size * frame->nb_samples * 1;
    } else {
        nb_planes = 1;
        bytes_per_plane = sample_size * frame->nb_samples * nb_channels;
    }

    for (plane = 0; plane < nb_planes; plane++) {
        uint8_t digest[16];
        size_t k = 0;

        /* The context is re-initialized for every plane; the digest itself
         * is produced by the one-shot av_md5_sum() call. */
        av_md5_init(md5);
        av_md5_sum(digest, frame->extended_data[plane], bytes_per_plane);

        fprintf(stdout, "plane %d: 0x", plane);
        while (k < sizeof(digest)) {
            fprintf(stdout, "%02X", digest[k]);
            k++;
        }
        fprintf(stdout, "\n");
    }
    fprintf(stdout, "\n");

    return 0;
}

/* Construct a frame of audio data to be filtered;
 * this simple example just synthesizes a sine wave (the data is
 * deterministic, not random).
 *
 * frame     - frame to fill; its audio properties are set here and a data
 *             buffer is allocated for it with av_frame_get_buffer()
 * frame_num - zero-based index of the frame; used for the pts and the phase
 *
 * Returns 0 on success or the negative error code from av_frame_get_buffer(). */
static int get_input(AVFrame *frame, int frame_num) {
    int err, nb_channels, ch, n;

/* Samples per channel in every generated frame. Defined here but also used
 * by filter_audio_main() to turn a duration into a frame count. */
#define FRAME_SIZE 1024

    /* Set up the frame properties and allocate the buffer for the data. */
    frame->sample_rate = INPUT_SAMPLERATE;
    frame->format = INPUT_FORMAT;
    frame->channel_layout = INPUT_CHANNEL_LAYOUT;
    frame->nb_samples = FRAME_SIZE;
    /* Widen before multiplying so large frame numbers cannot overflow int. */
    frame->pts = (int64_t) frame_num * FRAME_SIZE;

    err = av_frame_get_buffer(frame, 0);
    if (err < 0)
        return err;

    /* Fill the data for each channel. The channel count is derived from the
     * layout rather than hard-coded, so it follows INPUT_CHANNEL_LAYOUT.
     * The float cast relies on INPUT_FORMAT being planar float
     * (AV_SAMPLE_FMT_FLTP): one float plane per channel. */
    nb_channels = av_get_channel_layout_nb_channels(frame->channel_layout);
    for (ch = 0; ch < nb_channels; ch++) {
        float *data = (float *) frame->extended_data[ch];

        /* Channel ch carries (ch + 1) sine periods per FRAME_SIZE samples. */
        for (n = 0; n < frame->nb_samples; n++)
            data[n] = sin(2 * M_PI * (frame_num + n) * (ch + 1) / FRAME_SIZE);
    }

    return 0;
}

/**
 * Generate sine-wave PCM audio, pass it through the filter chain
 * abuffer -> volume -> aformat -> abuffersink and print the MD5 checksum of
 * every output frame.
 *
 * libavfilter calls used to build the chain:
 *  - avfilter_graph_alloc_filter: create a filter instance in a filtergraph.
 *  - avfilter_init_str: initialize a filter with the supplied string arguments.
 *  - avfilter_init_dict: initialize a filter with the supplied AVDictionary.
 *  - avfilter_link: link two filters together.
 *
 * Author: smallest_one
 * Link: http://www.reibang.com/p/f677992bbde9
 * Source: Jianshu
 * Copyright belongs to the author. For commercial reprints contact the author
 * for authorization; for non-commercial reprints please credit the source.
 *
 * @param argc number of command-line arguments; at least 2 is required
 * @param argv argv[1] is the duration of audio to generate, in seconds
 * @return 0 on success, 1 on a usage error or any processing failure
 */
int filter_audio_main(int argc, char *argv[]) {
    /* Everything released in the common cleanup path starts out NULL so the
     * cleanup is safe no matter how far setup got. */
    struct AVMD5 *md5 = NULL;
    AVFilterGraph *graph = NULL;
    AVFilterContext *src = NULL, *sink = NULL;
    AVFrame *frame = NULL;
    char errstr[1024];
    float duration;
    int err, nb_frames, i;
    int ret = 1;

    if (argc < 2) {
        fprintf(stderr, "Usage: %s <duration>\n", argv[0]);
        return 1;
    }

    /* Convert the requested duration into a whole number of frames. */
    duration = atof(argv[1]);
    nb_frames = duration * INPUT_SAMPLERATE / FRAME_SIZE;
    if (nb_frames <= 0) {
        fprintf(stderr, "Invalid duration: %s\n", argv[1]);
        return 1;
    }

    /* Allocate the frame we will be using to store the data. */
    frame = av_frame_alloc();
    if (!frame) {
        fprintf(stderr, "Error allocating the frame\n");
        goto end;
    }

    md5 = av_md5_alloc();
    if (!md5) {
        fprintf(stderr, "Error allocating the MD5 context\n");
        goto end;
    }

    /* Set up the filtergraph. src is the first filter of the chain (input),
     * sink is the last one (output). */
    err = init_filter_graph(&graph, &src, &sink);
    if (err < 0) {
        fprintf(stderr, "Unable to init filter graph:");
        goto fail;
    }

    /* the main filtering loop, one generated frame per iteration */
    for (i = 0; i < nb_frames; i++) {
        /* get an input frame to be filtered */
        err = get_input(frame, i);
        if (err < 0) {
            fprintf(stderr, "Error generating input frame:");
            goto fail;
        }

        /* Send the frame to the input of the filtergraph. */
        err = av_buffersrc_add_frame(src, frame);
        if (err < 0) {
            av_frame_unref(frame);
            fprintf(stderr, "Error submitting the frame to the filtergraph:");
            goto fail;
        }

        /* Get all the filtered output that is available; the same AVFrame
         * is reused to receive each filtered frame. */
        while ((err = av_buffersink_get_frame(sink, frame)) >= 0) {
            /* now do something with our filtered frame: print its MD5 */
            err = process_output(md5, frame);
            if (err < 0) {
                fprintf(stderr, "Error processing the filtered frame:");
                goto fail;
            }
            av_frame_unref(frame);
        }

        if (err == AVERROR(EAGAIN)) {
            /* Need to feed more frames in. */
            continue;
        } else if (err == AVERROR_EOF) {
            /* Nothing more to do, finish. */
            break;
        } else if (err < 0) {
            /* An error occurred. */
            fprintf(stderr, "Error filtering the data:");
            goto fail;
        }
    }
    /* NOTE(review): the source is never sent an end-of-stream marker, so any
     * samples still held inside the graph are presumably not drained here. */

    ret = 0;
    goto end;

fail:
    /* Complete the message started above with the textual error description. */
    av_strerror(err, errstr, sizeof(errstr));
    fprintf(stderr, "%s\n", errstr);

end:
    /* Single cleanup path for success and failure; all three calls are
     * no-ops on pointers that are still NULL. */
    avfilter_graph_free(&graph);
    av_frame_free(&frame);
    av_freep(&md5);

    return ret;
}