前往小程序,Get更优阅读体验!
立即前往
首页
学习
活动
专区
工具
TVP
发布
社区首页 >专栏 >2023-04-15:ffmpeg的filter_audio.c的功能是生成一个正弦波音频,然后通过简单的滤镜链,最后输出数据的MD5校验和。请用go语言改写。

2023-04-15:ffmpeg的filter_audio.c的功能是生成一个正弦波音频,然后通过简单的滤镜链,最后输出数据的MD5校验和。请用go语言改写。

原创
作者头像
福大大架构师每日一题
发布2023-04-15 20:29:35
2950
发布2023-04-15 20:29:35
举报

2023-04-15:ffmpeg的filter_audio.c的功能是生成一个正弦波音频,然后通过简单的滤镜链,最后输出数据的MD5校验和。请用go语言改写。

答案2023-04-15:

代码见github/moonfdd/ffmpeg-go库。

以下是通过 Go 语言重新实现 ffmpeg 的 filter_audio.c 功能的步骤:

  1. 导入必要的依赖包和定义常量和变量。
  2. 初始化 FFmpeg 库文件路径。
  3. 创建一个音频滤镜图,并将 abuffer、volume 和 aformat 滤镜连接起来。其中,abuffer 滤镜用于获取输入音频采样,volume 滤镜用于调节音频音量,aformat 滤镜用于设置输出音频格式。
  4. 创建输出音频流的 AVCodecContext 上下文,并设置相关属性。
  5. 使用 avcodec_find_encoder_by_name 函数查找 PCM S16LE 编码器,然后创建编码器的 AVCodec 上下文。
  6. 打开编码器并写入头部信息。
  7. 循环读取音频帧,将其发送到音频滤镜图进行处理。
  8. 从滤镜图中获取输出音频帧,并将其编码为 PCM S16LE 格式。
  9. 计算输出音频帧的 MD5 校验和,并将其打印到标准输出上。
  10. 释放资源,结束程序运行。

以上就是使用 Go 语言对 filter_audio.c 文件进行重新实现的步骤。

命令如下:

代码语言:shell
复制
go run ./examples/internalexamples/filter_audio/main.go 1

go代码如下:

代码语言:go
复制
package main

import (
	"fmt"
	"math"
	"os"
	"strconv"
	"unsafe"

	"github.com/moonfdd/ffmpeg-go/ffcommon"
	"github.com/moonfdd/ffmpeg-go/libavfilter"
	"github.com/moonfdd/ffmpeg-go/libavutil"
)

func main0() (ret ffcommon.FInt) {
	var md5 *libavutil.AVMD5
	var graph *libavfilter.AVFilterGraph
	var src, sink *libavfilter.AVFilterContext
	var frame *libavutil.AVFrame
	var errstr [1024]ffcommon.FUint8T
	var duration ffcommon.FFloat
	var err, nb_frames, i ffcommon.FInt

	if len(os.Args) < 2 {
		fmt.Printf("Usage: %s <duration>\n", os.Args[0])
		return 1
	}

	f, err2 := strconv.ParseFloat(os.Args[1], 32)
	if err2 != nil {
		// handle error
		return 1
	}
	duration = float32(f)
	nb_frames = int32(float64(duration) * INPUT_SAMPLERATE / FRAME_SIZE)
	if nb_frames <= 0 {
		fmt.Printf("Invalid duration: %s\n", os.Args[1])
		return 1
	}

	/* Allocate the frame we will be using to store the data. */
	frame = libavutil.AvFrameAlloc()
	if frame == nil {
		fmt.Printf("Error allocating the frame\n")
		return 1
	}

	md5 = libavutil.AvMd5Alloc()
	if md5 == nil {
		fmt.Printf("Error allocating the MD5 context\n")
		return 1
	}

	/* Set up the filtergraph. */
	err = init_filter_graph(&graph, &src, &sink)
	if err < 0 {
		fmt.Printf("Unable to init filter graph:")
		goto fail
	}

	/* the main filtering loop */
	for i = 0; i < nb_frames; i++ {
		// /* get an input frame to be filtered */
		err = get_input(frame, i)
		if err < 0 {
			fmt.Printf("Error generating input frame:")
			goto fail
		}

		/* Send the frame to the input of the filtergraph. */
		err = src.AvBuffersrcAddFrame(frame)
		if err < 0 {
			frame.AvFrameUnref()
			fmt.Printf("Error submitting the frame to the filtergraph:")
			goto fail
		}

		/* Get all the filtered output that is available. */
		err = sink.AvBuffersinkGetFrame(frame)
		for err >= 0 {
			/* now do something with our filtered frame */
			err = process_output(md5, frame)
			if err < 0 {
				fmt.Printf("Error processing the filtered frame:")
				goto fail
			}
			frame.AvFrameUnref()
			err = sink.AvBuffersinkGetFrame(frame)
		}

		if err == -libavutil.EAGAIN {
			/* Need to feed more frames in. */
			continue
		} else if err == libavutil.AVERROR_EOF {
			/* Nothing more to do, finish. */
			break
		} else if err < 0 {
			/* An error occurred. */
			fmt.Printf("Error filtering the data:")
			goto fail
		}
	}

	libavfilter.AvfilterGraphFree(&graph)
	libavutil.AvFrameFree(&frame)
	libavutil.AvFreep(uintptr(unsafe.Pointer(&md5)))

	return 0

fail:
	libavutil.AvStrerror(err, (*byte)(unsafe.Pointer(&errstr)), uint64(len(errstr)))
	fmt.Printf("%s\n", errstr)
	return 1
}

const INPUT_SAMPLERATE = 48000
const INPUT_FORMAT = libavutil.AV_SAMPLE_FMT_FLTP
const INPUT_CHANNEL_LAYOUT = libavutil.AV_CH_LAYOUT_5POINT0

const VOLUME_VAL = 0.90

func init_filter_graph(graph **libavfilter.AVFilterGraph, src **libavfilter.AVFilterContext,
	sink **libavfilter.AVFilterContext) ffcommon.FInt {
	var filter_graph *libavfilter.AVFilterGraph
	var abuffer_ctx *libavfilter.AVFilterContext
	var abuffer *libavfilter.AVFilter
	var volume_ctx *libavfilter.AVFilterContext
	var volume *libavfilter.AVFilter
	var aformat_ctx *libavfilter.AVFilterContext
	var aformat *libavfilter.AVFilter
	var abuffersink_ctx *libavfilter.AVFilterContext
	var abuffersink *libavfilter.AVFilter

	var options_dict *libavutil.AVDictionary
	var options_str string
	var ch_layout [64]ffcommon.FUint8T

	var err ffcommon.FInt

	/* Create a new filtergraph, which will contain all the filters. */
	filter_graph = libavfilter.AvfilterGraphAlloc()
	if filter_graph == nil {
		fmt.Printf("Unable to create filter graph.\n")
		return libavutil.ENOMEM
	}

	/* Create the abuffer filter;
	 * it will be used for feeding the data into the graph. */
	abuffer = libavfilter.AvfilterGetByName("abuffer")
	if abuffer == nil {
		fmt.Printf("Could not find the abuffer filter.\n")
		return libavutil.AVERROR_FILTER_NOT_FOUND
	}

	abuffer_ctx = filter_graph.AvfilterGraphAllocFilter(abuffer, "src")
	if abuffer_ctx == nil {
		fmt.Printf("Could not allocate the abuffer instance.\n")
		return -libavutil.ENOMEM
	}

	/* Set the filter options through the AVOptions API. */
	libavutil.AvGetChannelLayoutString((*byte)(unsafe.Pointer(&ch_layout)), int32(len(ch_layout)), 0, INPUT_CHANNEL_LAYOUT)
	libavutil.AvOptSet(uintptr(unsafe.Pointer(abuffer_ctx)), "channel_layout", ffcommon.StringFromPtr(uintptr(unsafe.Pointer(&ch_layout))), libavutil.AV_OPT_SEARCH_CHILDREN)
	libavutil.AvOptSet(uintptr(unsafe.Pointer(abuffer_ctx)), "sample_fmt", libavutil.AvGetSampleFmtName(INPUT_FORMAT), libavutil.AV_OPT_SEARCH_CHILDREN)
	libavutil.AvOptSetQ(uintptr(unsafe.Pointer(abuffer_ctx)), "time_base", libavutil.AVRational{1, INPUT_SAMPLERATE}, libavutil.AV_OPT_SEARCH_CHILDREN)
	libavutil.AvOptSetInt(uintptr(unsafe.Pointer(abuffer_ctx)), "sample_rate", INPUT_SAMPLERATE, libavutil.AV_OPT_SEARCH_CHILDREN)

	/* Now initialize the filter; we pass NULL options, since we have already
	 * set all the options above. */
	err = abuffer_ctx.AvfilterInitStr("")
	if err < 0 {
		fmt.Printf("Could not initialize the abuffer filter.\n")
		return err
	}

	/* Create volume filter. */
	volume = libavfilter.AvfilterGetByName("volume")
	if volume == nil {
		fmt.Printf("Could not find the volume filter.\n")
		return libavutil.AVERROR_FILTER_NOT_FOUND
	}

	volume_ctx = filter_graph.AvfilterGraphAllocFilter(volume, "volume")
	if volume_ctx == nil {
		fmt.Printf("Could not allocate the volume instance.\n")
		return -libavutil.ENOMEM
	}

	/* A different way of passing the options is as key/value pairs in a
	 * dictionary. */
	libavutil.AvDictSet(&options_dict, "volume", fmt.Sprint(VOLUME_VAL), 0)
	err = volume_ctx.AvfilterInitDict(&options_dict)
	libavutil.AvDictFree(&options_dict)
	if err < 0 {
		fmt.Printf("Could not initialize the volume filter.\n")
		return err
	}

	/* Create the aformat filter;
	 * it ensures that the output is of the format we want. */
	aformat = libavfilter.AvfilterGetByName("aformat")
	if aformat == nil {
		fmt.Printf("Could not find the aformat filter.\n")
		return libavutil.AVERROR_FILTER_NOT_FOUND
	}

	aformat_ctx = filter_graph.AvfilterGraphAllocFilter(aformat, "aformat")
	if aformat_ctx == nil {
		fmt.Printf("Could not allocate the aformat instance.\n")
		return -libavutil.ENOMEM
	}

	/* A third way of passing the options is in a string of the form
	 * key1=value1:key2=value2.... */
	// snprintf(options_str, sizeof(options_str),
	//          "sample_fmts=%s:sample_rates=%d:channel_layouts=0x%"PRIx64,
	//          av_get_sample_fmt_name(AV_SAMPLE_FMT_S16), 44100,
	//          (uint64_t)AV_CH_LAYOUT_STEREO);
	options_str = fmt.Sprintf("sample_fmts=%s:sample_rates=%d:channel_layouts=0x%x",
		libavutil.AvGetSampleFmtName(libavutil.AV_SAMPLE_FMT_S16), 44100,
		libavutil.AV_CH_LAYOUT_STEREO)
	fmt.Println(options_str)
	err = aformat_ctx.AvfilterInitStr(options_str)
	if err < 0 {
		libavutil.AvLog(uintptr(0), libavutil.AV_LOG_ERROR, "Could not initialize the aformat filter.\n")
		return err
	}

	/* Finally create the abuffersink filter;
	 * it will be used to get the filtered data out of the graph. */
	abuffersink = libavfilter.AvfilterGetByName("abuffersink")
	if abuffersink == nil {
		fmt.Printf("Could not find the abuffersink filter.\n")
		return libavutil.AVERROR_FILTER_NOT_FOUND
	}

	abuffersink_ctx = filter_graph.AvfilterGraphAllocFilter(abuffersink, "sink")
	if abuffersink_ctx == nil {
		fmt.Printf("Could not allocate the abuffersink instance.\n")
		return -libavutil.ENOMEM
	}

	/* This filter takes no options. */
	err = abuffersink_ctx.AvfilterInitStr("")
	if err < 0 {
		fmt.Printf("Could not initialize the abuffersink instance.\n")
		return err
	}

	/* Connect the filters;
	 * in this simple case the filters just form a linear chain. */
	err = abuffer_ctx.AvfilterLink(0, volume_ctx, 0)
	if err >= 0 {
		err = volume_ctx.AvfilterLink(0, aformat_ctx, 0)
	}
	if err >= 0 {
		err = aformat_ctx.AvfilterLink(0, abuffersink_ctx, 0)
	}
	if err < 0 {
		fmt.Printf("Error connecting filters\n")
		return err
	}

	/* Configure the graph. */
	err = filter_graph.AvfilterGraphConfig(uintptr(0))
	if err < 0 {
		libavutil.AvLog(uintptr(0), libavutil.AV_LOG_ERROR, "Error configuring the filter graph\n")
		return err
	}

	*graph = filter_graph
	*src = abuffer_ctx
	*sink = abuffersink_ctx

	return 0
}

/* Do something useful with the filtered data: this simple
 * example just prints the MD5 checksum of each plane to stdout. */
func process_output(md5 *libavutil.AVMD5, frame *libavutil.AVFrame) ffcommon.FInt {
	planar := libavutil.AvSampleFmtIsPlanar(libavutil.AVSampleFormat(frame.Format))
	channels := libavutil.AvGetChannelLayoutNbChannels(frame.ChannelLayout)
	planes := channels
	if planar == 0 {
		planes = 1
	}
	bps := libavutil.AvGetBytesPerSample(libavutil.AVSampleFormat(frame.Format))
	plane_size := bps * frame.NbSamples
	if planar == 0 {
		plane_size = plane_size * channels
	}
	var i, j ffcommon.FInt

	for i = 0; i < planes; i++ {
		var checksum [16]ffcommon.FUint8T

		md5.AvMd5Init()
		ptr := *(*uintptr)(unsafe.Pointer(uintptr(unsafe.Pointer(frame.ExtendedData)) + uintptr(i*8)))
		libavutil.AvMd5Sum((*byte)(unsafe.Pointer(&checksum)), (*byte)(unsafe.Pointer(ptr)), plane_size)

		fmt.Printf("plane %d: 0x", i)
		for j = 0; j < int32(len(checksum)); j++ {
			fmt.Printf("%02X", checksum[j])
		}
		fmt.Printf("\n")
	}
	fmt.Printf("\n")

	return 0
}

const FRAME_SIZE = 1024

/* Construct a frame of audio data to be filtered;
 * this simple example just synthesizes a sine wave. */
func get_input(frame *libavutil.AVFrame, frame_num ffcommon.FInt) ffcommon.FInt {
	var err, i, j ffcommon.FInt

	// #define FRAME_SIZE 1024

	/* Set up the frame properties and allocate the buffer for the data. */
	frame.SampleRate = INPUT_SAMPLERATE
	frame.Format = INPUT_FORMAT
	frame.ChannelLayout = INPUT_CHANNEL_LAYOUT
	frame.NbSamples = FRAME_SIZE
	frame.Pts = int64(frame_num) * FRAME_SIZE

	err = frame.AvFrameGetBuffer(0)
	if err < 0 {
		return err
	}

	/* Fill the data for each channel. */
	for i = 0; i < 5; i++ {
		// float *data = (float*)frame->extended_data[i];
		ptr := *(*uintptr)(unsafe.Pointer(uintptr(unsafe.Pointer(frame.ExtendedData)) + uintptr(i*8)))
		data := (*ffcommon.FFloat)(unsafe.Pointer(ptr))

		for j = 0; j < frame.NbSamples; j++ {
			*(*ffcommon.FFloat)(unsafe.Pointer(uintptr(unsafe.Pointer(data)) + uintptr(4*j))) = float32(math.Sin(2 * libavutil.M_PI * (float64(frame_num + j)) * float64((i+1)/FRAME_SIZE)))
		}
	}

	return 0
}

func main() {
	// go run ./examples/internalexamples/filter_audio/main.go 1
	os.Setenv("Path", os.Getenv("Path")+";./lib")
	ffcommon.SetAvutilPath("./lib/avutil-56.dll")
	ffcommon.SetAvcodecPath("./lib/avcodec-58.dll")
	ffcommon.SetAvdevicePath("./lib/avdevice-58.dll")
	ffcommon.SetAvfilterPath("./lib/avfilter-7.dll")
	ffcommon.SetAvformatPath("./lib/avformat-58.dll")
	ffcommon.SetAvpostprocPath("./lib/postproc-55.dll")
	ffcommon.SetAvswresamplePath("./lib/swresample-3.dll")
	ffcommon.SetAvswscalePath("./lib/swscale-5.dll")

	genDir := "./out"
	_, err := os.Stat(genDir)
	if err != nil {
		if os.IsNotExist(err) {
			os.Mkdir(genDir, 0777) //  Everyone can read write and execute
		}
	}

	main0()
}

运行结果如下:

原创声明:本文系作者授权腾讯云开发者社区发表,未经许可,不得转载。

如有侵权,请联系 cloudcommunity@tencent.com 删除。

原创声明:本文系作者授权腾讯云开发者社区发表,未经许可,不得转载。

如有侵权,请联系 cloudcommunity@tencent.com 删除。

评论
登录后参与评论
0 条评论
热度
最新
推荐阅读
目录
  • 以下是通过 Go 语言重新实现 ffmpeg 的 filter_audio.c 功能的步骤:
  • 命令如下:
  • go代码如下:
  • 运行结果如下:
相关产品与服务
实时音视频
实时音视频(Tencent RTC)基于腾讯21年来在网络与音视频技术上的深度积累,以多人音视频通话和低延时互动直播两大场景化方案,通过腾讯云服务向开发者开放,致力于帮助开发者快速搭建低成本、低延时、高品质的音视频互动解决方案。
领券
问题归档专栏文章快讯文章归档关键词归档开发者手册归档开发者手册 Section 归档