網站首頁 編程語言 正文
FFmpeg封裝了圖像的常用操作,位於libavutil/imgutils.c,包括圖像拷貝、圖像填充、獲取圖像大小、分配圖像、檢測圖像寬高比是否有效。在視頻圖像縮放、像素格式轉換、視頻截圖保存等操作中,經常需要用到這些圖像操作方法。
一、獲取圖像大小
1、av_image_get_linesize
根據圖像寬與像素格式,獲取指定平面的一行圖像大小:
/**
 * Compute the size in bytes of one image line of a single plane.
 *
 * @param pix_fmt pixel format of the image
 * @param width   image width
 * @param plane   index of the plane to query; must be in the range 0..3
 * @return the line size reported by image_get_linesize() for that plane, or
 *         AVERROR(EINVAL) if the format has no descriptor, is flagged as
 *         hardware accelerated, or plane is out of range
 */
int av_image_get_linesize(enum AVPixelFormat pix_fmt, int width, int plane)
{
    const AVPixFmtDescriptor *desc = av_pix_fmt_desc_get(pix_fmt);
    int max_step     [4];       /* max pixel step for each plane */
    int max_step_comp[4];       /* the component for each plane which has the max pixel step */

    if (!desc || desc->flags & AV_PIX_FMT_FLAG_HWACCEL)
        return AVERROR(EINVAL);

    /* plane indexes the two 4-entry arrays above; reject anything else
     * instead of reading outside of them. */
    if (plane < 0 || plane >= 4)
        return AVERROR(EINVAL);

    av_image_fill_max_pixsteps(max_step, max_step_comp, desc);
    return image_get_linesize(width, plane, max_step[plane], max_step_comp[plane], desc);
}
2、av_image_fill_linesizes
在av_image_get_linesize()基礎上,一次獲取全部4個平面的每行圖像大小:
/**
 * Fill linesizes[] with the line size of each of the four planes for an
 * image of the given pixel format and width.
 *
 * All four entries are zeroed before any validation takes place.
 *
 * @param linesizes output array, one entry per plane
 * @param pix_fmt   pixel format of the image
 * @param width     image width
 * @return 0 on success, AVERROR(EINVAL) for a format without descriptor or
 *         flagged as hardware accelerated, or the negative value returned
 *         by image_get_linesize() for the first plane that fails
 */
int av_image_fill_linesizes(int linesizes[4], enum AVPixelFormat pix_fmt, int width)
{
    const AVPixFmtDescriptor *fmt_desc = av_pix_fmt_desc_get(pix_fmt);
    int step[4];        /* max pixel step for each plane */
    int step_comp[4];   /* the component for each plane which has the max pixel step */
    int plane;

    memset(linesizes, 0, 4*sizeof(linesizes[0]));

    if (!fmt_desc || fmt_desc->flags & AV_PIX_FMT_FLAG_HWACCEL)
        return AVERROR(EINVAL);

    av_image_fill_max_pixsteps(step, step_comp, fmt_desc);

    for (plane = 0; plane < 4; plane++) {
        const int line = image_get_linesize(width, plane, step[plane],
                                            step_comp[plane], fmt_desc);

        if (line < 0)
            return line;
        linesizes[plane] = line;
    }

    return 0;
}
3、av_image_fill_plane_sizes
根據圖像的高、每行大小、像素格式,計算每個圖像平面的大小:
/**
 * Compute the size in bytes of every plane of an image.
 *
 * sizes[] is zeroed first, so planes the format does not use stay at 0.
 *
 * @param sizes     output array, one entry per plane
 * @param pix_fmt   pixel format of the image
 * @param height    image height; must be greater than 0
 * @param linesizes line size of each plane
 * @return 0 on success, AVERROR(EINVAL) if the format has no descriptor, is
 *         flagged as hardware accelerated, height is not positive, or a
 *         plane size would not fit in size_t
 */
int av_image_fill_plane_sizes(size_t sizes[4], enum AVPixelFormat pix_fmt,
                              int height, const ptrdiff_t linesizes[4])
{
    int i, has_plane[4] = { 0 };
    const AVPixFmtDescriptor *desc = av_pix_fmt_desc_get(pix_fmt);

    memset(sizes, 0, sizeof(sizes[0])*4);

    if (!desc || desc->flags & AV_PIX_FMT_FLAG_HWACCEL)
        return AVERROR(EINVAL);

    /* height is the divisor of the overflow checks below: 0 would divide by
     * zero and a negative value would be converted to a huge size_t. */
    if (height <= 0)
        return AVERROR(EINVAL);

    if (linesizes[0] > SIZE_MAX / height)
        return AVERROR(EINVAL);
    sizes[0] = linesizes[0] * (size_t)height;

    if (desc->flags & AV_PIX_FMT_FLAG_PAL ||
        desc->flags & FF_PSEUDOPAL) {
        sizes[1] = 256 * 4; /* palette is stored here as 256 32 bits words */
        return 0;
    }

    /* Mark every plane that is referenced by at least one component. */
    for (i = 0; i < 4; i++)
        has_plane[desc->comp[i].plane] = 1;

    /* Stop at the first plane that no component refers to. */
    for (i = 1; i < 4 && has_plane[i]; i++) {
        /* Planes 1 and 2 are vertically subsampled by log2_chroma_h;
         * the plane height is rounded up. */
        int h, s = (i == 1 || i == 2) ? desc->log2_chroma_h : 0;
        h = (height + (1 << s) - 1) >> s;
        if (linesizes[i] > SIZE_MAX / h)
            return AVERROR(EINVAL);
        sizes[i] = (size_t)h * linesizes[i];
    }

    return 0;
}
4、av_image_get_buffer_size
根據圖像寬高與像素格式,獲取存放整幅圖像所需的緩衝區大小,可通過align參數指定每行的對齊字節數:
/**
 * Return the number of bytes needed to store an image of the given
 * dimensions and pixel format, with every line size rounded up to align.
 *
 * @param pix_fmt pixel format of the image
 * @param width   image width
 * @param height  image height
 * @param align   alignment applied to each line size through FFALIGN()
 * @return the buffer size on success, a negative error code otherwise
 *         (AVERROR(EINVAL) for a format without descriptor or when the sum
 *         of the plane sizes exceeds INT_MAX; errors of the helper
 *         functions are passed through)
 */
int av_image_get_buffer_size(enum AVPixelFormat pix_fmt,
                             int width, int height, int align)
{
    const AVPixFmtDescriptor *fmt_desc = av_pix_fmt_desc_get(pix_fmt);
    int raw_linesize[4];
    ptrdiff_t padded_linesize[4];
    size_t plane_size[4];
    int total, err, p;

    if (!fmt_desc)
        return AVERROR(EINVAL);

    err = av_image_check_size(width, height, 0, NULL);
    if (err < 0)
        return err;

    /* Formats flagged FF_PSEUDOPAL are sized from the aligned width alone. */
    if (fmt_desc->flags & FF_PSEUDOPAL)
        return FFALIGN(width, align) * height;

    err = av_image_fill_linesizes(raw_linesize, pix_fmt, width);
    if (err < 0)
        return err;

    for (p = 0; p < 4; p++)
        padded_linesize[p] = FFALIGN(raw_linesize[p], align);

    err = av_image_fill_plane_sizes(plane_size, pix_fmt, height, padded_linesize);
    if (err < 0)
        return err;

    /* Sum the plane sizes, refusing totals that do not fit in an int. */
    total = 0;
    for (p = 0; p < 4; p++) {
        if (plane_size[p] > INT_MAX - total)
            return AVERROR(EINVAL);
        total += plane_size[p];
    }

    return total;
}
二、圖像填充
1、av_image_fill_arrays
使用源圖像緩衝區,結合圖像寬、高、像素格式,填充目標圖像的數據指針與每行大小:
/**
 * Set up dst_data[] and dst_linesize[] for an image stored in the buffer
 * src, using the given pixel format, dimensions and line alignment.
 *
 * @param dst_data     plane pointers, filled by av_image_fill_pointers()
 * @param dst_linesize line sizes, each rounded up to align
 * @param src          buffer handed to av_image_fill_pointers()
 * @param pix_fmt      pixel format of the image
 * @param width        image width
 * @param height       image height
 * @param align        alignment applied to each line size through FFALIGN()
 * @return the value returned by av_image_fill_pointers(), or the negative
 *         error code of the first helper that fails
 */
int av_image_fill_arrays(uint8_t *dst_data[4], int dst_linesize[4],
                         const uint8_t *src, enum AVPixelFormat pix_fmt,
                         int width, int height, int align)
{
    int plane;
    int err = av_image_check_size(width, height, 0, NULL);

    if (err < 0)
        return err;

    err = av_image_fill_linesizes(dst_linesize, pix_fmt, width);
    if (err < 0)
        return err;

    for (plane = 0; plane < 4; plane++) {
        const int unaligned = dst_linesize[plane];

        dst_linesize[plane] = FFALIGN(unaligned, align);
    }

    return av_image_fill_pointers(dst_data, pix_fmt, height, (uint8_t *)src, dst_linesize);
}
2、av_image_fill_black
填充圖像為黑色,如果有透明通道,就重置為不透明:
/*
 * Fill an image with black; a fourth component, if present, is set to its
 * maximum value.
 *
 * dst_data, dst_linesize: destination plane pointers and line strides.
 *     dst_data may be NULL: the format is then only validated and 0 is
 *     returned without writing anything.
 * pix_fmt: pixel format of the destination image.
 * range: for non-RGB formats, any value other than AVCOL_RANGE_JPEG selects
 *     the limited-range black level for component 0.
 * width, height: image dimensions.
 *
 * Returns 0 on success, AVERROR(EINVAL) if the format or one of its
 * components is rejected by the checks below.
 */
int av_image_fill_black(uint8_t *dst_data[4], const ptrdiff_t dst_linesize[4],
enum AVPixelFormat pix_fmt, enum AVColorRange range,
int width, int height)
{
const AVPixFmtDescriptor *desc = av_pix_fmt_desc_get(pix_fmt);
int nb_planes = av_pix_fmt_count_planes(pix_fmt);
// A pixel or a group of pixels on each plane, with a value that represents black.
uint8_t clear_block[4][MAX_BLOCK_SIZE] = {{0}}; // clear padding with 0
// Number of valid bytes in clear_block[] for each plane.
int clear_block_size[4] = {0};
// Bytes to fill per line on each plane.
ptrdiff_t plane_line_bytes[4] = {0};
int rgb, limited;
int plane, c;
if (!desc || nb_planes < 1 || nb_planes > 4 || desc->flags & AV_PIX_FMT_FLAG_HWACCEL)
return AVERROR(EINVAL);
rgb = !!(desc->flags & AV_PIX_FMT_FLAG_RGB);
limited = !rgb && range != AVCOL_RANGE_JPEG;
// Bitstream formats are filled line by line with a single byte value;
// only single-plane RGB or monochrome formats are accepted here.
if (desc->flags & AV_PIX_FMT_FLAG_BITSTREAM) {
ptrdiff_t bytewidth = av_image_get_linesize(pix_fmt, width, 0);
uint8_t *data;
int mono = pix_fmt == AV_PIX_FMT_MONOWHITE || pix_fmt == AV_PIX_FMT_MONOBLACK;
// MONOWHITE is filled with 0xFF, every other accepted format with 0.
int fill = pix_fmt == AV_PIX_FMT_MONOWHITE ? 0xFF : 0;
if (nb_planes != 1 || !(rgb || mono) || bytewidth < 1)
return AVERROR(EINVAL);
if (!dst_data)
return 0;
data = dst_data[0];
// (Bitstream + alpha will be handled incorrectly - it'll remain transparent.)
for (;height > 0; height--) {
memset(data, fill, bytewidth);
data += dst_linesize[0];
}
return 0;
}
// Per plane, the block size is the largest step of any component stored
// on that plane.
for (c = 0; c < desc->nb_components; c++) {
const AVComponentDescriptor comp = desc->comp[c];
// We try to operate on entire non-subsampled pixel groups (for
// AV_PIX_FMT_UYVY422 this would mean two consecutive pixels).
clear_block_size[comp.plane] = FFMAX(clear_block_size[comp.plane], comp.step);
if (clear_block_size[comp.plane] > MAX_BLOCK_SIZE)
return AVERROR(EINVAL);
}
// Create a byte array for clearing 1 pixel (sometimes several pixels).
for (c = 0; c < desc->nb_components; c++) {
const AVComponentDescriptor comp = desc->comp[c];
// (Multiple pixels happen e.g. with AV_PIX_FMT_UYVY422.)
int w = clear_block_size[comp.plane] / comp.step;
uint8_t *c_data[4];
const int c_linesize[4] = {0};
uint16_t src_array[MAX_BLOCK_SIZE];
// Value written for this component; stays 0 unless a case below applies.
uint16_t src = 0;
int x;
// src is a uint16_t, so deeper components cannot be represented.
if (comp.depth > 16)
return AVERROR(EINVAL);
// The shifts by (comp.depth - 8) below need a depth of at least 8.
if (!rgb && comp.depth < 8)
return AVERROR(EINVAL);
if (w < 1)
return AVERROR(EINVAL);
if (c == 0 && limited) {
// Limited range: component 0 gets 16 scaled to the component depth.
src = 16 << (comp.depth - 8);
} else if ((c == 1 || c == 2) && !rgb) {
// Non-RGB components 1 and 2 get 128 scaled to the component depth.
src = 128 << (comp.depth - 8);
} else if (c == 3) {
// (Assume even limited YUV uses full range alpha.)
src = (1 << comp.depth) - 1;
}
for (x = 0; x < w; x++)
src_array[x] = src;
// Point every plane at its clear block and write w samples of this
// component into it.
for (x = 0; x < 4; x++)
c_data[x] = &clear_block[x][0];
av_write_image_line(src_array, c_data, c_linesize, desc, 0, 0, c, w);
}
// Validate all line sizes before touching the destination.
for (plane = 0; plane < nb_planes; plane++) {
plane_line_bytes[plane] = av_image_get_linesize(pix_fmt, width, plane);
if (plane_line_bytes[plane] < 0)
return AVERROR(EINVAL);
}
if (!dst_data)
return 0;
// Fill each line of each plane with the clear block prepared above.
for (plane = 0; plane < nb_planes; plane++) {
size_t bytewidth = plane_line_bytes[plane];
uint8_t *data = dst_data[plane];
// Planes 1 and 2 are vertically subsampled by log2_chroma_h; the plane
// height is rounded up.
int chroma_div = plane == 1 || plane == 2 ? desc->log2_chroma_h : 0;
int plane_h = ((height + ( 1 << chroma_div) - 1)) >> chroma_div;
for (; plane_h > 0; plane_h--) {
memset_bytes(data, bytewidth, &clear_block[plane][0], clear_block_size[plane]);
data += dst_linesize[plane];
}
}
return 0;
}
三、圖像拷貝
1、av_image_copy_plane
拷貝單個圖像平面的像素數據:
/**
 * Copy height lines of bytewidth bytes each from src to dst.
 *
 * Nothing is copied when either pointer is NULL. The absolute value of
 * both line sizes must be at least bytewidth; this is enforced with
 * av_assert0().
 *
 * @param dst          destination plane
 * @param dst_linesize offset between consecutive destination lines
 * @param src          source plane
 * @param src_linesize offset between consecutive source lines
 * @param bytewidth    number of bytes copied per line
 * @param height       number of lines to copy
 */
static void image_copy_plane(uint8_t       *dst, ptrdiff_t dst_linesize,
                             const uint8_t *src, ptrdiff_t src_linesize,
                             ptrdiff_t bytewidth, int height)
{
    int row;

    if (!(dst && src))
        return;

    av_assert0(FFABS(src_linesize) >= bytewidth);
    av_assert0(FFABS(dst_linesize) >= bytewidth);

    /* Copy line by line, advancing each pointer by its own line size. */
    for (row = 0; row < height; row++) {
        memcpy(dst, src, bytewidth);
        dst += dst_linesize;
        src += src_linesize;
    }
}
/**
 * Public entry point for copying one image plane; takes int line sizes and
 * forwards them to image_copy_plane() as ptrdiff_t values.
 *
 * @param dst          destination plane
 * @param dst_linesize offset between consecutive destination lines
 * @param src          source plane
 * @param src_linesize offset between consecutive source lines
 * @param bytewidth    number of bytes copied per line
 * @param height       number of lines to copy
 */
void av_image_copy_plane(uint8_t       *dst, int dst_linesize,
                         const uint8_t *src, int src_linesize,
                         int bytewidth, int height)
{
    const ptrdiff_t dst_stride = dst_linesize;
    const ptrdiff_t src_stride = src_linesize;
    const ptrdiff_t row_bytes  = bytewidth;

    image_copy_plane(dst, dst_stride, src, src_stride, row_bytes, height);
}
2、av_image_copy
根據圖像的寬、高、像素格式,進行整幅圖像的拷貝:
/**
 * Copy an image from src_data to dst_data.
 *
 * The int line sizes are widened to ptrdiff_t and the copy itself is
 * delegated to image_copy(), with image_copy_plane() as per-plane callback.
 *
 * @param dst_data      destination plane pointers
 * @param dst_linesizes destination line sizes
 * @param src_data      source plane pointers
 * @param src_linesizes source line sizes
 * @param pix_fmt       pixel format of the image
 * @param width         image width
 * @param height        image height
 */
void av_image_copy(uint8_t *dst_data[4], int dst_linesizes[4],
                   const uint8_t *src_data[4], const int src_linesizes[4],
                   enum AVPixelFormat pix_fmt, int width, int height)
{
    ptrdiff_t dst_strides[4];
    ptrdiff_t src_strides[4];
    int plane = 0;

    while (plane < 4) {
        dst_strides[plane] = dst_linesizes[plane];
        src_strides[plane] = src_linesizes[plane];
        plane++;
    }

    image_copy(dst_data, dst_strides, src_data, src_strides, pix_fmt,
               width, height, image_copy_plane);
}
3、av_image_copy_to_buffer
把圖像數據拷貝到指定緩衝區:
/**
 * Copy an image into the buffer dst, plane after plane, advancing dst by
 * the line size rounded up to align after every line.
 *
 * @param dst          destination buffer
 * @param dst_size     size of the destination buffer in bytes
 * @param src_data     source plane pointers
 * @param src_linesize source line sizes
 * @param pix_fmt      pixel format of the image
 * @param width        image width
 * @param height       image height
 * @param align        alignment applied to each destination line
 * @return the size computed by av_image_get_buffer_size() on success,
 *         AVERROR(EINVAL) if that size is negative or larger than dst_size,
 *         or if the format has no descriptor
 */
int av_image_copy_to_buffer(uint8_t *dst, int dst_size,
                            const uint8_t * const src_data[4],
                            const int src_linesize[4],
                            enum AVPixelFormat pix_fmt,
                            int width, int height, int align)
{
    const int required = av_image_get_buffer_size(pix_fmt, width, height, align);
    const AVPixFmtDescriptor *fmt_desc = av_pix_fmt_desc_get(pix_fmt);
    int row_bytes[4];
    int last_plane = 0;
    int plane_count, comp, plane, row, entry, err;

    if (!fmt_desc || required < 0 || required > dst_size)
        return AVERROR(EINVAL);

    /* The plane count is the highest plane index of any component, plus one. */
    for (comp = 0; comp < fmt_desc->nb_components; comp++)
        last_plane = FFMAX(fmt_desc->comp[comp].plane, last_plane);
    plane_count = last_plane + 1;

    /* Number of bytes occupied by one line of each plane. */
    err = av_image_fill_linesizes(row_bytes, pix_fmt, width);
    av_assert0(err >= 0); // was checked previously

    for (plane = 0; plane < plane_count; plane++) {
        /* Planes 1 and 2 are vertically subsampled by log2_chroma_h;
         * the plane height is rounded up. */
        const int v_shift = (plane == 1 || plane == 2) ? fmt_desc->log2_chroma_h : 0;
        const int rows    = (height + (1 << v_shift) - 1) >> v_shift;
        const uint8_t *src_row = src_data[plane];

        /* Copy line by line. */
        for (row = 0; row < rows; row++) {
            memcpy(dst, src_row, row_bytes[plane]);
            dst     += FFALIGN(row_bytes[plane], align);
            src_row += src_linesize[plane];
        }
    }

    /* For paletted formats, append the 256 palette entries read from
     * src_data[1], written with AV_WL32(). */
    if (fmt_desc->flags & AV_PIX_FMT_FLAG_PAL) {
        uint32_t *pal_out = (uint32_t *)dst;

        for (entry = 0; entry < 256; entry++)
            AV_WL32(pal_out + entry, AV_RN32(src_data[1] + 4*entry));
    }

    return required;
}
四、圖像分配
1、av_image_alloc
根據圖像的寬、高、像素格式來分配內存,代碼如下:
/**
 * Allocate a buffer for an image of size w x h and pixel format pix_fmt,
 * and fill pointers[] and linesizes[] accordingly.
 *
 * The buffer is obtained with a single av_malloc() call and split into
 * planes by av_image_fill_pointers().
 *
 * @param pointers  plane pointers of the allocated image; reset to NULL
 *                  when the buffer is released on an error path
 * @param linesizes line sizes of the image, each rounded up to align
 * @param w         image width
 * @param h         image height
 * @param pix_fmt   pixel format of the image
 * @param align     alignment applied to each line size; formats with a
 *                  palette require at least 4
 * @return the value returned by av_image_fill_pointers() on success, a
 *         negative error code otherwise (AVERROR(EINVAL) for invalid
 *         arguments, AVERROR(ENOMEM) when the allocation fails)
 */
int av_image_alloc(uint8_t *pointers[4], int linesizes[4],
                   int w, int h, enum AVPixelFormat pix_fmt, int align)
{
    const AVPixFmtDescriptor *desc = av_pix_fmt_desc_get(pix_fmt);
    int i, ret;
    ptrdiff_t linesizes1[4];
    size_t total_size, sizes[4];
    uint8_t *buf;

    if (!desc)
        return AVERROR(EINVAL);

    if ((ret = av_image_check_size(w, h, 0, NULL)) < 0)
        return ret;
    /* With an alignment of 8 or more, line sizes are computed for the width
     * rounded up to a multiple of 8. */
    if ((ret = av_image_fill_linesizes(linesizes, pix_fmt, align>7 ? FFALIGN(w, 8) : w)) < 0)
        return ret;

    for (i = 0; i < 4; i++) {
        linesizes[i] = FFALIGN(linesizes[i], align);
        linesizes1[i] = linesizes[i];
    }

    if ((ret = av_image_fill_plane_sizes(sizes, pix_fmt, h, linesizes1)) < 0)
        return ret;

    /* Total allocation: align extra bytes plus all plane sizes, with an
     * overflow check on every addition. */
    total_size = align;
    for (i = 0; i < 4; i++) {
        if (total_size > SIZE_MAX - sizes[i])
            return AVERROR(EINVAL);
        total_size += sizes[i];
    }

    buf = av_malloc(total_size);
    if (!buf)
        return AVERROR(ENOMEM);

    if ((ret = av_image_fill_pointers(pointers, pix_fmt, h, buf, linesizes)) < 0) {
        av_free(buf);
        /* Do not hand pointers into the freed buffer back to the caller. */
        memset(pointers, 0, 4 * sizeof(pointers[0]));
        return ret;
    }

    if (desc->flags & AV_PIX_FMT_FLAG_PAL || (desc->flags & FF_PSEUDOPAL && pointers[1])) {
        /* Validate the alignment before the palette is written through a
         * uint32_t pointer, not after. */
        if (align < 4) {
            av_log(NULL, AV_LOG_ERROR, "Formats with a palette require a minimum alignment of 4\n");
            av_free(buf);
            memset(pointers, 0, 4 * sizeof(pointers[0]));
            return AVERROR(EINVAL);
        }
        avpriv_set_systematic_pal2((uint32_t*)pointers[1], pix_fmt);
    }

    if ((desc->flags & AV_PIX_FMT_FLAG_PAL ||
         desc->flags & FF_PSEUDOPAL) && pointers[1] &&
        pointers[1] - pointers[0] > linesizes[0] * h) {
        /* zero-initialize the padding before the palette */
        memset(pointers[0] + linesizes[0] * h, 0,
               pointers[1] - pointers[0] - linesizes[0] * h);
    }

    return ret;
}
五、檢測圖像是否有效
1、av_image_check_sar
根據圖像寬高與採樣寬高比檢測圖像是否有效,sar代表sample aspect ratio:
/**
 * Check whether a sample aspect ratio is usable for an image of w x h.
 *
 * @param w   image width
 * @param h   image height
 * @param sar sample aspect ratio to check
 * @return 0 if the ratio is accepted, AVERROR(EINVAL) if its denominator is
 *         not positive, its numerator is negative, or scaling the relevant
 *         dimension by it (rounding toward zero) does not give a positive
 *         value
 */
int av_image_check_sar(unsigned int w, unsigned int h, AVRational sar)
{
    int64_t scaled;

    if (sar.num < 0 || sar.den <= 0)
        return AVERROR(EINVAL);

    /* A zero numerator or a 1:1 ratio is accepted without scaling. */
    if (sar.num == 0 || sar.num == sar.den)
        return 0;

    /* Ratios below 1 scale the width, ratios above 1 scale the height. */
    scaled = sar.num < sar.den
           ? av_rescale_rnd(w, sar.num, sar.den, AV_ROUND_ZERO)
           : av_rescale_rnd(h, sar.den, sar.num, AV_ROUND_ZERO);

    return scaled > 0 ? 0 : AVERROR(EINVAL);
}
六、圖像操作實例
當解碼出一個視頻幀後,需要判斷渲染層是否支持該幀的像素格式,當然也可以在OpenGL渲染層適配不同的像素格式。以下實例是在Android平臺使用FFmpeg解碼:如果像素格式不支持,則先轉換為YUV420P;如果支持,則直接拷貝到輸出緩衝區:
/**
 * Write a decoded frame into the Java-side output buffer.
 *
 * Frames whose pixel format is in the supported list are copied as they
 * are; any other format is converted to AV_PIX_FMT_YUV420P with the
 * SwsContext stored in context->opaque.
 *
 * @param env          JNI environment of the calling thread
 * @param context      codec context; its opaque field is read as a
 *                     struct SwsContext * when a conversion is needed
 * @param frame        decoded frame to output
 * @param outputBuffer Java output buffer object; initForYuvFrame is invoked
 *                     on it and its dataField is read as a direct buffer
 * @return NO_ERROR on success, OUTPUT_BUFFER_ALLOCATE_FAILED otherwise
 *
 * NOTE(review): OUTPUT_BUFFER_ALLOCATE_FAILED is the only failure code
 * visible in this snippet, so it is also returned for copy/conversion
 * failures; switch to a dedicated code if the project defines one.
 */
int putFrameToBuffer(JNIEnv *env, AVCodecContext *context, AVFrame *frame,
                     jobject outputBuffer) {
    static const int supportFormats[] = {AV_PIX_FMT_YUV420P, AV_PIX_FMT_YUVJ420P, AV_PIX_FMT_YUV420P10LE};
    const int supportFormatCount = (int) (sizeof(supportFormats) / sizeof(supportFormats[0]));
    int outputLineSize[4];
    int outputFormat = frame->format;
    bool isFormatSupported = false;

    // Check whether the frame already uses one of the supported formats.
    for (int i = 0; i < supportFormatCount; i++) {
        if (supportFormats[i] == frame->format) {
            isFormatSupported = true;
            break;
        }
    }
    // Unsupported formats are converted to YUV420P.
    if (!isFormatSupported) {
        outputFormat = AV_PIX_FMT_YUV420P;
    }
    // Compute the line size of every plane; without it the output buffer
    // cannot be dimensioned.
    if (av_image_fill_linesizes(outputLineSize, (enum AVPixelFormat) (outputFormat),
                                frame->width) < 0) {
        return OUTPUT_BUFFER_ALLOCATE_FAILED;
    }
    jboolean initResult = (*env)->CallBooleanMethod(env,
                                                    outputBuffer,
                                                    initForYuvFrame,
                                                    frame->width,
                                                    frame->height,
                                                    outputLineSize[0],
                                                    outputLineSize[1]);
    if ((*env)->ExceptionCheck(env) || !initResult) {
        return OUTPUT_BUFFER_ALLOCATE_FAILED;
    }
    const jobject dataObject = (*env)->GetObjectField(env, outputBuffer, dataField);
    if (!dataObject) {
        return OUTPUT_BUFFER_ALLOCATE_FAILED;
    }
    // GetDirectBufferAddress yields NULL when the object is not a direct
    // buffer; never write through a NULL destination.
    jbyte *const data = (jbyte *) ((*env)->GetDirectBufferAddress(env, dataObject));
    if (!data) {
        return OUTPUT_BUFFER_ALLOCATE_FAILED;
    }
    // Convert when the format is unsupported, otherwise copy straight into
    // the output buffer.
    if (!isFormatSupported) {
        struct SwsContext *swsContext = context->opaque;
        uint8_t *dst_data[4];
        if (!swsContext) {
            return OUTPUT_BUFFER_ALLOCATE_FAILED;
        }
        if (av_image_fill_pointers(dst_data,
                                   (enum AVPixelFormat) outputFormat,
                                   frame->height,
                                   (uint8_t *) data,
                                   outputLineSize) < 0) {
            return OUTPUT_BUFFER_ALLOCATE_FAILED;
        }
        // Pixel format conversion.
        if (sws_scale(swsContext,
                      (const uint8_t **) frame->data,
                      frame->linesize,
                      0,
                      frame->height,
                      dst_data,
                      outputLineSize) < 0) {
            return OUTPUT_BUFFER_ALLOCATE_FAILED;
        }
    } else {
        // Size of the tightly packed (align = 1) image.
        int outputSize = av_image_get_buffer_size((enum AVPixelFormat) frame->format,
                                                  frame->width,
                                                  frame->height,
                                                  1);
        if (outputSize < 0) {
            return OUTPUT_BUFFER_ALLOCATE_FAILED;
        }
        // Copy into the output buffer.
        if (av_image_copy_to_buffer((uint8_t *) data,
                                    outputSize,
                                    (const uint8_t *const *) frame->data,
                                    frame->linesize,
                                    (enum AVPixelFormat) frame->format,
                                    frame->width,
                                    frame->height,
                                    1) < 0) {
            return OUTPUT_BUFFER_ALLOCATE_FAILED;
        }
    }
    return NO_ERROR;
}
原文鏈接:https://blog.csdn.net/tonychan129/article/details/127033199
相關推薦
- 2022-11-27 Go 微服務開發框架DMicro設計思路詳解_Golang
- 2022-07-14 詳解HBase表的數據模型_其它綜合
- 2022-09-15 .Net站點設置多個路由對應同一個Action_實用技巧
- 2022-08-11 Go語言Grpc Stream的實現_Golang
- 2022-08-04 python中可以發生異常自動重試庫retrying_python
- 2023-07-14 express+mongoose實現無限級分類
- 2022-03-20 如何在Go中將[]byte轉換為io.Reader_Golang
- 2022-08-16 c#中使用BackgroundWorker的實現_C#教程
- 最近更新
-
- window11 系統安裝 yarn
- 超詳細win安裝深度學習環境2025年最新版(
- Linux 中運行的top命令 怎么退出?
- MySQL 中decimal 的用法? 存儲小
- get 、set 、toString 方法的使
- @Resource和 @Autowired注解
- Java基礎操作-- 運算符,流程控制 Flo
- 1. Int 和Integer 的區別,Jav
- spring @retryable不生效的一種
- Spring Security之認證信息的處理
- Spring Security之認證過濾器
- Spring Security概述快速入門
- Spring Security之配置體系
- 【SpringBoot】SpringCache
- Spring Security之基于方法配置權
- redisson分布式鎖中waittime的設
- maven:解決release錯誤:Artif
- restTemplate使用總結
- Spring Security之安全異常處理
- MybatisPlus優雅實現加密?
- Spring ioc容器與Bean的生命周期。
- 【探索SpringCloud】服務發現-Nac
- Spring Security之基于HttpR
- Redis 底層數據結構-簡單動態字符串(SD
- arthas操作spring被代理目標對象命令
- Spring中的單例模式應用詳解
- 聊聊消息隊列,發(fā)送消息的4種方式
- bootspring第三方資源配置管理
- GIT同步修改后的遠程分支