Coverage Report

Created: 2025-06-22 08:04

/src/aom/aom_dsp/pyramid.c
/*
 * Copyright (c) 2022, Alliance for Open Media. All rights reserved.
 *
 * This source code is subject to the terms of the BSD 2 Clause License and
 * the Alliance for Open Media Patent License 1.0. If the BSD 2 Clause License
 * was not distributed with this source code in the LICENSE file, you can
 * obtain it at www.aomedia.org/license/software. If the Alliance for Open
 * Media Patent License 1.0 was not distributed with this source code in the
 * PATENTS file, you can obtain it at www.aomedia.org/license/patent.
 */

#include "aom_dsp/pyramid.h"
#include "aom_mem/aom_mem.h"
#include "aom_ports/bitops.h"
#include "aom_util/aom_pthread.h"

// TODO(rachelbarker): Move needed code from av1/ to aom_dsp/
#include "av1/common/resize.h"

#include <assert.h>
#include <string.h>

// Lifecycle:
// * Frame buffer alloc code calls aom_get_pyramid_alloc_size()
//   to work out how much space is needed for a given number of pyramid
//   levels. This size is counted toward the total that is checked against
//   the maximum allocation limit.
// * It then calls aom_alloc_pyramid() to actually create the pyramid.
// * The pyramid is initially marked as containing no valid data.
// * Each pyramid layer is computed on demand, the first time it is requested.
// * Whenever the frame buffer is reused, reset the counter of filled levels.
//   This invalidates all of the existing pyramid levels.
// * Whenever the frame buffer is resized, reallocate the pyramid.
// An illustrative sketch of this calling sequence follows.
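
// Illustrative sketch of the lifecycle described above. This helper is not
// part of the original file; its name and the hard-coded level count are
// assumptions made purely for illustration.
static inline void example_pyramid_lifecycle(const YV12_BUFFER_CONFIG *frame,
                                             int width, int height,
                                             int bit_depth) {
  // 1) Budget check: this size is counted against the max allocation limit.
  const size_t pyr_size = aom_get_pyramid_alloc_size(width, height, false);
  (void)pyr_size;

  // 2) Create the pyramid; it initially contains no valid levels.
  ImagePyramid *pyr = aom_alloc_pyramid(width, height, false);
  if (!pyr) return;

  // 3) Levels are computed on demand, the first time they are requested.
  (void)aom_compute_pyramid(frame, bit_depth, /*n_levels=*/4, pyr);

  // 4) When the underlying frame buffer is reused, invalidate all levels.
  aom_invalidate_pyramid(pyr);

  // 5) When the frame buffer is resized or no longer needed, free the pyramid
  //    (and, on resize, allocate a new one with the new dimensions).
  aom_free_pyramid(pyr);
}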

size_t aom_get_pyramid_alloc_size(int width, int height, bool image_is_16bit) {
  // Allocate the maximum possible number of layers for this width and height
  const int msb = get_msb(AOMMIN(width, height));
  const int n_levels = AOMMAX(msb - MIN_PYRAMID_SIZE_LOG2, 1);
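  // (Illustrative example, not in the original file: for a 1920x1080 frame,
  // get_msb(1080) is 10, so if MIN_PYRAMID_SIZE_LOG2 were 3 this would permit
  // up to 7 pyramid levels.)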

  size_t alloc_size = 0;
  alloc_size += sizeof(ImagePyramid);
  alloc_size += n_levels * sizeof(PyramidLayer);

  // Calculate how much memory is needed for downscaled frame buffers
  size_t buffer_size = 0;

  // Work out if we need to allocate a few extra bytes for alignment.
  // aom_memalign() will ensure that the start of the allocation is aligned
  // to a multiple of PYRAMID_ALIGNMENT. But we want the first image pixel
  // to be aligned, not the first byte of the allocation.
  //
  // In the loop below, we ensure that the stride of every image is a multiple
  // of PYRAMID_ALIGNMENT. Thus the allocated size of each pyramid level will
  // also be a multiple of PYRAMID_ALIGNMENT. Thus, as long as we can get the
  // first pixel in the first pyramid layer aligned properly, that will
  // automatically mean that the first pixel of every row of every layer is
  // properly aligned too.
  //
  // Thus all we need to consider is the first pixel in the first layer.
  // This is located at offset
  //   extra_bytes + level_stride * PYRAMID_PADDING + PYRAMID_PADDING
  // bytes into the buffer. Since level_stride is a multiple of
  // PYRAMID_ALIGNMENT, we can ignore that. So we need
  //   extra_bytes + PYRAMID_PADDING = multiple of PYRAMID_ALIGNMENT
  //
  // To solve this, we can round PYRAMID_PADDING up to the next multiple
  // of PYRAMID_ALIGNMENT, then subtract the original value to calculate
  // how many extra bytes are needed.
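  // (Illustrative example, not in the original file: if PYRAMID_PADDING were
  // 16 and PYRAMID_ALIGNMENT were 32, then
  // first_px_offset = (16 + 31) & ~31 = 32 and extra_bytes = 32 - 16 = 16.)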
  size_t first_px_offset =
      (PYRAMID_PADDING + PYRAMID_ALIGNMENT - 1) & ~(PYRAMID_ALIGNMENT - 1);
  size_t extra_bytes = first_px_offset - PYRAMID_PADDING;
  buffer_size += extra_bytes;

  // If the original image is stored in an 8-bit buffer, then we can point the
  // lowest pyramid level at that buffer rather than allocating a new one.
  int first_allocated_level = image_is_16bit ? 0 : 1;

  for (int level = first_allocated_level; level < n_levels; level++) {
    int level_width = width >> level;
    int level_height = height >> level;

    // Allocate padding for each layer
    int padded_width = level_width + 2 * PYRAMID_PADDING;
    int padded_height = level_height + 2 * PYRAMID_PADDING;

    // Align the layer stride to be a multiple of PYRAMID_ALIGNMENT
    // This ensures that, as long as the top-left pixel in this pyramid level
    // is properly aligned, the leftmost pixel in every row of the pyramid
    // level will be too.
    int level_stride =
        (padded_width + PYRAMID_ALIGNMENT - 1) & ~(PYRAMID_ALIGNMENT - 1);

    buffer_size += level_stride * padded_height;
  }

  alloc_size += buffer_size;

  return alloc_size;
}

ImagePyramid *aom_alloc_pyramid(int width, int height, bool image_is_16bit) {
  // Allocate the maximum possible number of layers for this width and height
  const int msb = get_msb(AOMMIN(width, height));
  const int n_levels = AOMMAX(msb - MIN_PYRAMID_SIZE_LOG2, 1);

  ImagePyramid *pyr = aom_calloc(1, sizeof(*pyr));
  if (!pyr) {
    return NULL;
  }

  pyr->layers = aom_calloc(n_levels, sizeof(*pyr->layers));
  if (!pyr->layers) {
    aom_free(pyr);
    return NULL;
  }

  pyr->max_levels = n_levels;
  pyr->filled_levels = 0;

  // Compute sizes and offsets for each pyramid level
  // These are gathered up first, so that we can allocate all pyramid levels
  // in a single buffer
  size_t buffer_size = 0;
  size_t *layer_offsets = aom_calloc(n_levels, sizeof(*layer_offsets));
  if (!layer_offsets) {
    aom_free(pyr->layers);
    aom_free(pyr);
    return NULL;
  }

  // Work out if we need to allocate a few extra bytes for alignment.
  // aom_memalign() will ensure that the start of the allocation is aligned
  // to a multiple of PYRAMID_ALIGNMENT. But we want the first image pixel
  // to be aligned, not the first byte of the allocation.
  //
  // In the loop below, we ensure that the stride of every image is a multiple
  // of PYRAMID_ALIGNMENT. Thus the allocated size of each pyramid level will
  // also be a multiple of PYRAMID_ALIGNMENT. Thus, as long as we can get the
  // first pixel in the first pyramid layer aligned properly, that will
  // automatically mean that the first pixel of every row of every layer is
  // properly aligned too.
  //
  // Thus all we need to consider is the first pixel in the first layer.
  // This is located at offset
  //   extra_bytes + level_stride * PYRAMID_PADDING + PYRAMID_PADDING
  // bytes into the buffer. Since level_stride is a multiple of
  // PYRAMID_ALIGNMENT, we can ignore that. So we need
  //   extra_bytes + PYRAMID_PADDING = multiple of PYRAMID_ALIGNMENT
  //
  // To solve this, we can round PYRAMID_PADDING up to the next multiple
  // of PYRAMID_ALIGNMENT, then subtract the original value to calculate
  // how many extra bytes are needed.
  size_t first_px_offset =
      (PYRAMID_PADDING + PYRAMID_ALIGNMENT - 1) & ~(PYRAMID_ALIGNMENT - 1);
  size_t extra_bytes = first_px_offset - PYRAMID_PADDING;
  buffer_size += extra_bytes;

  // If the original image is stored in an 8-bit buffer, then we can point the
  // lowest pyramid level at that buffer rather than allocating a new one.
  int first_allocated_level = image_is_16bit ? 0 : 1;

  for (int level = first_allocated_level; level < n_levels; level++) {
    PyramidLayer *layer = &pyr->layers[level];

    int level_width = width >> level;
    int level_height = height >> level;

    // Allocate padding for each layer
    int padded_width = level_width + 2 * PYRAMID_PADDING;
    int padded_height = level_height + 2 * PYRAMID_PADDING;

    // Align the layer stride to be a multiple of PYRAMID_ALIGNMENT
    // This ensures that, as long as the top-left pixel in this pyramid level
    // is properly aligned, the leftmost pixel in every row of the pyramid
    // level will be too.
    int level_stride =
        (padded_width + PYRAMID_ALIGNMENT - 1) & ~(PYRAMID_ALIGNMENT - 1);

    size_t level_alloc_start = buffer_size;
    size_t level_start =
        level_alloc_start + PYRAMID_PADDING * level_stride + PYRAMID_PADDING;

    buffer_size += level_stride * padded_height;

    layer_offsets[level] = level_start;
    layer->width = level_width;
    layer->height = level_height;
    layer->stride = level_stride;
  }

  pyr->buffer_alloc =
      aom_memalign(PYRAMID_ALIGNMENT, buffer_size * sizeof(*pyr->buffer_alloc));
  if (!pyr->buffer_alloc) {
    aom_free(pyr->layers);
    aom_free(pyr);
    aom_free(layer_offsets);
    return NULL;
  }

  // Fill in pointers for each level
  // If image is 8-bit, then the lowest level is left unconfigured for now,
  // and will be set up properly when the pyramid is filled in
  for (int level = first_allocated_level; level < n_levels; level++) {
    PyramidLayer *layer = &pyr->layers[level];
    layer->buffer = pyr->buffer_alloc + layer_offsets[level];
  }

#if CONFIG_MULTITHREAD
  pthread_mutex_init(&pyr->mutex, NULL);
#endif  // CONFIG_MULTITHREAD

  aom_free(layer_offsets);
  return pyr;
}

// Fill the border region of a pyramid frame.
// This must be called after the main image area is filled out.
// `img_buf` should point to the first pixel in the image area,
// i.e. it should be pyr->layers[level].buffer.
static inline void fill_border(uint8_t *img_buf, const int width,
                               const int height, const int stride) {
  // Fill left and right areas
  for (int row = 0; row < height; row++) {
    uint8_t *row_start = &img_buf[row * stride];
    uint8_t left_pixel = row_start[0];
    memset(row_start - PYRAMID_PADDING, left_pixel, PYRAMID_PADDING);
    uint8_t right_pixel = row_start[width - 1];
    memset(row_start + width, right_pixel, PYRAMID_PADDING);
  }

  // Fill top area
  for (int row = -PYRAMID_PADDING; row < 0; row++) {
    uint8_t *row_start = &img_buf[row * stride];
    memcpy(row_start - PYRAMID_PADDING, img_buf - PYRAMID_PADDING,
           width + 2 * PYRAMID_PADDING);
  }

  // Fill bottom area
  uint8_t *last_row_start = &img_buf[(height - 1) * stride];
  for (int row = height; row < height + PYRAMID_PADDING; row++) {
    uint8_t *row_start = &img_buf[row * stride];
    memcpy(row_start - PYRAMID_PADDING, last_row_start - PYRAMID_PADDING,
           width + 2 * PYRAMID_PADDING);
  }
}

// Compute downsampling pyramid for a frame
//
// This function will ensure that the first `n_levels` levels of the pyramid
// are filled, unless the frame is too small to have this many levels.
// In that case, we will fill all available levels and then stop.
//
// Returns the actual number of levels filled, capped at n_levels,
// or -1 on error.
//
// This must only be called while holding frame_pyr->mutex
static inline int fill_pyramid(const YV12_BUFFER_CONFIG *frame, int bit_depth,
                               int n_levels, ImagePyramid *frame_pyr) {
  int already_filled_levels = frame_pyr->filled_levels;

  // This condition should already be enforced by aom_compute_pyramid
  assert(n_levels <= frame_pyr->max_levels);

  if (already_filled_levels >= n_levels) {
    return n_levels;
  }

  const int frame_width = frame->y_crop_width;
  const int frame_height = frame->y_crop_height;
  const int frame_stride = frame->y_stride;
  assert((frame_width >> n_levels) >= 0);
  assert((frame_height >> n_levels) >= 0);

  if (already_filled_levels == 0) {
    // Fill in the largest level from the original image
    PyramidLayer *first_layer = &frame_pyr->layers[0];
    if (frame->flags & YV12_FLAG_HIGHBITDEPTH) {
      // For frames stored in a 16-bit buffer, we need to downconvert to 8 bits
      assert(first_layer->width == frame_width);
      assert(first_layer->height == frame_height);

      uint16_t *frame_buffer = CONVERT_TO_SHORTPTR(frame->y_buffer);
      uint8_t *pyr_buffer = first_layer->buffer;
      int pyr_stride = first_layer->stride;
      for (int y = 0; y < frame_height; y++) {
        uint16_t *frame_row = frame_buffer + y * frame_stride;
        uint8_t *pyr_row = pyr_buffer + y * pyr_stride;
        for (int x = 0; x < frame_width; x++) {
          pyr_row[x] = frame_row[x] >> (bit_depth - 8);
        }
      }

      fill_border(pyr_buffer, frame_width, frame_height, pyr_stride);
    } else {
      // For frames stored in an 8-bit buffer, we don't need to copy anything -
      // we can just reference the original image buffer
      first_layer->buffer = frame->y_buffer;
      first_layer->width = frame_width;
      first_layer->height = frame_height;
      first_layer->stride = frame_stride;
    }

    already_filled_levels = 1;
  }

  // Fill in the remaining levels through progressive downsampling
  for (int level = already_filled_levels; level < n_levels; ++level) {
    bool mem_status = false;
    PyramidLayer *prev_layer = &frame_pyr->layers[level - 1];
    uint8_t *prev_buffer = prev_layer->buffer;
    int prev_stride = prev_layer->stride;

    PyramidLayer *this_layer = &frame_pyr->layers[level];
    uint8_t *this_buffer = this_layer->buffer;
    int this_width = this_layer->width;
    int this_height = this_layer->height;
    int this_stride = this_layer->stride;

    // The width and height of the previous layer that need to be considered
    // to derive the current layer.
    const int input_layer_width = this_width << 1;
    const int input_layer_height = this_height << 1;

    // Compute this pyramid level by downsampling the previous level.
    //
    // We downsample by a factor of exactly 2, clipping the rightmost column
    // and bottommost row of the previous level if needed. We do this for
    // two main reasons:
    //
    // 1) In the disflow code, when stepping from a higher pyramid level to a
    //    lower pyramid level, we need to not just interpolate the flow field
    //    but also to scale each flow vector by the upsampling ratio.
    //    So it is much more convenient if this ratio is simply 2.
    //
    // 2) Up/downsampling by a factor of 2 can be implemented much more
    //    efficiently than up/downsampling by a generic ratio.
    //    TODO(rachelbarker): Use optimized downsample-by-2 function

    // SIMD support has been added specifically for cases where the downsample
    // factor is exactly 2. In such instances, horizontal and vertical resizing
    // is performed using the down2_symeven() function, which operates on the
    // even dimensions of the input layer.
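    // (Illustrative example, not in the original file: if the previous layer
    // is 101 x 57, this layer is 50 x 28, so only the top-left 100 x 56
    // region of the previous layer is used as input; its rightmost column and
    // bottommost row are clipped.)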
    if (should_resize_by_half(input_layer_height, input_layer_width,
                              this_height, this_width)) {
      assert(input_layer_height % 2 == 0 && input_layer_width % 2 == 0 &&
             "Input width or height cannot be odd.");
      mem_status = av1_resize_plane_to_half(
          prev_buffer, input_layer_height, input_layer_width, prev_stride,
          this_buffer, this_height, this_width, this_stride);
    } else {
      mem_status = av1_resize_plane(prev_buffer, input_layer_height,
                                    input_layer_width, prev_stride, this_buffer,
                                    this_height, this_width, this_stride);
    }

    // Terminate early in cases of memory allocation failure.
    if (!mem_status) {
      frame_pyr->filled_levels = n_levels;
      return -1;
    }

    fill_border(this_buffer, this_width, this_height, this_stride);
  }

  frame_pyr->filled_levels = n_levels;
  return n_levels;
}

// Fill out a downsampling pyramid for a given frame.
//
// The top level (index 0) will always be an 8-bit copy of the input frame,
// regardless of the input bit depth. Additional levels are then downscaled
// by powers of 2.
//
// This function will ensure that the first `n_levels` levels of the pyramid
// are filled, unless the frame is too small to have this many levels.
// In that case, we will fill all available levels and then stop.
// No matter how small the frame is, at least one level is guaranteed
// to be filled.
//
// Returns the actual number of levels filled, capped at n_levels,
// or -1 on error.
int aom_compute_pyramid(const YV12_BUFFER_CONFIG *frame, int bit_depth,
                        int n_levels, ImagePyramid *pyr) {
  assert(pyr);

  // Per the comments in the ImagePyramid struct, we must take this mutex
  // before reading or writing the filled_levels field, and hold it while
  // computing any additional pyramid levels, to ensure proper behaviour
  // when multithreading is used
#if CONFIG_MULTITHREAD
  pthread_mutex_lock(&pyr->mutex);
#endif  // CONFIG_MULTITHREAD

  n_levels = AOMMIN(n_levels, pyr->max_levels);
  int result = n_levels;
  if (pyr->filled_levels < n_levels) {
    // Compute any missing levels that we need
    result = fill_pyramid(frame, bit_depth, n_levels, pyr);
  }

  // At this point, as long as result >= 0, the requested number of pyramid
  // levels are guaranteed to be valid, and can be safely read from without
  // holding the mutex any further
  assert(IMPLIES(result >= 0, pyr->filled_levels >= n_levels));
#if CONFIG_MULTITHREAD
  pthread_mutex_unlock(&pyr->mutex);
#endif  // CONFIG_MULTITHREAD
  return result;
}
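
// Illustrative caller sketch, not part of the original file. It shows how the
// return value of aom_compute_pyramid() can be handled; the helper's name and
// the requested level count are assumptions for illustration only.
static inline int example_request_pyramid_levels(
    const YV12_BUFFER_CONFIG *frame, int bit_depth, ImagePyramid *pyr) {
  // Request more levels than may exist; the result is capped at
  // pyr->max_levels, while -1 signals an allocation failure during resizing.
  const int filled =
      aom_compute_pyramid(frame, bit_depth, /*n_levels=*/16, pyr);
  if (filled < 0) return -1;  // Propagate the error to the caller.

  // On success, the first `filled` levels are valid and can be read without
  // holding pyr->mutex any further.
  return filled;
}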

#ifndef NDEBUG
// Check if a pyramid has already been computed to at least n levels
// This is mostly a debug helper - as it is necessary to hold pyr->mutex
// while reading the number of already-computed levels, we cannot just write:
//   assert(pyr->filled_levels >= n_levels);
// This function allows the check to be correctly written as:
//   assert(aom_is_pyramid_valid(pyr, n_levels));
//
// Note: This deliberately does not restrict n_levels based on the maximum
// number of permitted levels for the frame size. This allows the check to
// catch cases where the caller forgets to handle the case where
// max_levels is less than the requested number of levels
bool aom_is_pyramid_valid(ImagePyramid *pyr, int n_levels) {
  assert(pyr);

  // Per the comments in the ImagePyramid struct, we must take this mutex
  // before reading or writing the filled_levels field, to ensure proper
  // behaviour when multithreading is used
#if CONFIG_MULTITHREAD
  pthread_mutex_lock(&pyr->mutex);
#endif  // CONFIG_MULTITHREAD

  bool result = (pyr->filled_levels >= n_levels);

#if CONFIG_MULTITHREAD
  pthread_mutex_unlock(&pyr->mutex);
#endif  // CONFIG_MULTITHREAD

  return result;
}
#endif

// Mark a pyramid as no longer containing valid data.
// This must be done whenever the corresponding frame buffer is reused
void aom_invalidate_pyramid(ImagePyramid *pyr) {
  if (pyr) {
#if CONFIG_MULTITHREAD
    pthread_mutex_lock(&pyr->mutex);
#endif  // CONFIG_MULTITHREAD
    pyr->filled_levels = 0;
#if CONFIG_MULTITHREAD
    pthread_mutex_unlock(&pyr->mutex);
#endif  // CONFIG_MULTITHREAD
  }
}

// Release the memory associated with a pyramid
void aom_free_pyramid(ImagePyramid *pyr) {
  if (pyr) {
#if CONFIG_MULTITHREAD
    pthread_mutex_destroy(&pyr->mutex);
#endif  // CONFIG_MULTITHREAD
    aom_free(pyr->buffer_alloc);
    aom_free(pyr->layers);
    aom_free(pyr);
  }
}