Codebase list libde265 / upstream/1.0.8+git20210223.7d5aeb5 acceleration-speed / dct.cc
upstream/1.0.8+git20210223.7d5aeb5

Tree @upstream/1.0.8+git20210223.7d5aeb5 (Download .tar.gz)

dct.cc @upstream/1.0.8+git20210223.7d5aeb5raw · history · blame

/*
 * H.265 video codec.
 * Copyright (c) 2015 struktur AG, Dirk Farin <farin@struktur.de>
 *
 * This file is part of libde265.
 *
 * libde265 is free software: you can redistribute it and/or modify
 * it under the terms of the GNU General Public License as published by
 * the Free Software Foundation, either version 3 of the License, or
 * (at your option) any later version.
 *
 * libde265 is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 * GNU General Public License for more details.
 *
 * You should have received a copy of the GNU General Public License
 * along with libde265.  If not, see <http://www.gnu.org/licenses/>.
 */

#include "dct.h"


// --- FDCT ---

void DSPFunc_FDCT_Base::dump(int x,int y)
{
  printf("-> ");
  for (int yy=0;yy<blkSize;yy++)
    for (int xx=0;xx<blkSize;xx++)
      printf("%d ", *(residuals+x+xx+(y+yy)*stride));
  printf("\n");

  printf("   ");
  for (int x=0;x<blkSize*blkSize;x++)
    printf("%d ", coeffs[x]);
  printf("\n");

  int32_t out[32*32];
  transform_idct_8x8_fallback(out, coeffs, 20-8, 15);

  printf("   ");
  for (int x=0;x<blkSize*blkSize;x++)
    printf("%d ", out[x]);
  printf("\n");
}


bool DSPFunc_FDCT_Base::compareToReferenceImplementation()
{
  DSPFunc_FDCT_Base* refImpl = dynamic_cast<DSPFunc_FDCT_Base*>(referenceImplementation());

  for (int i=0;i<blkSize*blkSize;i++)
    if (coeffs[i] != refImpl->coeffs[i])
      return false;

  return true;
}


bool DSPFunc_FDCT_Base::prepareNextImage(std::shared_ptr<const de265_image> img)
{
  if (!curr_image) {
    curr_image = img;
    return false;
  }

  prev_image = curr_image;
  curr_image = img;

  int w = curr_image->get_width(0);
  int h = curr_image->get_height(0);

  if (residuals==NULL) {
    int align=16;
    stride = (w+align-1)/align*align;
    residuals = new int16_t[stride*h];
  }

  int cstride = curr_image->get_luma_stride();
  int pstride = prev_image->get_luma_stride();
  const uint8_t* curr = curr_image->get_image_plane_at_pos(0,0,0);
  const uint8_t* prev = prev_image->get_image_plane_at_pos(0,0,0);

  for (int y=0;y<h;y++)
    for (int x=0;x<w;x++) {
      residuals[y*stride+x] = curr[y*cstride+x] - prev[y*pstride+x];
    }

  return true;
}


// --- IDCT ---

bool DSPFunc_IDCT_Base::compareToReferenceImplementation()
{
  DSPFunc_IDCT_Base* refImpl = dynamic_cast<DSPFunc_IDCT_Base*>(referenceImplementation());

  for (int i=0;i<blkSize*blkSize;i++)
    if (out[i] != refImpl->out[i])
      return false;

  return true;
}


bool DSPFunc_IDCT_Base::prepareNextImage(std::shared_ptr<const de265_image> img)
{
  // --- generate fake coefficients ---
  // difference between two frames

  if (!curr_image) {
    curr_image = img;
    return false;
  }

  prev_image = curr_image;
  curr_image = img;

  int w = curr_image->get_width(0);
  int h = curr_image->get_height(0);

  int align = blkSize;
  width = (w+align-1) / align * align;

  blksPerRow = w/blkSize;

  if (coeffs==NULL) {
    coeffs = new int16_t[width*h];
  }

  int cstride = curr_image->get_luma_stride();
  int pstride = prev_image->get_luma_stride();
  const uint8_t* curr = curr_image->get_image_plane_at_pos(0,0,0);
  const uint8_t* prev = prev_image->get_image_plane_at_pos(0,0,0);

  for (int y=0;y<h;y++)
    for (int x=0;x<w;x++) {
      coeffs[y*w+x] = curr[y*cstride+x] - prev[y*pstride+x];
    }

  return true;
}