/***************************************************************************** * Copyright (C) 2013-2020 MulticoreWare, Inc * * Authors: Deepthi Nandakumar * * This program is free software; you can redistribute it and/or modify * it under the terms of the GNU General Public License as published by * the Free Software Foundation; either version 2 of the License, or * (at your option) any later version. * * This program is distributed in the hope that it will be useful, * but WITHOUT ANY WARRANTY; without even the implied warranty of * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the * GNU General Public License for more details. * * You should have received a copy of the GNU General Public License * along with this program; if not, write to the Free Software * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02111, USA. * * This program is also available under a commercial proprietary license. * For more information, contact us at license @ x265.com *****************************************************************************/ #include "common.h" #include "yuv.h" #include "shortyuv.h" #include "primitives.h" #include "x265.h" using namespace X265_NS; ShortYuv::ShortYuv() { m_buf[0] = NULL; m_buf[1] = NULL; m_buf[2] = NULL; } bool ShortYuv::create(uint32_t size, int csp) { m_csp = csp; m_size = size; m_hChromaShift = CHROMA_H_SHIFT(csp); m_vChromaShift = CHROMA_V_SHIFT(csp); size_t sizeL = size * size; if (csp != X265_CSP_I400) { m_csize = size >> m_hChromaShift; size_t sizeC = sizeL >> (m_hChromaShift + m_vChromaShift); X265_CHECK((sizeC & 15) == 0, "invalid size"); CHECKED_MALLOC(m_buf[0], int16_t, sizeL + sizeC * 2); m_buf[1] = m_buf[0] + sizeL; m_buf[2] = m_buf[0] + sizeL + sizeC; } else { CHECKED_MALLOC(m_buf[0], int16_t, sizeL); m_buf[1] = m_buf[2] = NULL; } return true; fail: return false; } void ShortYuv::destroy() { X265_FREE(m_buf[0]); } void ShortYuv::clear() { memset(m_buf[0], 0, (m_size * m_size) * sizeof(int16_t)); memset(m_buf[1], 0, (m_csize * m_csize) * sizeof(int16_t)); memset(m_buf[2], 0, (m_csize * m_csize) * sizeof(int16_t)); } void ShortYuv::subtract(const Yuv& srcYuv0, const Yuv& srcYuv1, uint32_t log2Size, int picCsp) { const int sizeIdx = log2Size - 2; primitives.cu[sizeIdx].sub_ps(m_buf[0], m_size, srcYuv0.m_buf[0], srcYuv1.m_buf[0], srcYuv0.m_size, srcYuv1.m_size); if (m_csp != X265_CSP_I400 && picCsp != X265_CSP_I400) { primitives.chroma[m_csp].cu[sizeIdx].sub_ps(m_buf[1], m_csize, srcYuv0.m_buf[1], srcYuv1.m_buf[1], srcYuv0.m_csize, srcYuv1.m_csize); primitives.chroma[m_csp].cu[sizeIdx].sub_ps(m_buf[2], m_csize, srcYuv0.m_buf[2], srcYuv1.m_buf[2], srcYuv0.m_csize, srcYuv1.m_csize); } } void ShortYuv::copyPartToPartLuma(ShortYuv& dstYuv, uint32_t absPartIdx, uint32_t log2Size) const { const int16_t* src = getLumaAddr(absPartIdx); int16_t* dst = dstYuv.getLumaAddr(absPartIdx); primitives.cu[log2Size - 2].copy_ss(dst, dstYuv.m_size, src, m_size); } void ShortYuv::copyPartToPartLuma(Yuv& dstYuv, uint32_t absPartIdx, uint32_t log2Size) const { const int16_t* src = getLumaAddr(absPartIdx); pixel* dst = dstYuv.getLumaAddr(absPartIdx); primitives.cu[log2Size - 2].copy_sp(dst, dstYuv.m_size, src, m_size); } void ShortYuv::copyPartToPartChroma(ShortYuv& dstYuv, uint32_t absPartIdx, uint32_t log2SizeL) const { int part = partitionFromLog2Size(log2SizeL); const int16_t* srcU = getCbAddr(absPartIdx); const int16_t* srcV = getCrAddr(absPartIdx); int16_t* dstU = dstYuv.getCbAddr(absPartIdx); int16_t* dstV = dstYuv.getCrAddr(absPartIdx); primitives.chroma[m_csp].cu[part].copy_ss(dstU, dstYuv.m_csize, srcU, m_csize); primitives.chroma[m_csp].cu[part].copy_ss(dstV, dstYuv.m_csize, srcV, m_csize); } void ShortYuv::copyPartToPartChroma(Yuv& dstYuv, uint32_t absPartIdx, uint32_t log2SizeL) const { int part = partitionFromLog2Size(log2SizeL); const int16_t* srcU = getCbAddr(absPartIdx); const int16_t* srcV = getCrAddr(absPartIdx); pixel* dstU = dstYuv.getCbAddr(absPartIdx); pixel* dstV = dstYuv.getCrAddr(absPartIdx); primitives.chroma[m_csp].cu[part].copy_sp(dstU, dstYuv.m_csize, srcU, m_csize); primitives.chroma[m_csp].cu[part].copy_sp(dstV, dstYuv.m_csize, srcV, m_csize); }