Skip to content
Snippets Groups Projects
IntraSearch.cpp 322 KiB
Newer Older
  • Learn to ignore specific revisions
  • /* The copyright in this software is being made available under the BSD
     * License, included below. This software may be subject to other third party
     * and contributor rights, including patent rights, and no such rights are
     * granted under this license.
     *
    
     * Copyright (c) 2010-2022, ITU/ISO/IEC
    
     * All rights reserved.
     *
     * Redistribution and use in source and binary forms, with or without
     * modification, are permitted provided that the following conditions are met:
     *
     *  * Redistributions of source code must retain the above copyright notice,
     *    this list of conditions and the following disclaimer.
     *  * Redistributions in binary form must reproduce the above copyright notice,
     *    this list of conditions and the following disclaimer in the documentation
     *    and/or other materials provided with the distribution.
     *  * Neither the name of the ITU/ISO/IEC nor the names of its contributors may
     *    be used to endorse or promote products derived from this software without
     *    specific prior written permission.
     *
     * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
     * AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
     * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
     * ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR CONTRIBUTORS
     * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
     * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
     * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
     * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
     * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
     * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF
     * THE POSSIBILITY OF SUCH DAMAGE.
     */
    
    /** \file     EncSearch.cpp
     *  \brief    encoder intra search class
     */
    
    #include "IntraSearch.h"
    
    #include "EncModeCtrl.h"
    
    #include "CommonLib/CommonDef.h"
    #include "CommonLib/Rom.h"
    #include "CommonLib/Picture.h"
    #include "CommonLib/UnitTools.h"
    
    #if JVET_V0094_BILATERAL_FILTER || JVET_X0071_CHROMA_BILATERAL_FILTER
    
    Vadim Seregin's avatar
    Vadim Seregin committed
    #include "CommonLib/BilateralFilter.h"
    #endif
    
    
    #include "CommonLib/dtrace_next.h"
    #include "CommonLib/dtrace_buffer.h"
    
    #include <math.h>
    #include <limits>
     //! \ingroup EncoderLib
     //! \{
    
    IntraSearch::IntraSearch()
      : m_pSplitCS      (nullptr)
      , m_pFullCS       (nullptr)
      , m_pBestCS       (nullptr)
      , m_pcEncCfg      (nullptr)
    
    #if JVET_V0094_BILATERAL_FILTER || JVET_X0071_CHROMA_BILATERAL_FILTER
    
    Vadim Seregin's avatar
    Vadim Seregin committed
      , m_bilateralFilter(nullptr)
    #endif
    
      , m_pcTrQuant     (nullptr)
      , m_pcRdCost      (nullptr)
    
    Taoran Lu's avatar
    Taoran Lu committed
      , m_pcReshape     (nullptr)
    
      , m_CABACEstimator(nullptr)
      , m_CtxCache      (nullptr)
      , m_isInitialized (false)
    {
      for( uint32_t ch = 0; ch < MAX_NUM_TBLOCKS; ch++ )
      {
        m_pSharedPredTransformSkip[ch] = nullptr;
      }
    
    fan wang's avatar
    fan wang committed
    #if JVET_AB0155_SGPM
      for (int i = 0; i < NUM_LUMA_MODE; i++)
      {
        m_intraPredBuf[i] = nullptr;
      }
      for (int i = 0; i < SGPM_NUM; i++)
      {
        m_sgpmPredBuf[i] = nullptr;
      }
    #endif
    
    
      m_truncBinBits = nullptr;
      m_escapeNumBins = nullptr;
      m_minErrorIndexMap = nullptr;
      for (unsigned i = 0; i < (MAXPLTSIZE + 1); i++)
      {
        m_indexError[i] = nullptr;
      }
      for (unsigned i = 0; i < NUM_TRELLIS_STATE; i++)
      {
        m_statePtRDOQ[i] = nullptr;
      }
    
    }
    
    
    void IntraSearch::destroy()
    {
      CHECK( !m_isInitialized, "Not initialized" );
    
      if( m_pcEncCfg )
      {
    
    Karsten Suehring's avatar
    Karsten Suehring committed
        const uint32_t uiNumLayersToAllocateSplit = 1;
        const uint32_t uiNumLayersToAllocateFull  = 1;
    
        const int uiNumSaveLayersToAllocate = 2;
    
        for( uint32_t layer = 0; layer < uiNumSaveLayersToAllocate; layer++ )
        {
          m_pSaveCS[layer]->destroy();
          delete m_pSaveCS[layer];
        }
    
        uint32_t numWidths  = gp_sizeIdxInfo->numWidths();
        uint32_t numHeights = gp_sizeIdxInfo->numHeights();
    
        for( uint32_t width = 0; width < numWidths; width++ )
        {
          for( uint32_t height = 0; height < numHeights; height++ )
          {
    
    Karsten Suehring's avatar
    Karsten Suehring committed
            if( gp_sizeIdxInfo->isCuSize( gp_sizeIdxInfo->sizeFrom( width ) ) && gp_sizeIdxInfo->isCuSize( gp_sizeIdxInfo->sizeFrom( height ) ) )
    
            {
              for( uint32_t layer = 0; layer < uiNumLayersToAllocateSplit; layer++ )
              {
                m_pSplitCS[width][height][layer]->destroy();
    
                delete m_pSplitCS[width][height][layer];
              }
    
              for( uint32_t layer = 0; layer < uiNumLayersToAllocateFull; layer++ )
              {
                m_pFullCS[width][height][layer]->destroy();
    
                delete m_pFullCS[width][height][layer];
              }
    
              delete[] m_pSplitCS[width][height];
              delete[] m_pFullCS [width][height];
    
              m_pBestCS[width][height]->destroy();
              m_pTempCS[width][height]->destroy();
    
              delete m_pTempCS[width][height];
              delete m_pBestCS[width][height];
            }
          }
    
          delete[] m_pSplitCS[width];
          delete[] m_pFullCS [width];
    
          delete[] m_pTempCS[width];
          delete[] m_pBestCS[width];
        }
    
        delete[] m_pSplitCS;
        delete[] m_pFullCS;
    
        delete[] m_pBestCS;
        delete[] m_pTempCS;
    
        delete[] m_pSaveCS;
      }
    
      m_pSplitCS = m_pFullCS = nullptr;
    
      m_pBestCS = m_pTempCS = nullptr;
    
      m_pSaveCS = nullptr;
    
      for( uint32_t ch = 0; ch < MAX_NUM_TBLOCKS; ch++ )
      {
        delete[] m_pSharedPredTransformSkip[ch];
        m_pSharedPredTransformSkip[ch] = nullptr;
      }
    
    
    #if JVET_AB0143_CCCM_TS
    
    Vadim Seregin's avatar
    Vadim Seregin committed
      for (uint32_t cccmIdx = 0; cccmIdx < CCCM_NUM_MODES; cccmIdx++)
    
      {
        m_cccmStorage[cccmIdx].destroy();
      }
    #endif
    
    
    Taoran Lu's avatar
    Taoran Lu committed
      m_tmpStorageLCU.destroy();
    
      m_colorTransResiBuf.destroy();
    
    fan wang's avatar
    fan wang committed
      
    #if JVET_AB0155_SGPM
      for (int i = 0; i < NUM_LUMA_MODE; i++)
      {
        delete[] m_intraPredBuf[i];
        m_intraPredBuf[i] = nullptr;
      }
    
      for (int i = 0; i < SGPM_NUM; i++)
      {
        delete[] m_sgpmPredBuf[i];
        m_sgpmPredBuf[i] = nullptr;
      }
    #endif
    
    
      if (m_truncBinBits != nullptr)
      {
        for (unsigned i = 0; i < m_symbolSize; i++)
        {
          delete[] m_truncBinBits[i];
          m_truncBinBits[i] = nullptr;
        }
        delete[] m_truncBinBits;
        m_truncBinBits = nullptr;
      }
      if (m_escapeNumBins != nullptr)
      {
        delete[] m_escapeNumBins;
        m_escapeNumBins = nullptr;
      }
      if (m_indexError[0] != nullptr)
      {
        for (unsigned i = 0; i < (MAXPLTSIZE + 1); i++)
        {
          delete[] m_indexError[i];
          m_indexError[i] = nullptr;
        }
      }
      if (m_minErrorIndexMap != nullptr)
      {
        delete[] m_minErrorIndexMap;
        m_minErrorIndexMap = nullptr;
      }
      if (m_statePtRDOQ[0] != nullptr)
      {
        for (unsigned i = 0; i < NUM_TRELLIS_STATE; i++)
        {
          delete[] m_statePtRDOQ[i];
          m_statePtRDOQ[i] = nullptr;
        }
      }
    
    }
    
    IntraSearch::~IntraSearch()
    {
      if( m_isInitialized )
      {
        destroy();
      }
    }
    
    void IntraSearch::init( EncCfg*        pcEncCfg,
    
    #if JVET_V0094_BILATERAL_FILTER || JVET_X0071_CHROMA_BILATERAL_FILTER
    
    Vadim Seregin's avatar
    Vadim Seregin committed
                           BilateralFilter* bilateralFilter,
    #endif
    
                            TrQuant*       pcTrQuant,
                            RdCost*        pcRdCost,
                            CABACWriter*   CABACEstimator,
                            CtxCache*      ctxCache,
                            const uint32_t     maxCUWidth,
                            const uint32_t     maxCUHeight,
                            const uint32_t     maxTotalCUDepth
    
    Taoran Lu's avatar
    Taoran Lu committed
                           , EncReshape*   pcReshape
    
                           , const unsigned bitDepthY
    
    )
    {
      CHECK(m_isInitialized, "Already initialized");
      m_pcEncCfg                     = pcEncCfg;
    
    #if JVET_V0094_BILATERAL_FILTER || JVET_X0071_CHROMA_BILATERAL_FILTER
    
    Vadim Seregin's avatar
    Vadim Seregin committed
      m_bilateralFilter              = bilateralFilter;
    #endif
    
      m_pcTrQuant                    = pcTrQuant;
      m_pcRdCost                     = pcRdCost;
      m_CABACEstimator               = CABACEstimator;
      m_CtxCache                     = ctxCache;
    
    Taoran Lu's avatar
    Taoran Lu committed
      m_pcReshape                    = pcReshape;
    
    
      const ChromaFormat cform = pcEncCfg->getChromaFormatIdc();
    
      IntraPrediction::init( cform, pcEncCfg->getBitDepth( CHANNEL_TYPE_LUMA ) );
    
    Taoran Lu's avatar
    Taoran Lu committed
      m_tmpStorageLCU.create(UnitArea(cform, Area(0, 0, MAX_CU_SIZE, MAX_CU_SIZE)));
    
      m_colorTransResiBuf.create(UnitArea(cform, Area(0, 0, MAX_CU_SIZE, MAX_CU_SIZE)));
    
    #if JVET_AB0143_CCCM_TS
    
    Vadim Seregin's avatar
    Vadim Seregin committed
      for (uint32_t cccmIdx = 0; cccmIdx < CCCM_NUM_MODES; cccmIdx++)
    
      {
        m_cccmStorage[cccmIdx].create(UnitArea(cform, Area(0, 0, MAX_CU_SIZE, MAX_CU_SIZE)));
      }
    #endif
    
    fan wang's avatar
    fan wang committed
    #if JVET_AB0155_SGPM
      for (int i = 0; i < NUM_LUMA_MODE; i++)
      {
        m_intraPredBuf[i] = new Pel[GEO_MAX_CU_SIZE_EX * GEO_MAX_CU_SIZE_EX];
      }
      for (int i = 0; i < SGPM_NUM; i++)
      {
        m_sgpmPredBuf[i] = new Pel[GEO_MAX_CU_SIZE_EX * GEO_MAX_CU_SIZE_EX];
      }
    #endif
    
      for( uint32_t ch = 0; ch < MAX_NUM_TBLOCKS; ch++ )
      {
        m_pSharedPredTransformSkip[ch] = new Pel[MAX_CU_SIZE * MAX_CU_SIZE];
      }
    
      uint32_t numWidths  = gp_sizeIdxInfo->numWidths();
      uint32_t numHeights = gp_sizeIdxInfo->numHeights();
    
    
    Karsten Suehring's avatar
    Karsten Suehring committed
      const uint32_t uiNumLayersToAllocateSplit = 1;
      const uint32_t uiNumLayersToAllocateFull  = 1;
    
    
      m_pBestCS = new CodingStructure**[numWidths];
      m_pTempCS = new CodingStructure**[numWidths];
    
      m_pFullCS  = new CodingStructure***[numWidths];
      m_pSplitCS = new CodingStructure***[numWidths];
    
      for( uint32_t width = 0; width < numWidths; width++ )
      {
        m_pBestCS[width] = new CodingStructure*[numHeights];
        m_pTempCS[width] = new CodingStructure*[numHeights];
    
        m_pFullCS [width] = new CodingStructure**[numHeights];
        m_pSplitCS[width] = new CodingStructure**[numHeights];
    
        for( uint32_t height = 0; height < numHeights; height++ )
        {
    
    Karsten Suehring's avatar
    Karsten Suehring committed
          if(  gp_sizeIdxInfo->isCuSize( gp_sizeIdxInfo->sizeFrom( width ) ) && gp_sizeIdxInfo->isCuSize( gp_sizeIdxInfo->sizeFrom( height ) ) )
    
          {
            m_pBestCS[width][height] = new CodingStructure( m_unitCache.cuCache, m_unitCache.puCache, m_unitCache.tuCache );
            m_pTempCS[width][height] = new CodingStructure( m_unitCache.cuCache, m_unitCache.puCache, m_unitCache.tuCache );
    
    
    Seungwook Hong's avatar
    Seungwook Hong committed
    #if JVET_Z0118_GDR
            m_pBestCS[width][height]->create(m_pcEncCfg->getChromaFormatIdc(), Area(0, 0, gp_sizeIdxInfo->sizeFrom(width), gp_sizeIdxInfo->sizeFrom(height)), false, (bool)pcEncCfg->getPLTMode(), pcEncCfg->getGdrEnabled());
            m_pTempCS[width][height]->create(m_pcEncCfg->getChromaFormatIdc(), Area(0, 0, gp_sizeIdxInfo->sizeFrom(width), gp_sizeIdxInfo->sizeFrom(height)), false, (bool)pcEncCfg->getPLTMode(), pcEncCfg->getGdrEnabled());
    #else
    
            m_pBestCS[width][height]->create(m_pcEncCfg->getChromaFormatIdc(), Area(0, 0, gp_sizeIdxInfo->sizeFrom(width), gp_sizeIdxInfo->sizeFrom(height)), false, (bool)pcEncCfg->getPLTMode());
            m_pTempCS[width][height]->create(m_pcEncCfg->getChromaFormatIdc(), Area(0, 0, gp_sizeIdxInfo->sizeFrom(width), gp_sizeIdxInfo->sizeFrom(height)), false, (bool)pcEncCfg->getPLTMode());
    
    Seungwook Hong's avatar
    Seungwook Hong committed
    #endif
    
            m_pFullCS [width][height] = new CodingStructure*[uiNumLayersToAllocateFull];
            m_pSplitCS[width][height] = new CodingStructure*[uiNumLayersToAllocateSplit];
    
            for( uint32_t layer = 0; layer < uiNumLayersToAllocateFull; layer++ )
            {
              m_pFullCS [width][height][layer] = new CodingStructure( m_unitCache.cuCache, m_unitCache.puCache, m_unitCache.tuCache );
    
    
    Seungwook Hong's avatar
    Seungwook Hong committed
    #if JVET_Z0118_GDR
              m_pFullCS[width][height][layer]->create(m_pcEncCfg->getChromaFormatIdc(), Area(0, 0, gp_sizeIdxInfo->sizeFrom(width), gp_sizeIdxInfo->sizeFrom(height)), false, (bool)pcEncCfg->getPLTMode(), pcEncCfg->getGdrEnabled());
    #else
    
              m_pFullCS[width][height][layer]->create(m_pcEncCfg->getChromaFormatIdc(), Area(0, 0, gp_sizeIdxInfo->sizeFrom(width), gp_sizeIdxInfo->sizeFrom(height)), false, (bool)pcEncCfg->getPLTMode());
    
    Seungwook Hong's avatar
    Seungwook Hong committed
    #endif
    
            }
    
            for( uint32_t layer = 0; layer < uiNumLayersToAllocateSplit; layer++ )
            {
              m_pSplitCS[width][height][layer] = new CodingStructure( m_unitCache.cuCache, m_unitCache.puCache, m_unitCache.tuCache );
    
    Seungwook Hong's avatar
    Seungwook Hong committed
    #if JVET_Z0118_GDR
              m_pSplitCS[width][height][layer]->create(m_pcEncCfg->getChromaFormatIdc(), Area(0, 0, gp_sizeIdxInfo->sizeFrom(width), gp_sizeIdxInfo->sizeFrom(height)), false, (bool)pcEncCfg->getPLTMode(), pcEncCfg->getGdrEnabled());
    #else
    
              m_pSplitCS[width][height][layer]->create(m_pcEncCfg->getChromaFormatIdc(), Area(0, 0, gp_sizeIdxInfo->sizeFrom(width), gp_sizeIdxInfo->sizeFrom(height)), false, (bool)pcEncCfg->getPLTMode());
    
    Seungwook Hong's avatar
    Seungwook Hong committed
    #endif
    
            }
          }
          else
          {
            m_pBestCS[width][height] = nullptr;
            m_pTempCS[width][height] = nullptr;
    
            m_pFullCS [width][height] = nullptr;
            m_pSplitCS[width][height] = nullptr;
          }
        }
      }
    
      const int uiNumSaveLayersToAllocate = 2;
    
      m_pSaveCS = new CodingStructure*[uiNumSaveLayersToAllocate];
    
      for( uint32_t depth = 0; depth < uiNumSaveLayersToAllocate; depth++ )
      {
        m_pSaveCS[depth] = new CodingStructure( m_unitCache.cuCache, m_unitCache.puCache, m_unitCache.tuCache );
    
    Seungwook Hong's avatar
    Seungwook Hong committed
    #if JVET_Z0118_GDR
        m_pSaveCS[depth]->create(UnitArea(cform, Area(0, 0, maxCUWidth, maxCUHeight)), false, (bool)pcEncCfg->getPLTMode(), pcEncCfg->getGdrEnabled());
    #else
    
        m_pSaveCS[depth]->create(UnitArea(cform, Area(0, 0, maxCUWidth, maxCUHeight)), false, (bool)pcEncCfg->getPLTMode());
    
    Seungwook Hong's avatar
    Seungwook Hong committed
    #endif
    
      if (pcEncCfg->getPLTMode())
    
        m_symbolSize = (1 << bitDepthY); // pixel values are within [0, SymbolSize-1] with size SymbolSize
        if (m_truncBinBits == nullptr)
    
          m_truncBinBits = new uint16_t*[m_symbolSize];
          for (unsigned i = 0; i < m_symbolSize; i++)
          {
            m_truncBinBits[i] = new uint16_t[m_symbolSize + 1];
          }
    
        if (m_escapeNumBins == nullptr)
    
          m_escapeNumBins = new uint16_t[m_symbolSize];
    
        initTBCTable(bitDepthY);
        if (m_indexError[0] == nullptr)
    
          for (unsigned i = 0; i < (MAXPLTSIZE + 1); i++)
          {
            m_indexError[i] = new double[MAX_CU_BLKSIZE_PLT*MAX_CU_BLKSIZE_PLT];
          }
        }
        if (m_minErrorIndexMap == nullptr)
        {
          m_minErrorIndexMap = new uint8_t[MAX_CU_BLKSIZE_PLT*MAX_CU_BLKSIZE_PLT];
        }
        if (m_statePtRDOQ[0] == nullptr)
        {
          for (unsigned i = 0; i < NUM_TRELLIS_STATE; i++)
          {
            m_statePtRDOQ[i] = new uint8_t[MAX_CU_BLKSIZE_PLT*MAX_CU_BLKSIZE_PLT];
          }
    
    #if INTRA_TRANS_ENC_OPT
      m_skipTimdLfnstMtsPass = false;
    #endif
    
    }
    
    
    //////////////////////////////////////////////////////////////////////////
    // INTRA PREDICTION
    //////////////////////////////////////////////////////////////////////////
    
    Vadim Seregin's avatar
    Vadim Seregin committed
    #if !INTRA_RM_SMALL_BLOCK_SIZE_CONSTRAINTS
    
    static constexpr double COST_UNKNOWN = -65536.0;
    
    
    double IntraSearch::findInterCUCost( CodingUnit &cu )
    {
      if( cu.isConsIntra() && !cu.slice->isIntra() )
      {
        //search corresponding inter CU cost
        for( int i = 0; i < m_numCuInSCIPU; i++ )
        {
          if( cu.lumaPos() == m_cuAreaInSCIPU[i].pos() && cu.lumaSize() == m_cuAreaInSCIPU[i].size() )
          {
            return m_cuCostInSCIPU[i];
          }
        }
      }
      return COST_UNKNOWN;
    }
    
    Vadim Seregin's avatar
    Vadim Seregin committed
    #endif
    
    #if JVET_W0103_INTRA_MTS
    bool IntraSearch::testISPforCurrCU(const CodingUnit &cu)
    {
      CodingStructure       &cs = *cu.cs;
      auto &pu = *cu.firstPU;
      const CompArea &area = pu.Y();
      PelBuf piOrg = cs.getOrgBuf(area);
    
      Pel* pOrg = piOrg.buf;
      int uiWidth = area.width;
      int uiHeight = area.height;
      int iStride = piOrg.stride;
      int Gsum = 0;
      int nPix = (uiWidth - 2) * (uiHeight - 2);
      for (int y = 1; y < (uiHeight - 1); y++)
      {
        for (int x = 1; x < (uiWidth - 1); x++)
        {
          const Pel *p = pOrg + y * iStride + x;
    
          int iDy = p[-iStride - 1] + 2 * p[-1] + p[iStride - 1] - p[-iStride + 1] - 2 * p[+1] - p[iStride + 1];
          int iDx = p[iStride - 1] + 2 * p[iStride] + p[iStride + 1] - p[-iStride - 1] - 2 * p[-iStride] - p[-iStride + 1];
    
          if (iDy == 0 && iDx == 0)
            continue;
    
          int iAmp = (int)(abs(iDx) + abs(iDy));
          Gsum += iAmp;
        }
      }
      Gsum = (Gsum + (nPix >> 1)) / nPix;
    
      bool testISP = true;
      CHECK(m_numModesISPRDO != -1, "m_numModesISPRDO!=-1");
    
      m_numModesISPRDO = (Gsum < 50 && uiWidth >= 16 && uiHeight >= 16) ? 1 : 2;
      return testISP;
    }
    #endif
    
    bool IntraSearch::estIntraPredLumaQT(CodingUnit &cu, Partitioner &partitioner, const double bestCostSoFar, bool mtsCheckRangeFlag, int mtsFirstCheckId, int mtsLastCheckId, bool moreProbMTSIdxFirst, CodingStructure* bestCS)
    
    {
      CodingStructure       &cs            = *cu.cs;
      const SPS             &sps           = *cs.sps;
    
      const uint32_t             uiWidthBit    = floorLog2(partitioner.currArea().lwidth() );
      const uint32_t             uiHeightBit   =                   floorLog2(partitioner.currArea().lheight());
    
    
      // Lambda calculation at equivalent Qp of 4 is recommended because at that Qp, the quantization divisor is 1.
    
      const double sqrtLambdaForFirstPass = m_pcRdCost->getMotionLambda( ) * FRAC_BITS_SCALE;
    
    
      //===== loop over partitions =====
    
      const TempCtx ctxStart          ( m_CtxCache, m_CABACEstimator->getCtx() );
    
      const TempCtx ctxStartMipFlag    ( m_CtxCache, SubCtx( Ctx::MipFlag,          m_CABACEstimator->getCtx() ) );
    
    Vadim Seregin's avatar
    Vadim Seregin committed
    #if JVET_V0130_INTRA_TMP
    
    Vadim Seregin's avatar
    Vadim Seregin committed
      const TempCtx ctxStartTpmFlag(m_CtxCache, SubCtx(Ctx::TmpFlag, m_CABACEstimator->getCtx()));
    
    Keming Cao's avatar
    Keming Cao committed
    #endif
    #if JVET_W0123_TIMD_FUSION
      const TempCtx ctxStartTimdFlag   ( m_CtxCache, SubCtx( Ctx::TimdFlag,      m_CABACEstimator->getCtx() ) );
    
    Vadim Seregin's avatar
    Vadim Seregin committed
    #endif
    
    fan wang's avatar
    fan wang committed
    #if JVET_AB0155_SGPM
      const TempCtx ctxStartSgpmFlag(m_CtxCache, SubCtx(Ctx::SgpmFlag, m_CABACEstimator->getCtx()));
    #endif
    
    
      const TempCtx ctxStartIspMode    ( m_CtxCache, SubCtx( Ctx::ISPMode,          m_CABACEstimator->getCtx() ) );
    
    Vadim Seregin's avatar
    Vadim Seregin committed
    #if SECONDARY_MPM
      const TempCtx ctxStartMPMIdxFlag(m_CtxCache, SubCtx(Ctx::IntraLumaMPMIdx, m_CABACEstimator->getCtx()));
    #endif
    
      const TempCtx ctxStartPlanarFlag ( m_CtxCache, SubCtx( Ctx::IntraLumaPlanarFlag, m_CABACEstimator->getCtx() ) );
    
    Frank Bossen's avatar
    Frank Bossen committed
      const TempCtx ctxStartIntraMode(m_CtxCache, SubCtx(Ctx::IntraLumaMpmFlag, m_CABACEstimator->getCtx()));
    
    Vadim Seregin's avatar
    Vadim Seregin committed
    #if SECONDARY_MPM
      const TempCtx ctxStartIntraMode2(m_CtxCache, SubCtx(Ctx::IntraLumaSecondMpmFlag, m_CABACEstimator->getCtx()));
    #endif
    
    Paul Keydel's avatar
    Paul Keydel committed
      const TempCtx ctxStartMrlIdx      ( m_CtxCache, SubCtx( Ctx::MultiRefLineIdx,        m_CABACEstimator->getCtx() ) );
    
    #if JVET_AB0157_TMRL
      const TempCtx ctxStartTmrlDerive    (m_CtxCache, SubCtx(Ctx::TmrlDerive, m_CABACEstimator->getCtx()));
    #endif
    
      // variables for saving fast intra modes scan results across multiple LFNST passes
      bool LFNSTLoadFlag = sps.getUseLFNST() && cu.lfnstIdx != 0;
      bool LFNSTSaveFlag = sps.getUseLFNST() && cu.lfnstIdx == 0;
    
      LFNSTSaveFlag &= sps.getUseIntraMTS() ? cu.mtsFlag == 0 : true;
    
    fan wang's avatar
    fan wang committed
    #if JVET_AB0155_SGPM
    
    fan wang's avatar
    fan wang committed
      bool SGPMSaveFlag = (cu.lfnstIdx == 0 && cu.mtsFlag == 0);
    
    fan wang's avatar
    fan wang committed
    #endif
    
    
      const uint32_t lfnstIdx = cu.lfnstIdx;
    
    Vadim Seregin's avatar
    Vadim Seregin committed
    #if !INTRA_RM_SMALL_BLOCK_SIZE_CONSTRAINTS
    
      double costInterCU = findInterCUCost( cu );
    
    Vadim Seregin's avatar
    Vadim Seregin committed
    #endif
    
      const int width  = partitioner.currArea().lwidth();
      const int height = partitioner.currArea().lheight();
    
      // Marking MTS usage for faster MTS
      // 0: MTS is either not applicable for current CU (cuWidth > MTS_INTRA_MAX_CU_SIZE or cuHeight > MTS_INTRA_MAX_CU_SIZE), not active in the config file or the fast decision algorithm is not used in this case
      // 1: MTS fast algorithm can be applied for the current CU, and the DCT2 is being checked
      // 2: MTS is being checked for current CU. Stored results of DCT2 can be utilized for speedup
      uint8_t mtsUsageFlag = 0;
      const int maxSizeEMT = MTS_INTRA_MAX_CU_SIZE;
      if( width <= maxSizeEMT && height <= maxSizeEMT && sps.getUseIntraMTS() )
      {
        mtsUsageFlag = ( sps.getUseLFNST() && cu.mtsFlag == 1 ) ? 2 : 1;
      }
    
      if( width * height < 64 && !m_pcEncCfg->getUseFastLFNST() )
      {
        mtsUsageFlag = 0;
      }
    
    #if JVET_W0103_INTRA_MTS
      if (!cu.mtsFlag && !cu.lfnstIdx)
      {
        m_globalBestCostStore = MAX_DOUBLE;
        m_globalBestCostValid = false;
        if (bestCS->getCU(partitioner.chType) != NULL && bestCS->getCU(partitioner.chType)->predMode != MODE_INTRA && bestCostSoFar != MAX_DOUBLE)
        {
          m_globalBestCostStore = bestCostSoFar;
          m_globalBestCostValid = true;
        }
    
    #if JVET_Y0142_ADAPT_INTRA_MTS
        m_modesForMTS.clear();
        m_modesCoeffAbsSumDCT2.clear();
    #endif
    
      const bool colorTransformIsEnabled = sps.getUseColorTrans() && !CS::isDualITree(cs);
      const bool isFirstColorSpace       = colorTransformIsEnabled && ((m_pcEncCfg->getRGBFormatFlag() && cu.colorTransform) || (!m_pcEncCfg->getRGBFormatFlag() && !cu.colorTransform));
      const bool isSecondColorSpace      = colorTransformIsEnabled && ((m_pcEncCfg->getRGBFormatFlag() && !cu.colorTransform) || (!m_pcEncCfg->getRGBFormatFlag() && cu.colorTransform));
    
      bool ispCanBeUsed   = sps.getUseISP() && cu.mtsFlag == 0 && cu.lfnstIdx == 0 && CU::canUseISP(width, height, cu.cs->sps->getMaxTbSize());
      bool saveDataForISP = ispCanBeUsed && (!colorTransformIsEnabled || isFirstColorSpace);
      bool testISP        = ispCanBeUsed && (!colorTransformIsEnabled || !cu.colorTransform);
    
    fan wang's avatar
    fan wang committed
    
    #if JVET_AB0155_SGPM
      const bool sgpmAllowed = sps.getUseSgpm() && isLuma(partitioner.chType);
      bool testSgpm = sgpmAllowed && cu.lwidth() >= GEO_MIN_CU_SIZE_EX && cu.lheight() >= GEO_MIN_CU_SIZE_EX
                      && cu.lwidth() <= GEO_MAX_CU_SIZE_EX && cu.lheight() <= GEO_MAX_CU_SIZE_EX
                      && cu.lwidth() < 8 * cu.lheight() && cu.lheight() < 8 * cu.lwidth() && cu.lx() && cu.ly()
                      && cu.lwidth() * cu.lheight() >= SGPM_MIN_PIX;
    #endif
    
    
    #if JVET_W0103_INTRA_MTS 
      if (testISP && m_pcEncCfg->getUseFastISP())
      {
        m_numModesISPRDO = -1;
        testISP &= testISPforCurrCU(cu);
      }
    #endif
    
      if ( saveDataForISP )
    
        //reset the intra modes lists variables
        m_ispCandListHor.clear();
        m_ispCandListVer.clear();
    
        //reset the variables used for the tests
    
        m_regIntraRDListWithCosts.clear();
    
        int numTotalPartsHor = (int)width  >> floorLog2(CU::getISPSplitDim(width, height, TU_1D_VERT_SPLIT));
        int numTotalPartsVer = (int)height >> floorLog2(CU::getISPSplitDim(width, height, TU_1D_HORZ_SPLIT));
    
        m_ispTestedModes[0].init( numTotalPartsHor, numTotalPartsVer );
        //the total number of subpartitions is modified to take into account the cases where LFNST cannot be combined with ISP due to size restrictions
        numTotalPartsHor = sps.getUseLFNST() && CU::canUseLfnstWithISP(cu.Y(), HOR_INTRA_SUBPARTITIONS) ? numTotalPartsHor : 0;
        numTotalPartsVer = sps.getUseLFNST() && CU::canUseLfnstWithISP(cu.Y(), VER_INTRA_SUBPARTITIONS) ? numTotalPartsVer : 0;
        for (int j = 1; j < NUM_LFNST_NUM_PER_SET; j++)
        {
          m_ispTestedModes[j].init(numTotalPartsHor, numTotalPartsVer);
        }
    
    #if INTRA_TRANS_ENC_OPT
      double regAngCost = MAX_DOUBLE;
      bool setSkipTimdControl = (m_pcEncCfg->getIntraPeriod() == 1) && !cu.lfnstIdx && !cu.mtsFlag;
      double timdAngCost = MAX_DOUBLE;
    #endif
    
      const bool testBDPCM = sps.getBDPCMEnabledFlag() && CU::bdpcmAllowed(cu, ComponentID(partitioner.chType)) && cu.mtsFlag == 0 && cu.lfnstIdx == 0;
    
      static_vector<ModeInfo, FAST_UDI_MAX_RDMODE_NUM> uiHadModeList;
    
      static_vector<double, FAST_UDI_MAX_RDMODE_NUM> CandCostList;
      static_vector<double, FAST_UDI_MAX_RDMODE_NUM> CandHadList;
    
      auto &pu = *cu.firstPU;
    
      bool validReturn = false;
    
      {
        CandHadList.clear();
        CandCostList.clear();
        uiHadModeList.clear();
    
        CHECK(pu.cu != &cu, "PU is not contained in the CU");
    
    
    Vadim Seregin's avatar
    Vadim Seregin committed
    #if SECONDARY_MPM
        std::memcpy( pu.intraMPM, m_mpmList, sizeof( pu.intraMPM ) );
        std::memcpy( pu.intraNonMPM, m_nonMPMList, sizeof( pu.intraNonMPM ) );
    #endif
    
    
        //===== determine set of modes to be tested (using prediction signal only) =====
        int numModesAvailable = NUM_LUMA_MODE; // total number of Intra modes
    
        const bool fastMip    = sps.getUseMIP() && m_pcEncCfg->getUseFastMIP();
    
        const bool mipAllowed = sps.getUseMIP() && isLuma(partitioner.chType) && ((cu.lfnstIdx == 0) || allowLfnstWithMip(cu.firstPU->lumaSize()));
    
        const bool testMip = mipAllowed && !(cu.lwidth() > (8 * cu.lheight()) || cu.lheight() > (8 * cu.lwidth()));
    
        const bool supportedMipBlkSize = pu.lwidth() <= MIP_MAX_WIDTH && pu.lheight() <= MIP_MAX_HEIGHT;
    
    Vadim Seregin's avatar
    Vadim Seregin committed
    #if JVET_V0130_INTRA_TMP
        const bool tpmAllowed = sps.getUseIntraTMP() && isLuma(partitioner.chType) && ((cu.lfnstIdx == 0) || allowLfnstWithTmp());
        const bool testTpm = tpmAllowed && (cu.lwidth() <= sps.getIntraTMPMaxSize() && cu.lheight() <= sps.getIntraTMPMaxSize());
    
    Vadim Seregin's avatar
    Vadim Seregin committed
    #endif
    
    
        static_vector<ModeInfo, FAST_UDI_MAX_RDMODE_NUM> uiRdModeList;
    
    Karsten Suehring's avatar
    Karsten Suehring committed
        numModesForFullRD = g_aucIntraModeNumFast_UseMPM_2D[uiWidthBit - MIN_CU_LOG2][uiHeightBit - MIN_CU_LOG2];
    
    
    #if INTRA_FULL_SEARCH
        numModesForFullRD = numModesAvailable;
    #endif
    
    Vadim Seregin's avatar
    Vadim Seregin committed
    #if ENABLE_DIMD
        bool bestDimdMode = false;
    
    Keming Cao's avatar
    Keming Cao committed
    #endif
    #if JVET_W0123_TIMD_FUSION
        bool bestTimdMode = false;
    
    Vadim Seregin's avatar
    Vadim Seregin committed
    #endif
    
    #if JVET_AC0105_DIRECTIONAL_PLANAR
        uint8_t bestPlMode = 0;
    #endif
    
    fan wang's avatar
    fan wang committed
    #if JVET_AB0155_SGPM
        bool bestSgpmMode = false;
        const CompArea &area = pu.Y();
        CompArea tmpArea(COMPONENT_Y, area.chromaFormat, Position(0, 0), area.size());
    #endif
    
    
        if (isSecondColorSpace)
        {
          uiRdModeList.clear();
          if (m_numSavedRdModeFirstColorSpace[m_savedRdModeIdx] > 0)
          {
            for (int i = 0; i < m_numSavedRdModeFirstColorSpace[m_savedRdModeIdx]; i++)
            {
              uiRdModeList.push_back(m_savedRdModeFirstColorSpace[m_savedRdModeIdx][i]);
            }
          }
    
          if (mtsUsageFlag != 2)
    
    fan wang's avatar
    fan wang committed
    #if JVET_AB0155_SGPM
            if (testSgpm && SGPMSaveFlag)
            {
              for (int i = 0; i < NUM_LUMA_MODE; i++)
              {
                m_intraModeReady[i] = 0;
              }
            }
    #endif
    
            // this should always be true
            CHECK(!pu.Y().valid(), "PU is not valid");
    
    #if !JVET_AB0157_TMRL
    
            bool isFirstLineOfCtu     = (((pu.block(COMPONENT_Y).y) & ((pu.cs->sps)->getMaxCUWidth() - 1)) == 0);
    
    #if JVET_Y0116_EXTENDED_MRL_LIST
            int  numOfPassesExtendRef = MRL_NUM_REF_LINES;
            if (!sps.getUseMRL() || isFirstLineOfCtu) 
            {
              numOfPassesExtendRef = 1;
            }
            else
            {
              bool checkLineOutsideCtu[MRL_NUM_REF_LINES - 1];
              for (int mrlIdx = 1; mrlIdx < MRL_NUM_REF_LINES; mrlIdx++)
              {
                bool isLineOutsideCtu =
                  ((cu.block(COMPONENT_Y).y) % ((cu.cs->sps)->getMaxCUWidth()) <= MULTI_REF_LINE_IDX[mrlIdx]) ? true
                                                                                                              : false;
                checkLineOutsideCtu[mrlIdx-1] = isLineOutsideCtu;
              }
              if (checkLineOutsideCtu[0]) 
              {
                numOfPassesExtendRef = 1;
              }
              else
              {
                for (int mrlIdx = MRL_NUM_REF_LINES - 2; mrlIdx > 0; mrlIdx--)
                {
                  if (checkLineOutsideCtu[mrlIdx] && !checkLineOutsideCtu[mrlIdx - 1])
                  {
                    numOfPassesExtendRef = mrlIdx + 1;
                    break;
                  }
                }
              }
            }
    #else
    
            int  numOfPassesExtendRef = ((!sps.getUseMRL() || isFirstLineOfCtu) ? 1 : MRL_NUM_REF_LINES);
    
            pu.multiRefIdx            = 0;
    
    #if JVET_AB0157_TMRL
            cu.tmrlFlag = false;
    #endif
    
            if (numModesForFullRD != numModesAvailable)
    
              CHECK(numModesForFullRD >= numModesAvailable, "Too many modes for full RD search");
    
    fan wang's avatar
    fan wang committed
    #if !JVET_AB0155_SGPM
    
              const CompArea &area = pu.Y();
    
    fan wang's avatar
    fan wang committed
    #endif
    
              PelBuf piOrg  = cs.getOrgBuf(area);
              PelBuf piPred = cs.getPredBuf(area);
    
              DistParam distParamSad;
              DistParam distParamHad;
    
              if (cu.slice->getLmcsEnabledFlag() && m_pcReshape->getCTUFlag())
    
    fan wang's avatar
    fan wang committed
    #if !JVET_AB0155_SGPM
    
                CompArea tmpArea(COMPONENT_Y, area.chromaFormat, Position(0, 0), area.size());
    
    fan wang's avatar
    fan wang committed
    #endif
    
                PelBuf   tmpOrg = m_tmpStorageLCU.getBuf(tmpArea);
    
    Vadim Seregin's avatar
    Vadim Seregin committed
                tmpOrg.rspSignal( piOrg, m_pcReshape->getFwdLUT() );
    
                m_pcRdCost->setDistParam(distParamSad, tmpOrg, piPred, sps.getBitDepth(CHANNEL_TYPE_LUMA), COMPONENT_Y,
                                         false);   // Use SAD cost
                m_pcRdCost->setDistParam(distParamHad, tmpOrg, piPred, sps.getBitDepth(CHANNEL_TYPE_LUMA), COMPONENT_Y,
                                         true);   // Use HAD (SATD) cost
    
              else
    
                m_pcRdCost->setDistParam(distParamSad, piOrg, piPred, sps.getBitDepth(CHANNEL_TYPE_LUMA), COMPONENT_Y,
                                         false);   // Use SAD cost
                m_pcRdCost->setDistParam(distParamHad, piOrg, piPred, sps.getBitDepth(CHANNEL_TYPE_LUMA), COMPONENT_Y,
                                         true);   // Use HAD (SATD) cost
    
              distParamSad.applyWeight = false;
              distParamHad.applyWeight = false;
    
              if (testMip && supportedMipBlkSize)
              {
                numModesForFullRD += fastMip
                                       ? std::max(numModesForFullRD, floorLog2(std::min(pu.lwidth(), pu.lheight())) - 1)
                                       : numModesForFullRD;
              }
    
    Vadim Seregin's avatar
    Vadim Seregin committed
    #if JVET_V0130_INTRA_TMP
    
    #if JVET_AB0130_ITMP_SAMPLING
              if (testTpm && !m_pcEncCfg->getUseFastIntraTMP())
    #else
    
    Vadim Seregin's avatar
    Vadim Seregin committed
              if( testTpm )
    
    Vadim Seregin's avatar
    Vadim Seregin committed
              {
                numModesForFullRD += 1; // testing tpm
              }
              const int numHadCand = (testMip ? 2 : 1) * 3 + testTpm;
              
              cu.tmpFlag = false;
    
    Vadim Seregin's avatar
    Vadim Seregin committed
    #else
    
              const int numHadCand = (testMip ? 2 : 1) * 3;
    
    Vadim Seregin's avatar
    Vadim Seregin committed
    #endif
    
    fan wang's avatar
    fan wang committed
    #if JVET_AB0155_SGPM
              static_vector<SgpmInfo, SGPM_NUM> sgpmInfoList;
              static_vector<double, SGPM_NUM>   sgpmCostList;
              int                               sgpmNeededMode[NUM_LUMA_MODE] = {0};
    
              if (testSgpm && SGPMSaveFlag)
              {
                deriveSgpmModeOrdered(bestCS->picture->getRecoBuf(area), area, cu, sgpmInfoList, sgpmCostList);
                for (int sgpmIdx = 0; sgpmIdx < SGPM_NUM; sgpmIdx++)
                {
                  int      sgpmMode[2];
                  sgpmMode[0]                 = sgpmInfoList[sgpmIdx].sgpmMode0;
                  sgpmMode[1]                 = sgpmInfoList[sgpmIdx].sgpmMode1;
                  sgpmNeededMode[sgpmMode[0]] = 1;
                  sgpmNeededMode[sgpmMode[1]] = 1;
                }
              }
    #endif
    
    
    #if JVET_AB0157_TMRL
              double tmrlCostList[MRL_LIST_SIZE]{ MAX_DOUBLE };
    #endif
    
    #if JVET_AC0105_DIRECTIONAL_PLANAR
              double dirPlanarCostList[2]{ MAX_DOUBLE };
    #endif
    
              //*** Derive (regular) candidates using Hadamard
              cu.mipFlag = false;
    
              //===== init pattern for luma prediction =====
    
    #if JVET_AB0157_INTRA_FUSION && JVET_AB0155_SGPM
              initIntraPatternChType(cu, pu.Y(), true, 0, false);
    #elif JVET_AB0157_INTRA_FUSION
    
              initIntraPatternChType(cu, pu.Y(), true, false);
    #else
    
              initIntraPatternChType(cu, pu.Y(), true);
    
              bool bSatdChecked[NUM_INTRA_MODE];
              memset(bSatdChecked, 0, sizeof(bSatdChecked));
    
              if (!LFNSTLoadFlag)
              {
                for (int modeIdx = 0; modeIdx < numModesAvailable; modeIdx++)
                {
                  uint32_t   uiMode    = modeIdx;
                  Distortion minSadHad = 0;
    
                  // Skip checking extended Angular modes in the first round of SATD
                  if (uiMode > DC_IDX && (uiMode & 1))
                  {
                    continue;
    
                  bSatdChecked[uiMode] = true;
    
                  pu.intraDir[0] = modeIdx;
    
                  initPredIntraParams(pu, pu.Y(), sps);
    
    #if JVET_AB0157_INTRA_FUSION
                  predIntraAng(COMPONENT_Y, piPred, pu, false);
    #else
    
                  predIntraAng(COMPONENT_Y, piPred, pu);
    
    fan wang's avatar
    fan wang committed
    #if JVET_AB0155_SGPM
                  if (testSgpm && SGPMSaveFlag && sgpmNeededMode[uiMode])
                  {
                    PelBuf   predBuf(m_intraPredBuf[uiMode], tmpArea);
                    predBuf.copyFrom(piPred);
                    m_intraModeReady[uiMode] = 1;
                  }
    #endif
    
    
                  // Use the min between SAD and HAD as the cost criterion
    
                  // SAD is scaled by 2 to align with the scaling of HAD
    
                  minSadHad += std::min(distParamSad.distFunc(distParamSad) * 2, distParamHad.distFunc(distParamHad));
    
    
                  // NB xFracModeBitsIntra will not affect the mode for chroma that may have already been pre-estimated.
    
    Vadim Seregin's avatar
    Vadim Seregin committed
    #if JVET_V0130_INTRA_TMP
                  m_CABACEstimator->getCtx() = SubCtx( Ctx::TmpFlag, ctxStartTpmFlag );
    
    Vadim Seregin's avatar
    Vadim Seregin committed
    #endif
    
                  m_CABACEstimator->getCtx() = SubCtx( Ctx::MipFlag, ctxStartMipFlag );
    
    Keming Cao's avatar
    Keming Cao committed
    #if JVET_W0123_TIMD_FUSION
                  m_CABACEstimator->getCtx() = SubCtx( Ctx::TimdFlag, ctxStartTimdFlag );
    #endif
    
    fan wang's avatar
    fan wang committed
    #if JVET_AB0155_SGPM
                  m_CABACEstimator->getCtx() = SubCtx(Ctx::SgpmFlag, ctxStartSgpmFlag);
    #endif
    
    
                  m_CABACEstimator->getCtx() = SubCtx( Ctx::ISPMode, ctxStartIspMode );
    
    Vadim Seregin's avatar
    Vadim Seregin committed
    #if SECONDARY_MPM
                  m_CABACEstimator->getCtx() = SubCtx(Ctx::IntraLumaMPMIdx, ctxStartMPMIdxFlag);
    #endif
    
                  m_CABACEstimator->getCtx() = SubCtx(Ctx::IntraLumaPlanarFlag, ctxStartPlanarFlag);
    
    Frank Bossen's avatar
    Frank Bossen committed
                  m_CABACEstimator->getCtx() = SubCtx(Ctx::IntraLumaMpmFlag, ctxStartIntraMode);
    
    Vadim Seregin's avatar
    Vadim Seregin committed
    #if SECONDARY_MPM
                  m_CABACEstimator->getCtx() = SubCtx(Ctx::IntraLumaSecondMpmFlag, ctxStartIntraMode2);
    #endif
    
    Paul Keydel's avatar
    Paul Keydel committed
                  m_CABACEstimator->getCtx() = SubCtx( Ctx::MultiRefLineIdx, ctxStartMrlIdx );
    
    #if JVET_AB0157_TMRL
                  m_CABACEstimator->getCtx() = SubCtx(Ctx::TmrlDerive, ctxStartTmrlDerive);
    #endif
    
                  uint64_t fracModeBits = xFracModeBitsIntra(pu, uiMode, CHANNEL_TYPE_LUMA);
    
                  double cost = (double) minSadHad + (double) fracModeBits * sqrtLambdaForFirstPass;
    
                  DTRACE(g_trace_ctx, D_INTRA_COST, "IntraHAD: %u, %llu, %f (%d)\n", minSadHad, fracModeBits, cost, uiMode);
    
                  updateCandList(ModeInfo(false, false, 0, NOT_INTRA_SUBPARTITIONS, uiMode), cost, uiRdModeList,
                                 CandCostList, numModesForFullRD);
                  updateCandList(ModeInfo(false, false, 0, NOT_INTRA_SUBPARTITIONS, uiMode), double(minSadHad),
                                 uiHadModeList, CandHadList, numHadCand);
                }
    
    #if JVET_AC0105_DIRECTIONAL_PLANAR
                bool testDirPlanar = isLuma(partitioner.chType);
                if (testDirPlanar)
                {
                  for (int dirPlanarModeIdx = 0; dirPlanarModeIdx < 2; dirPlanarModeIdx++)
                  {
                    cu.sgpm        = false;
                    cu.ispMode     = 0;
                    cu.tmpFlag     = false;
                    cu.tmrlFlag    = false;
                    pu.multiRefIdx = 0;
                    cu.mipFlag     = false;
                    pu.intraDir[0] = PLANAR_IDX;
                    cu.plIdx       = dirPlanarModeIdx + 1;
    
                    initPredIntraParams(pu, pu.Y(), sps);
    #if JVET_AB0157_INTRA_FUSION
                    predIntraAng(COMPONENT_Y, piPred, pu, false);
    #else
                    predIntraAng(COMPONENT_Y, piPred, pu);
    #endif
    
                    // Use the min between SAD and SATD as the cost criterion
                    // SAD is scaled by 2 to align with the scaling of HAD
                    Distortion minSadHad =
                      std::min(distParamSad.distFunc(distParamSad) * 2, distParamHad.distFunc(distParamHad));
    
                    // NB xFracModeBitsIntra will not affect the mode for chroma that may have already been
                    // pre-estimated.
    #if JVET_V0130_INTRA_TMP
                    m_CABACEstimator->getCtx() = SubCtx(Ctx::TmpFlag, ctxStartTpmFlag);
    #endif
                    m_CABACEstimator->getCtx() = SubCtx(Ctx::MipFlag, ctxStartMipFlag);
    #if JVET_W0123_TIMD_FUSION
                    m_CABACEstimator->getCtx() = SubCtx(Ctx::TimdFlag, ctxStartTimdFlag);
    #endif
    #if JVET_AB0155_SGPM
                    m_CABACEstimator->getCtx() = SubCtx(Ctx::SgpmFlag, ctxStartSgpmFlag);
    #endif
                    m_CABACEstimator->getCtx() = SubCtx(Ctx::ISPMode, ctxStartIspMode);
    #if SECONDARY_MPM
                    m_CABACEstimator->getCtx() = SubCtx(Ctx::IntraLumaMPMIdx, ctxStartMPMIdxFlag);
    #endif
                    m_CABACEstimator->getCtx() = SubCtx(Ctx::IntraLumaPlanarFlag, ctxStartPlanarFlag);
                    m_CABACEstimator->getCtx() = SubCtx(Ctx::IntraLumaMpmFlag, ctxStartIntraMode);
    #if SECONDARY_MPM
                    m_CABACEstimator->getCtx() = SubCtx(Ctx::IntraLumaSecondMpmFlag, ctxStartIntraMode2);
    #endif
                    m_CABACEstimator->getCtx() = SubCtx(Ctx::MultiRefLineIdx, ctxStartMrlIdx);
    #if JVET_AB0157_TMRL
                    m_CABACEstimator->getCtx() = SubCtx(Ctx::TmrlDerive, ctxStartTmrlDerive);
    #endif
    
                    uint64_t fracModeBits = xFracModeBitsIntra(pu, PLANAR_IDX, CHANNEL_TYPE_LUMA);
                    double cost = (double) minSadHad + (double) fracModeBits * sqrtLambdaForFirstPass;
    
                    updateCandList(
                      ModeInfo(false, false, 0, NOT_INTRA_SUBPARTITIONS, dirPlanarModeIdx ? PL_VER_IDX : PL_HOR_IDX), cost,
                      uiRdModeList, CandCostList, numModesForFullRD);
                    updateCandList(
                      ModeInfo(false, false, 0, NOT_INTRA_SUBPARTITIONS, dirPlanarModeIdx ? PL_VER_IDX : PL_HOR_IDX),
                      double(minSadHad), uiHadModeList, CandHadList, numHadCand);
                    dirPlanarCostList[dirPlanarModeIdx] = cost;
                  }
                }
                cu.plIdx = 0;
    #endif
    
                if (!sps.getUseMIP() && LFNSTSaveFlag)
                {
                  // save found best modes
                  m_uiSavedNumRdModesLFNST = numModesForFullRD;
                  m_uiSavedRdModeListLFNST = uiRdModeList;
                  m_dSavedModeCostLFNST    = CandCostList;
                  // PBINTRA fast
                  m_uiSavedHadModeListLFNST = uiHadModeList;
                  m_dSavedHadListLFNST      = CandHadList;