x265-1.7版本-encoder/weightPrediction.cpp注释

最新推荐文章于 2021-04-12 15:14:53 发布
cabbage2008
最新推荐文章于 2021-04-12 15:14:53 发布
阅读量1w
点赞数
分类专栏： x265代码注释
本文链接：https://blog.csdn.net/cabbage2008/article/details/50569744
版权
x265代码注释专栏收录该内容
74 篇文章 53 订阅
订阅专栏
注：问号以及未注释部分会在x265-1.8版本内更新
/*****************************************************************************
 * Copyright (C) 2013 x265 project
 *
 * Author: Shazeb Nawaz Khan <shazeb@multicorewareinc.com>
 *         Steve Borho <steve@borho.org>
 *         Kavitha Sampas <kavitha@multicorewareinc.com>
 *
 * This program is free software; you can redistribute it and/or modify
 * it under the terms of the GNU General Public License as published by
 * the Free Software Foundation; either version 2 of the License, or
 * (at your option) any later version.
 *
 * This program is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 * GNU General Public License for more details.
 *
 * You should have received a copy of the GNU General Public License
 * along with this program; if not, write to the Free Software
 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA  02111, USA.
 *
 * This program is also available under a commercial proprietary license.
 * For more information, contact us at license @ x265.com.
 *****************************************************************************/

#include "common.h"
#include "frame.h"
#include "picyuv.h"
#include "lowres.h"
#include "slice.h"
#include "mv.h"
#include "bitstream.h"

using namespace x265;
namespace {
struct Cache // per-frame values filled in once by weightAnalyse and read by the helpers in this file
{
    const int * intraCost; // intra cost of each 8x8 lowres block (copied from the frame's Lowres::intraCost)
    int         numPredDir;// number of reference lists analysed: 1 when slice.isInterP(), otherwise 2
    int         csp;       // chroma sampling format of the source picture (m_picCsp), e.g. X265_CSP_I444
    int         hshift;    // CHROMA_H_SHIFT(csp): right shift that converts a luma width to a chroma width
    int         vshift;    // CHROMA_V_SHIFT(csp): right shift that converts a luma height to a chroma height
    int         lowresWidthInCU;// lowres frame width >> 3, i.e. number of 8x8 blocks per lowres row
    int         lowresHeightInCU;// lowres frame lines >> 3, i.e. number of 8x8 block rows in the lowres frame
};
/** Estimate the cost of signalling one set of weight parameters in the slice header.
 *  Used by weightAnalyse when comparing candidate weights.
 * \param w        weight parameters; only w[0] is read
 * \param lambda   lambda the caller uses to convert bits into cost
 * \param bChroma  non-zero for a chroma plane, zero for luma
 * \return         lambda-scaled bit estimate for the header syntax */
int sliceHeaderCost(WeightParam *w, int lambda, int bChroma)
{
    /* 4 times higher, because chroma is analyzed at full resolution. */
    const int scaledLambda = bChroma ? lambda * 4 : lambda;

    /* size of the denominator as an unsigned Exp-Golomb code; counted twice
     * for luma (bChroma == 0) and once for chroma (bChroma == 1) */
    const int denomBits = bs_size_ue(w[0].log2WeightDenom) * (2 - bChroma);

    /* signed Exp-Golomb sizes of the weight and the offset */
    const int paramBits = bs_size_se(w[0].inputWeight) + bs_size_se(w[0].inputOffset);

    /* NOTE(review): the constant 10 is a fixed overhead whose origin is not shown here */
    return scaledLambda * (10 + denomBits + 2 * paramBits);
}

/* make a motion compensated copy of lowres ref into mcout with the same stride.
 * The borders of mcout are not extended */
/** Build a motion compensated lowres luma plane, one 8x8 block at a time.
 *  Used by weightAnalyse.
 * \param mcout  destination plane; written with the stride ref.lumaStride
 * \param ref    lowres data of the reference frame
 * \param mvs    one motion vector per 8x8 block, in raster order */
void mcLuma(pixel* mcout, Lowres& ref, const MV * mvs)
{
    const int blockDim = 8;        // blocks are 8x8 pixels
    const int qpelScale = 1 << 2;  // motion vectors are in quarter-pel units
    const intptr_t lumaStride = ref.lumaStride;

    MV lowBound, highBound;
    int blockIdx = 0;

    for (int row = 0; row < ref.lines; row += blockDim)
    {
        /* vertical MV limits: at most 8 pixels above the top / below the bottom of the plane */
        lowBound.y  = (int16_t)((-row - 8) * qpelScale);
        highBound.y = (int16_t)((ref.lines - row - 1 + 8) * qpelScale);

        intptr_t offset = row * lumaStride; // pixel offset of the current block from the plane origin

        for (int col = 0; col < ref.width; col += blockDim)
        {
            ALIGN_VAR_16(pixel, scratch[8 * 8]); // temporary block handed to lowresMC
            intptr_t srcStride = 8;              // reset for every block; handed to lowresMC, then used as the copy source stride

            /* horizontal MV limits, same 8 pixel allowance */
            lowBound.x  = (int16_t)((-col - 8) * qpelScale);
            highBound.x = (int16_t)((ref.width - col - 1 + 8) * qpelScale);

            /* clip MV to available pixels */
            MV blockMv = mvs[blockIdx];
            blockMv = blockMv.clipped(lowBound, highBound);

            pixel *predicted = ref.lowresMC(offset, blockMv, scratch, srcStride);
            primitives.cu[BLOCK_8x8].copy_pp(mcout + offset, lumaStride, predicted, srcStride);

            offset += blockDim;
            blockIdx++;
        }
    }
}

/* use lowres MVs from lookahead to generate a motion compensated chroma plane.
 * if a block had cheaper lowres cost as intra, we treat it as MV 0 */
/** Build a motion compensated chroma plane from a full-resolution reference
 *  chroma plane, using the lowres luma motion vectors. Used by weightAnalyse.
 * \param mcout   destination plane, written with the same stride as src
 * \param src     reference chroma plane (full-resolution picture, not lowres)
 * \param stride  stride shared by src and mcout
 * \param mvs     lowres motion vectors, one per 8x8 lowres luma block
 * \param cache   per-frame values (csp, chroma shifts, lowres block counts)
 * \param height  height of the chroma area to process
 * \param width   width of the chroma area to process */
void mcChroma(pixel *      mcout,
              pixel *      src,
              intptr_t     stride,
              const MV *   mvs,
              const Cache& cache,
              int          height,
              int          width)
{
    /* the motion vectors correspond to 8x8 lowres luma blocks, or 16x16 fullres
     * luma blocks. We have to adapt block size to chroma csp */
    int csp = cache.csp;
    int bw = 16 >> cache.hshift; // chroma block width covered by one lowres MV
    int bh = 16 >> cache.vshift; // chroma block height covered by one lowres MV
    const int mvshift = 1 << 2;  // motion vectors are in quarter-pel units
    MV mvmin, mvmax;

    for (int y = 0; y < height; y += bh)
    {
        /* note: lowres block count per row might be different from chroma block
         * count per row because of rounding issues, so be very careful with indexing
         * into the lowres structures */
        int cu = y * cache.lowresWidthInCU;
        intptr_t pixoff = y * stride; // pixel offset of the current block from the plane origin
        mvmin.y = (int16_t)((-y - 8) * mvshift);              // at most 8 pixels above the top edge
        mvmax.y = (int16_t)((height - y - 1 + 8) * mvshift);  // at most 8 pixels below the bottom edge

        for (int x = 0; x < width; x += bw, cu++, pixoff += bw)
        {
            /* NOTE(review): x and y advance in chroma pixels while the cache limits are
             * counts of 8x8 lowres blocks - confirm that comparing them directly is intended */
            if (x < cache.lowresWidthInCU && y < cache.lowresHeightInCU)
            {
                MV mv = mvs[cu]; // lowres MV
                mv <<= 1;        // fullres MV
                mv.x >>= cache.hshift;
                mv.y >>= cache.vshift;

                /* clip MV to available pixels */
                mvmin.x = (int16_t)((-x - 8) * mvshift);
                mvmax.x = (int16_t)((width - x - 1 + 8) * mvshift);
                mv = mv.clipped(mvmin, mvmax);

                /* integer-pel part of the MV selects the source position */
                intptr_t fpeloffset = (mv.y >> 2) * stride + (mv.x >> 2);
                pixel *temp = src + pixoff + fpeloffset;

                /* fractional part selects plain copy, horizontal, vertical or
                 * two-pass (horizontal then vertical) interpolation */
                int xFrac = mv.x & 0x7;
                int yFrac = mv.y & 0x7;
                if ((yFrac | xFrac) == 0)
                {
                    primitives.chroma[csp].pu[LUMA_16x16].copy_pp(mcout + pixoff, stride, temp, stride);
                }
                else if (yFrac == 0)
                {
                    primitives.chroma[csp].pu[LUMA_16x16].filter_hpp(temp, stride, mcout + pixoff, stride, xFrac);
                }
                else if (xFrac == 0)
                {
                    primitives.chroma[csp].pu[LUMA_16x16].filter_vpp(temp, stride, mcout + pixoff, stride, yFrac);
                }
                else
                {
                    /* intermediate 16-bit buffer with NTAPS_CHROMA extra rows for the vertical pass */
                    ALIGN_VAR_16(int16_t, imm[16 * (16 + NTAPS_CHROMA)]);
                    primitives.chroma[csp].pu[LUMA_16x16].filter_hps(temp, stride, imm, bw, xFrac, 1);
                    primitives.chroma[csp].pu[LUMA_16x16].filter_vsp(imm + ((NTAPS_CHROMA >> 1) - 1) * bw, bw, mcout + pixoff, stride, yFrac);
                }
            }
            else
            {
                /* no motion vector used for this block: copy the co-located reference block */
                primitives.chroma[csp].pu[LUMA_16x16].copy_pp(mcout + pixoff, stride, src + pixoff, stride);
            }
        }
    }
}

/* Measure sum of 8x8 satd costs between source frame and reference
 * frame (potentially weighted, potentially motion compensated). We
 * always use source images for this analysis since reference recon
 * pixels have unreliable availability */
/** Sum of SATD costs between a source plane and a reference plane. Used by weightAnalyse.
 * \param fenc        source plane (lowres luma, or a full-resolution chroma plane)
 * \param ref         reference plane, possibly motion compensated
 * \param weightTemp  scratch plane that receives the weighted reference when w is non-NULL
 * \param stride      stride shared by fenc, ref and weightTemp
 * \param cache       per-frame values (intra costs, csp)
 * \param width       width of the area to measure
 * \param height      height of the area to measure
 * \param w           weight parameters to apply to ref first, or NULL for no weighting
 * \param bLuma       true for luma, false for chroma
 * \return            accumulated cost; for luma each block cost is capped by its intra cost */
uint32_t weightCost(pixel *         fenc,
                    pixel *         ref,
                    pixel *         weightTemp,
                    intptr_t        stride,
                    const Cache &   cache,
                    int             width,
                    int             height,
                    WeightParam *   w,
                    bool            bLuma)
{
    pixel *refPlane = ref;

    if (w)
    {
        /* make a weighted copy of the reference plane */
        const int internalShift = IF_INTERNAL_PREC - X265_DEPTH; /* intermediate interpolation depth */
        const int log2Denom = w->log2WeightDenom;
        const int rounding = log2Denom ? 1 << (log2Denom - 1) : 0;
        const int scaledOffset = w->inputOffset << (X265_DEPTH - 8);
        const int paddedWidth = ((width + 15) >> 4) << 4; /* width rounded up to a multiple of 16 */

        primitives.weight_pp(ref, weightTemp, stride, paddedWidth, height,
                             w->inputWeight, rounding << internalShift, log2Denom + internalShift, scaledOffset);
        refPlane = weightTemp; /* measure against the weighted copy from here on */
    }

    uint32_t total = 0;

    if (bLuma)
    {
        /* luma: 8x8 blocks, each cost limited by the block's intra cost */
        int blockIdx = 0;
        for (int row = 0; row < height; row += 8)
        {
            pixel *refRow = refPlane + row * stride;
            pixel *srcRow = fenc + row * stride;
            for (int col = 0; col < width; col += 8)
            {
                int blockCost = primitives.pu[LUMA_8x8].satd(refRow + col, stride, srcRow + col, stride);
                total += X265_MIN(blockCost, cache.intraCost[blockIdx]);
                blockIdx++;
            }
        }
        return total;
    }

    /* chroma: 16x16 blocks for 4:4:4, 8x8 blocks otherwise */
    const bool is444 = cache.csp == X265_CSP_I444;
    const int blockDim = is444 ? 16 : 8;
    const int partition = is444 ? LUMA_16x16 : LUMA_8x8;

    for (int row = 0; row < height; row += blockDim)
    {
        pixel *refRow = refPlane + row * stride;
        pixel *srcRow = fenc + row * stride;
        for (int col = 0; col < width; col += blockDim)
            total += primitives.pu[partition].satd(refRow + col, stride, srcRow + col, stride);
    }

    return total;
}
}

namespace x265 {
/** Decide, for the first reference of every list, whether weighted prediction
 *  should be used and with which parameters; all other references are marked
 *  unweighted. The result is copied into slice.m_weightPredTable.
 *  (The original annotation states this is called from WeightAnalysis::processTasks
 *  and FrameEncoder::compressFrame(); those callers are not visible in this file.)
 * \param slice  slice of the frame being encoded; receives the weight table
 * \param frame  frame being encoded
 * \param param  encoder parameters (bframes and logLevel are read) */
void weightAnalyse(Slice& slice, Frame& frame, x265_param& param)
{
    WeightParam wp[2][MAX_NUM_REF][3]; // indexed by [list][reference][plane: Y, U, V]
    PicYuv *fencPic = frame.m_fencPic; // source picture of the frame being encoded
    Lowres& fenc    = frame.m_lowres;  // lowres data of the frame being encoded

    Cache cache; // per-frame values shared with the helper functions

    memset(&cache, 0, sizeof(cache));
    cache.intraCost = fenc.intraCost;               // intra cost per 8x8 lowres block
    cache.numPredDir = slice.isInterP() ? 1 : 2;    // number of reference lists to analyse
    cache.lowresWidthInCU = fenc.width >> 3;        // 8x8 blocks per lowres row
    cache.lowresHeightInCU = fenc.lines >> 3;       // 8x8 block rows in the lowres frame
    cache.csp = fencPic->m_picCsp;                  // chroma sampling format
    cache.hshift = CHROMA_H_SHIFT(cache.csp);       // luma-to-chroma horizontal shift
    cache.vshift = CHROMA_V_SHIFT(cache.csp);       // luma-to-chroma vertical shift

    /* Use single allocation for motion compensated ref and weight buffers */
    pixel *mcbuf = X265_MALLOC(pixel, 2 * fencPic->m_stride * fencPic->m_picHeight); // two planes: first half MC reference, second half weighted reference
    if (!mcbuf)
    {
        slice.disableWeights(); // allocation failed: give up on weighted prediction
        return;
    }
    pixel *weightTemp = mcbuf + fencPic->m_stride * fencPic->m_picHeight; // second half of the allocation

    int lambda = (int)x265_lambda_tab[X265_LOOKAHEAD_QP]; // lambda at the lookahead QP
    int curPoc = slice.m_poc;
    const float epsilon = 1.f / 128.f; // tolerance on the scale estimate for early termination

    int chromaDenom, lumaDenom, denom; // log2 weight denominators
    chromaDenom = lumaDenom = 7;       // both start at 7
    int numpixels[3];                  // pixel count used to turn per-plane sums into means
    int w16 = ((fencPic->m_picWidth  + 15) >> 4) << 4; // width rounded up to a multiple of 16
    int h16 = ((fencPic->m_picHeight + 15) >> 4) << 4; // height rounded up to a multiple of 16
    numpixels[0] = w16 * h16; // Y
    numpixels[1] = numpixels[2] = numpixels[0] >> (cache.hshift + cache.vshift); // U, V

    /* For every list:
     *   1. estimate scale and means of the current frame and of the list's first reference
     *   2. lower chromaDenom (list 0 only) until both chroma scale estimates fit
     *   3. search weight parameters for the first reference, plane by plane
     *   4. when luma is weighted and only one chroma plane is, copy that plane's
     *      parameters to the other chroma plane
     *   5. mark every other reference of the list as unweighted */
    for (int list = 0; list < cache.numPredDir; list++)
    {
        WeightParam *weights = wp[list][0];             // parameters of the list's first reference
        Frame *refFrame = slice.m_refPicList[list][0];  // first reference of the list
        Lowres& refLowres = refFrame->m_lowres;         // its lowres data
        int diffPoc = abs(curPoc - refFrame->m_poc);    // POC distance to the reference

        /* prepare estimates */
        float guessScale[3], fencMean[3], refMean[3]; // per plane: sqrt(fencVar / refVar), source mean, reference mean
        for (int plane = 0; plane < 3; plane++)
        {
            SET_WEIGHT(weights[plane], false, 1, 0, 0);
            /* wp_ssd is presumably n times the plane variance - TODO confirm. Both values
             * get +1 when the reference's wp_ssd is zero, so refVar is never zero. */
            uint64_t fencVar = fenc.wp_ssd[plane] + !refLowres.wp_ssd[plane];
            uint64_t refVar  = refLowres.wp_ssd[plane] + !refLowres.wp_ssd[plane];
            guessScale[plane] = sqrt((float)fencVar / refVar);
            fencMean[plane] = (float)fenc.wp_sum[plane] / (numpixels[plane]) / (1 << (X265_DEPTH - 8)); // mean, scaled to 8-bit range
            refMean[plane]  = (float)refLowres.wp_sum[plane] / (numpixels[plane]) / (1 << (X265_DEPTH - 8)); // mean, scaled to 8-bit range
        }

        /* make sure both our scale factors fit */
        /* list 0 only: lower chromaDenom until guessScale[1] and guessScale[2]
         * are both below 127 / (1 << chromaDenom) */
        while (!list && chromaDenom > 0)
        {
            float thresh = 127.f / (1 << chromaDenom);
            if (guessScale[1] < thresh && guessScale[2] < thresh)
                break;
            chromaDenom--;
        }

        /* default chroma parameters: weight 1 << chromaDenom, denominator chromaDenom,
         * offset 0, not present */
        SET_WEIGHT(weights[1], false, 1 << chromaDenom, chromaDenom, 0);
        SET_WEIGHT(weights[2], false, 1 << chromaDenom, chromaDenom, 0);

        MV *mvs = NULL; // lowres motion vectors towards this reference, when available

        /* Per plane:
         *   1. chroma is skipped entirely when luma ended up unweighted
         *   2. early out when means and scale estimate are close to identity
         *   3. seed the weight from the scale estimate
         *   4. (luma only) fetch lowres MVs and extend the reference chroma borders
         *   5. build the motion compensated reference (lowres luma / full-res chroma)
         *   6. measure the unweighted cost; zero cost means no weighting
         *   7. search scale and offset around the seed for the lowest cost
         *   8. (list 0 luma only) reduce the denominator while the weight is even
         *   9. store the decision for this plane */
        for (int plane = 0; plane < 3; plane++)
        {
            denom = plane ? chromaDenom : lumaDenom;
            if (plane && !weights[0].bPresentFlag) // luma not weighted: leave chroma unweighted
                break;

            /* Early termination */
            x265_emms(); // presumably resets MMX state before the floating-point math below - TODO confirm
            /* means differ by less than 0.5 and the scale estimate is within epsilon of 1 */
            if (fabsf(refMean[plane] - fencMean[plane]) < 0.5f && fabsf(1.f - guessScale[plane]) < epsilon)
            {
                SET_WEIGHT(weights[plane], 0, 1 << denom, denom, 0);
                continue;
            }

            if (plane)
            {
                int scale = x265_clip3(0, 255, (int)(guessScale[plane] * (1 << denom) + 0.5f));
                if (scale > 127) // seed weight out of range: keep the unweighted default set above
                    continue;
                weights[plane].inputWeight = scale;
            }
            else
            {
                weights[plane].setFromWeightAndOffset((int)(guessScale[plane] * (1 << denom) + 0.5f), 0, denom, !list);
            }

            int mindenom = weights[plane].log2WeightDenom; // denominator used for the search
            int minscale = weights[plane].inputWeight;     // seed weight; the search covers +/- scaleDist around it
            int minoff = 0;                                // best offset found so far

            /* luma only, and only when the POC distance is at most bframes + 1
             * (lowresMvs is indexed by diffPoc - 1) */
            if (!plane && diffPoc <= param.bframes + 1)
            {
                mvs = fenc.lowresMvs[list][diffPoc - 1];

                /* test whether this motion search was performed by lookahead */
                if (mvs[0].x != 0x7FFF)
                {
                    /* reference chroma planes must be extended prior to being
                     * used as motion compensation sources */
                    if (!refFrame->m_bChromaExtended) // extend only once per reference frame
                    {
                        refFrame->m_bChromaExtended = true;
                        PicYuv *refPic = refFrame->m_fencPic; // source picture of the reference frame
                        int width = refPic->m_picWidth >> cache.hshift;   // chroma width
                        int height = refPic->m_picHeight >> cache.vshift; // chroma height
                        extendPicBorder(refPic->m_picOrg[1], refPic->m_strideC, width, height, refPic->m_chromaMarginX, refPic->m_chromaMarginY);
                        extendPicBorder(refPic->m_picOrg[2], refPic->m_strideC, width, height, refPic->m_chromaMarginX, refPic->m_chromaMarginY);
                    }
                }
                else
                    mvs = 0; // no motion vectors available: compare against the co-located reference
            }

            /* prepare inputs to weight analysis */
            pixel *orig;          // source plane
            pixel *fref;          // reference plane (motion compensated when mvs is set)
            intptr_t stride;      // stride of both planes
            int    width, height; // area to measure
            switch (plane)
            {
            case 0: // luma: lowres planes
                orig = fenc.lowresPlane[0];
                stride = fenc.lumaStride;
                width = fenc.width;
                height = fenc.lines;
                fref = refLowres.lowresPlane[0];
                if (mvs)
                {
                    mcLuma(mcbuf, refLowres, mvs);
                    fref = mcbuf;
                }
                break;

            case 1: // first chroma plane: full-resolution source pictures
                orig = fencPic->m_picOrg[1];
                stride = fencPic->m_strideC;
                fref = refFrame->m_fencPic->m_picOrg[1];

                /* Clamp the chroma dimensions to the nearest multiple of
                 * 8x8 blocks (or 16x16 for 4:4:4) since mcChroma uses lowres
                 * blocks and weightCost measures 8x8 blocks. This
                 * potentially ignores some edge pixels, but simplifies the
                 * logic and prevents reading uninitialized pixels. Lowres
                 * planes are border extended and require no clamping. */
                width =  ((fencPic->m_picWidth  >> 4) << 4) >> cache.hshift;
                height = ((fencPic->m_picHeight >> 4) << 4) >> cache.vshift;
                if (mvs)
                {
                    mcChroma(mcbuf, fref, stride, mvs, cache, height, width);
                    fref = mcbuf;
                }
                break;

            case 2: // second chroma plane: same handling as plane 1
                orig = fencPic->m_picOrg[2];
                stride = fencPic->m_strideC;
                fref = refFrame->m_fencPic->m_picOrg[2];
                width =  ((fencPic->m_picWidth  >> 4) << 4) >> cache.hshift;
                height = ((fencPic->m_picHeight >> 4) << 4) >> cache.vshift;
                if (mvs)
                {
                    mcChroma(mcbuf, fref, stride, mvs, cache, height, width);
                    fref = mcbuf;
                }
                break;

            default:
                slice.disableWeights();
                X265_FREE(mcbuf);
                return;
            }

            /* cost without weighting; zero means the planes already match */
            uint32_t origscore = weightCost(orig, fref, weightTemp, stride, cache, width, height, NULL, !plane);
            if (!origscore)
            {
                SET_WEIGHT(weights[plane], 0, 1 << denom, denom, 0);
                continue;
            }

            uint32_t minscore = origscore; // lowest cost so far (SATD plus header cost for weighted candidates)
            bool bFound = false;           // set once a candidate beats the unweighted cost

            /* x264 uses a table lookup here, selecting search range based on preset */
            static const int scaleDist = 4;  // search radius around the seed weight
            static const int offsetDist = 2; // search radius around the estimated offset

            int startScale = x265_clip3(0, 127, minscale - scaleDist);
            int endScale   = x265_clip3(0, 127, minscale + scaleDist);
            /* For every candidate scale:
             *   1. skip it when its delta from 1 << mindenom is outside (-128, 127]
             *   2. estimate the offset; when it is out of range, clip it and re-derive the scale
             *   3. search the offsets around that estimate */
            for (int scale = startScale; scale <= endScale; scale++)
            {
                int deltaWeight = scale - (1 << mindenom);
                if (deltaWeight > 127 || deltaWeight <= -128)
                    continue;

                x265_emms(); // presumably resets MMX state before the floating-point math below - TODO confirm
                int curScale = scale;
                int curOffset = (int)(fencMean[plane] - refMean[plane] * curScale / (1 << mindenom) + 0.5f); // offset = source mean - weighted reference mean
                if (curOffset < -128 || curOffset > 127)
                {
                    /* Rescale considering the constraints on curOffset. We do it in this order
                     * because scale has a much wider range than offset (because of denom), so
                     * it should almost never need to be clamped. */
                    curOffset = x265_clip3(-128, 127, curOffset);
                    curScale = (int)((1 << mindenom) * (fencMean[plane] - curOffset) / refMean[plane] + 0.5f);
                    curScale = x265_clip3(0, 127, curScale);
                }

                int startOffset = x265_clip3(-128, 127, curOffset - offsetDist);
                int endOffset   = x265_clip3(-128, 127, curOffset + offsetDist);
                for (int off = startOffset; off <= endOffset; off++)
                {
                    WeightParam wsp; // candidate parameters
                    SET_WEIGHT(wsp, true, curScale, mindenom, off);
                    uint32_t s = weightCost(orig, fref, weightTemp, stride, cache, width, height, &wsp, !plane) +
                                 sliceHeaderCost(&wsp, lambda, !!plane); // weighted SATD plus slice header cost
                    /* presumably: when s < minscore, record s, curScale, off and set bFound */
                    COPY4_IF_LT(minscore, s, minscale, curScale, minoff, off, bFound, true);

                    /* Don't check any more offsets if the previous one had a lower cost than the current one */
                    if (minoff == startOffset && off != startOffset)
                        break;
                }
            }

            /* Use a smaller luma denominator if possible */
            if (!(plane || list)) // list 0 luma only
            {
                while (mindenom > 0 && !(minscale & 1))
                {
                    mindenom--;
                    minscale >>= 1;
                }
            }

            /* stay unweighted when nothing better was found, when the best candidate is
             * the identity weight, or when the cost improvement is below 0.2% */
            if (!bFound || (minscale == (1 << mindenom) && minoff == 0) || (float)minscore / origscore > 0.998f)
            {
                SET_WEIGHT(weights[plane], false, 1 << denom, denom, 0);
            }
            else
            {
                SET_WEIGHT(weights[plane], true, minscale, mindenom, minoff);
            }
        }

        if (weights[0].bPresentFlag)
        {
            // Make sure both chroma channels match
            if (weights[1].bPresentFlag != weights[2].bPresentFlag)
            {
                if (weights[1].bPresentFlag)
                    weights[2] = weights[1];
                else
                    weights[1] = weights[2];
            }
        }

        /* carry the denominators chosen for this list forward */
        lumaDenom = weights[0].log2WeightDenom;
        chromaDenom = weights[1].log2WeightDenom;

        /* reset weight states */
        /* every reference after the first is unweighted, using the denominators above */
        for (int ref = 1; ref < slice.m_numRefIdx[list]; ref++)
        {
            SET_WEIGHT(wp[list][ref][0], false, 1 << lumaDenom, lumaDenom, 0);
            SET_WEIGHT(wp[list][ref][1], false, 1 << chromaDenom, chromaDenom, 0);
            SET_WEIGHT(wp[list][ref][2], false, 1 << chromaDenom, chromaDenom, 0);
        }
    }

    X265_FREE(mcbuf);

    memcpy(slice.m_weightPredTable, wp, sizeof(WeightParam) * 2 * MAX_NUM_REF * 3); // publish the result to the slice

    /* At full log level, print the weights chosen for reference 0 of each list.
     * Each weighted plane is printed as weight/denominator followed by the signed
     * offset, e.g. " [L0:R0 Y{63/64+1}U{98/128+25}V{123/128+6}]" */
    if (param.logLevel >= X265_LOG_FULL)
    {
        char buf[1024];
        int p = 0;
        bool bWeighted = false;

        p = sprintf(buf, "poc: %d weights:", slice.m_poc);
        int numPredDir = slice.isInterP() ? 1 : 2;
        for (int list = 0; list < numPredDir; list++)
        {
            WeightParam* w = &wp[list][0][0];
            if (w[0].bPresentFlag || w[1].bPresentFlag || w[2].bPresentFlag)
            {
                bWeighted = true;
                p += sprintf(buf + p, " [L%d:R0 ", list);
                if (w[0].bPresentFlag)
                    p += sprintf(buf + p, "Y{%d/%d%+d}", w[0].inputWeight, 1 << w[0].log2WeightDenom, w[0].inputOffset);
                if (w[1].bPresentFlag)
                    p += sprintf(buf + p, "U{%d/%d%+d}", w[1].inputWeight, 1 << w[1].log2WeightDenom, w[1].inputOffset);
                if (w[2].bPresentFlag)
                    p += sprintf(buf + p, "V{%d/%d%+d}", w[2].inputWeight, 1 << w[2].log2WeightDenom, w[2].inputOffset);
                p += sprintf(buf + p, "]");
            }
        }

        if (bWeighted)
        {
            if (p < 80) // pad with spaces to ensure progress line overwritten
                sprintf(buf + p, "%*s", 80 - p, " ");
            x265_log(&param, X265_LOG_FULL, "%s\n", buf);
        }
    }
}
}