/**************************************************************************
 *
 * Copyright 2013 Advanced Micro Devices, Inc.
 *
 * SPDX-License-Identifier: MIT
 *
 **************************************************************************/

#include "pipe/p_video_codec.h"
#include "radeon_vce.h"
#include "radeon_video.h"
#include "si_pipe.h"
#include "util/u_memory.h"
#include "util/u_video.h"
#include "vl/vl_video_buffer.h"

#include <stdio.h>

/**
 * Emit the session command.
 *
 * The packet carries a single payload word: the encoder's stream handle.
 */
static void session(struct rvce_encoder *enc)
{
   const uint32_t handle = enc->stream_handle;

   RVCE_BEGIN(0x00000001); // session cmd
   RVCE_CS(handle);        // stream handle
   RVCE_END();
}

/**
 * Emit a task info command.
 *
 * \param enc       encoder whose command stream is written
 * \param op        taskOperation word
 * \param dep       referencePictureDependency word
 * \param fb_idx    feedbackIndex word
 * \param ring_idx  videoBitstreamRingIndex word
 *
 * Tasks with op 0x3 (the value encode() passes) are linked together: the
 * command stream position of the most recent one is kept in
 * enc->task_info_idx, and when another one is emitted the word at that
 * position (its offsetOfNextTaskInfo) is overwritten with the distance to the
 * new packet.
 */
static void task_info(struct rvce_encoder *enc, uint32_t op, uint32_t dep, uint32_t fb_idx,
                      uint32_t ring_idx)
{
   RVCE_BEGIN(0x00000002); // task info

   // A previous op 0x3 task exists: update its offsetOfNextTaskInfo.
   if (op == 0x3 && enc->task_info_idx) {
      const uint32_t prev_idx = enc->task_info_idx;

      enc->cs.current.buf[prev_idx] = enc->cs.current.cdw - prev_idx + 3;
   }

   // Remember where this task's offsetOfNextTaskInfo word is about to land.
   if (op == 0x3)
      enc->task_info_idx = enc->cs.current.cdw;

   RVCE_CS(0xffffffff); // offsetOfNextTaskInfo
   RVCE_CS(op);         // taskOperation
   RVCE_CS(dep);        // referencePictureDependency
   RVCE_CS(0x00000000); // collocateFlagDependency
   RVCE_CS(fb_idx);     // feedbackIndex
   RVCE_CS(ring_idx);   // videoBitstreamRingIndex
   RVCE_END();
}

/**
 * Emit the feedback buffer command.
 *
 * The buffer behind enc->fb is added to the command stream through RVCE_WRITE
 * at offset 0, followed by a ring size of 1.
 */
static void feedback(struct rvce_encoder *enc)
{
   RVCE_BEGIN(0x05000005);                                    // feedback buffer
   RVCE_WRITE(enc->fb->res->buf, enc->fb->res->domains, 0x0); // feedbackRingAddressHi/Lo
   RVCE_CS(0x00000001);                                       // feedbackRingSize
   RVCE_END();
}

/**
 * Emit the create command, preceded by a task info packet with op 0x0.
 *
 * Profile, level and picture size come from the encoder base and the current
 * picture description; the reference picture pitches and height are derived
 * from the legacy surface layout of the luma and chroma planes.
 */
static void create(struct rvce_encoder *enc)
{
   enc->task_info(enc, 0x00000000, 0, 0, 0);

   // Pitches are blocks per row times bytes per element of the plane.
   const uint32_t luma_pitch = enc->luma->u.legacy.level[0].nblk_x * enc->luma->bpe;
   const uint32_t chroma_pitch = enc->chroma->u.legacy.level[0].nblk_x * enc->chroma->bpe;
   // Luma rows rounded up to a multiple of 16, then divided by 8.
   const uint32_t ref_y_height_qw = align(enc->luma->u.legacy.level[0].nblk_y, 16) / 8;

   RVCE_BEGIN(0x01000001);                             // create cmd
   RVCE_CS(0x00000000);                                // encUseCircularBuffer
   RVCE_CS(u_get_h264_profile_idc(enc->base.profile)); // encProfile
   RVCE_CS(enc->pic.seq.level_idc);                    // encLevel
   RVCE_CS(0x00000000);                                // encPicStructRestriction
   RVCE_CS(enc->base.width);                           // encImageWidth
   RVCE_CS(enc->base.height);                          // encImageHeight
   RVCE_CS(luma_pitch);                                // encRefPicLumaPitch
   RVCE_CS(chroma_pitch);                              // encRefPicChromaPitch
   RVCE_CS(ref_y_height_qw);                           // encRefYHeightInQw
   RVCE_CS(0x00000000); // encRefPic(Addr|Array)Mode, encPicStructRestriction, disableRDO
   RVCE_END();
}

/**
 * Emit the rate control command from enc->pic.rate_ctrl[0].
 *
 * Besides the values copied straight from the rate control description, three
 * per-picture budgets are derived from the bitrate and the frame rate
 * (bitrate * frame_rate_den / frame_rate_num):
 *  - target bits per picture,
 *  - integer part of the peak bits per picture,
 *  - fractional part of the peak bits per picture, scaled by 2^32.
 *
 * When frame_rate_num is zero these three words are emitted as 0. Computing
 * them would otherwise divide by zero (integer % and / by zero are undefined
 * behavior, and so is converting the resulting float infinity/NaN to an
 * integer).
 */
static void rate_control(struct rvce_encoder *enc)
{
   uint32_t target_bits_picture = 0;
   uint32_t peak_bits_picture_integer = 0;
   uint32_t peak_bits_picture_fraction = 0;

   // vui() treats a zero frame rate numerator as "no frame rate known";
   // do the same here instead of dividing by it.
   if (enc->pic.rate_ctrl[0].frame_rate_num) {
      target_bits_picture =
         enc->pic.rate_ctrl[0].target_bitrate *
         ((float)enc->pic.rate_ctrl[0].frame_rate_den /
         enc->pic.rate_ctrl[0].frame_rate_num);
      peak_bits_picture_integer =
         enc->pic.rate_ctrl[0].peak_bitrate *
         ((float)enc->pic.rate_ctrl[0].frame_rate_den /
         enc->pic.rate_ctrl[0].frame_rate_num);
      // Remainder of the exact 64-bit division, expressed in units of 2^-32.
      peak_bits_picture_fraction =
         (((enc->pic.rate_ctrl[0].peak_bitrate *
         (uint64_t)enc->pic.rate_ctrl[0].frame_rate_den) %
         enc->pic.rate_ctrl[0].frame_rate_num) << 32) /
         enc->pic.rate_ctrl[0].frame_rate_num;
   }

   RVCE_BEGIN(0x04000005);                                 // rate control
   RVCE_CS(enc->pic.rate_ctrl[0].rate_ctrl_method);        // encRateControlMethod
   RVCE_CS(enc->pic.rate_ctrl[0].target_bitrate);          // encRateControlTargetBitRate
   RVCE_CS(enc->pic.rate_ctrl[0].peak_bitrate);            // encRateControlPeakBitRate
   RVCE_CS(enc->pic.rate_ctrl[0].frame_rate_num);          // encRateControlFrameRateNum
   RVCE_CS(0x00000000);                                    // encGOPSize
   RVCE_CS(enc->pic.quant_i_frames);                       // encQP_I
   RVCE_CS(enc->pic.quant_p_frames);                       // encQP_P
   RVCE_CS(enc->pic.quant_b_frames);                       // encQP_B
   RVCE_CS(enc->pic.rate_ctrl[0].vbv_buffer_size);         // encVBVBufferSize
   RVCE_CS(enc->pic.rate_ctrl[0].frame_rate_den);          // encRateControlFrameRateDen
   RVCE_CS(0x00000000);                                    // encVBVBufferLevel
   RVCE_CS(0x00000000);                                    // encMaxAUSize
   RVCE_CS(0x00000000);                                    // encQPInitialMode
   RVCE_CS(target_bits_picture);                           // encTargetBitsPerPicture
   RVCE_CS(peak_bits_picture_integer);                     // encPeakBitsPerPictureInteger
   RVCE_CS(peak_bits_picture_fraction);                    // encPeakBitsPerPictureFractional
   RVCE_CS(0x00000000);                                    // encMinQP
   RVCE_CS(0x00000033);                                    // encMaxQP
   RVCE_CS(0x00000000);                                    // encSkipFrameEnable
   RVCE_CS(0x00000000);                                    // encFillerDataEnable
   RVCE_CS(0x00000000);                                    // encEnforceHRD
   RVCE_CS(0x00000000);                                    // encBPicsDeltaQP
   RVCE_CS(0x00000000);                                    // encReferenceBPicsDeltaQP
   RVCE_CS(0x00000000);                                    // encRateControlReInitDisable
   RVCE_END();
}

/**
 * Emit the config extension command.
 *
 * The single payload word is the constant 0x3, labelled encEnablePerfLogging.
 */
static void config_extension(struct rvce_encoder *enc)
{
   RVCE_BEGIN(0x04000001); // config extension
   RVCE_CS(0x00000003);    // encEnablePerfLogging
   RVCE_END();
}

/**
 * Emit the picture control command.
 *
 * Values derived from the encoder base:
 *  - right/bottom crop offsets: half of the padding added when width/height
 *    are rounded up to a multiple of 16,
 *  - macroblocks per slice: the number of 16x16 blocks in the padded picture,
 *    i.e. the whole picture,
 *  - B picture pattern and reference frame counts, from max_references.
 * All other fields are fixed constants.
 */
static void pic_control(struct rvce_encoder *enc)
{
   const unsigned max_refs = enc->base.max_references;
   // 16x16 blocks per row times 16x16 blocks per column.
   const unsigned mbs_per_slice =
      (unsigned)(align(enc->base.width, 16) / 16) * (align(enc->base.height, 16) / 16);

   RVCE_BEGIN(0x04000002);                                         // pic control
   RVCE_CS(0x00000000);                                            // encUseConstrainedIntraPred
   RVCE_CS(0x00000000);                                            // encCABACEnable
   RVCE_CS(0x00000000);                                            // encCABACIDC
   RVCE_CS(0x00000000);                                            // encLoopFilterDisable
   RVCE_CS(0x00000000);                                            // encLFBetaOffset
   RVCE_CS(0x00000000);                                            // encLFAlphaC0Offset
   RVCE_CS(0x00000000);                                            // encCropLeftOffset
   RVCE_CS((align(enc->base.width, 16) - enc->base.width) >> 1);   // encCropRightOffset
   RVCE_CS(0x00000000);                                            // encCropTopOffset
   RVCE_CS((align(enc->base.height, 16) - enc->base.height) >> 1); // encCropBottomOffset
   RVCE_CS(mbs_per_slice);                                         // encNumMBsPerSlice
   RVCE_CS(0x00000000);                                            // encIntraRefreshNumMBsPerSlot
   RVCE_CS(0x00000000);                                            // encForceIntraRefresh
   RVCE_CS(0x00000000);                                            // encForceIMBPeriod
   RVCE_CS(0x00000000);                                            // encPicOrderCntType
   RVCE_CS(0x00000000);                                            // log2_max_pic_order_cnt_lsb_minus4
   RVCE_CS(0x00000000);                                            // encSPSID
   RVCE_CS(0x00000000);                                            // encPPSID
   RVCE_CS(0x00000040);                                            // encConstraintSetFlags
   RVCE_CS(MAX2(max_refs, 1) - 1);                                 // encBPicPattern
   RVCE_CS(0x00000000);                                            // weightPredModeBPicture
   RVCE_CS(MIN2(max_refs, 2));                                     // encNumberOfReferenceFrames
   RVCE_CS(max_refs + 1);                                          // encMaxNumRefFrames
   RVCE_CS(0x00000001);                                            // encNumDefaultActiveRefL0
   RVCE_CS(0x00000001);                                            // encNumDefaultActiveRefL1
   RVCE_CS(0x00000000);                                            // encSliceMode
   RVCE_CS(0x00000000);                                            // encMaxSliceSize
   RVCE_END();
}

/**
 * Emit the motion estimation command.
 *
 * Every payload word is a fixed constant, so the packet body is kept in a
 * table and copied to the command stream in table order.
 */
static void motion_estimation(struct rvce_encoder *enc)
{
   static const uint32_t me_words[] = {
      0x00000001, // encIMEDecimationSearch
      0x00000001, // motionEstHalfPixel
      0x00000000, // motionEstQuarterPixel
      0x00000000, // disableFavorPMVPoint
      0x00000000, // forceZeroPointCenter
      0x00000000, // LSMVert
      0x00000010, // encSearchRangeX
      0x00000010, // encSearchRangeY
      0x00000010, // encSearch1RangeX
      0x00000010, // encSearch1RangeY
      0x00000000, // disable16x16Frame1
      0x00000000, // disableSATD
      0x00000000, // enableAMD
      0x000000fe, // encDisableSubMode
      0x00000000, // encIMESkipX
      0x00000000, // encIMESkipY
      0x00000000, // encEnImeOverwDisSubm
      0x00000000, // encImeOverwDisSubmNo
      0x00000001, // encIME2SearchRangeX
      0x00000001, // encIME2SearchRangeY
      0x00000000, // parallelModeSpeedupEnable
      0x00000000, // fme0_encDisableSubMode
      0x00000000, // fme1_encDisableSubMode
      0x00000000, // imeSWSpeedupEnable
   };

   RVCE_BEGIN(0x04000007); // motion estimation
   for (unsigned w = 0; w < sizeof(me_words) / sizeof(me_words[0]); ++w)
      RVCE_CS(me_words[w]);
   RVCE_END();
}

/**
 * Emit the rdo command.
 *
 * All seventeen payload words are zero; the table keeps the field name of
 * each position next to its value.
 */
static void rdo(struct rvce_encoder *enc)
{
   static const uint32_t rdo_words[] = {
      0x00000000, // encDisableTbePredIFrame
      0x00000000, // encDisableTbePredPFrame
      0x00000000, // useFmeInterpolY
      0x00000000, // useFmeInterpolUV
      0x00000000, // useFmeIntrapolY
      0x00000000, // useFmeIntrapolUV
      0x00000000, // useFmeInterpolY_1
      0x00000000, // useFmeInterpolUV_1
      0x00000000, // useFmeIntrapolY_1
      0x00000000, // useFmeIntrapolUV_1
      0x00000000, // enc16x16CostAdj
      0x00000000, // encSkipCostAdj
      0x00000000, // encForce16x16skip
      0x00000000, // encDisableThresholdCalcA
      0x00000000, // encLumaCoeffCost
      0x00000000, // encLumaMBCoeffCost
      0x00000000, // encChromaCoeffCost
   };

   RVCE_BEGIN(0x04000008); // rdo
   for (unsigned w = 0; w < sizeof(rdo_words) / sizeof(rdo_words[0]); ++w)
      RVCE_CS(rdo_words[w]);
   RVCE_END();
}

/**
 * Emit the vui command.
 *
 * Nothing is emitted when the frame rate numerator of enc->pic.rate_ctrl[0]
 * is zero. Otherwise the only non-constant fields are the timing info:
 * numUnitsInTick is the frame rate denominator and timeScale is twice the
 * frame rate numerator.
 */
static void vui(struct rvce_encoder *enc)
{
   const uint32_t rate_num = enc->pic.rate_ctrl[0].frame_rate_num;
   const uint32_t rate_den = enc->pic.rate_ctrl[0].frame_rate_den;

   // No frame rate, no timing info to describe.
   if (rate_num == 0)
      return;

   RVCE_BEGIN(0x04000009); // vui
   RVCE_CS(0x00000000);    // aspectRatioInfoPresentFlag
   RVCE_CS(0x00000000);    // aspectRatioInfo.aspectRatioIdc
   RVCE_CS(0x00000000);    // aspectRatioInfo.sarWidth
   RVCE_CS(0x00000000);    // aspectRatioInfo.sarHeight
   RVCE_CS(0x00000000);    // overscanInfoPresentFlag
   RVCE_CS(0x00000000);    // overScanInfo.overscanAppropFlag
   RVCE_CS(0x00000000);    // videoSignalTypePresentFlag
   RVCE_CS(0x00000005);    // videoSignalTypeInfo.videoFormat
   RVCE_CS(0x00000000);    // videoSignalTypeInfo.videoFullRangeFlag
   RVCE_CS(0x00000000);    // videoSignalTypeInfo.colorDescriptionPresentFlag
   RVCE_CS(0x00000002);    // videoSignalTypeInfo.colorPrim
   RVCE_CS(0x00000002);    // videoSignalTypeInfo.transferChar
   RVCE_CS(0x00000002);    // videoSignalTypeInfo.matrixCoef
   RVCE_CS(0x00000000);    // chromaLocInfoPresentFlag
   RVCE_CS(0x00000000);    // chromaLocInfo.chromaLocTop
   RVCE_CS(0x00000000);    // chromaLocInfo.chromaLocBottom
   RVCE_CS(0x00000001);    // timingInfoPresentFlag
   RVCE_CS(rate_den);      // timingInfo.numUnitsInTick
   RVCE_CS(rate_num * 2);  // timingInfo.timeScale
   RVCE_CS(0x00000001);    // timingInfo.fixedFrameRateFlag
   RVCE_CS(0x00000000);    // nalHRDParametersPresentFlag
   RVCE_CS(0x00000000);    // hrdParam.cpbCntMinus1
   RVCE_CS(0x00000004);    // hrdParam.bitRateScale
   RVCE_CS(0x00000006);    // hrdParam.cpbSizeScale

   // 32 HRD entries of three zero words each.
   for (unsigned entry = 0; entry < 32; ++entry) {
      RVCE_CS(0x00000000); // hrdParam.bitRateValueMinus
      RVCE_CS(0x00000000); // hrdParam.cpbSizeValueMinus
      RVCE_CS(0x00000000); // hrdParam.cbrFlag
   }

   RVCE_CS(0x00000017); // hrdParam.initialCpbRemovalDelayLengthMinus1
   RVCE_CS(0x00000017); // hrdParam.cpbRemovalDelayLengthMinus1
   RVCE_CS(0x00000017); // hrdParam.dpbOutputDelayLengthMinus1
   RVCE_CS(0x00000018); // hrdParam.timeOffsetLength
   RVCE_CS(0x00000000); // lowDelayHRDFlag
   RVCE_CS(0x00000000); // picStructPresentFlag
   RVCE_CS(0x00000000); // bitstreamRestrictionPresentFlag
   RVCE_CS(0x00000001); // bitstreamRestrictions.motionVectorsOverPicBoundariesFlag
   RVCE_CS(0x00000002); // bitstreamRestrictions.maxBytesPerPicDenom
   RVCE_CS(0x00000001); // bitstreamRestrictions.maxBitsPerMbDenom
   RVCE_CS(0x00000010); // bitstreamRestrictions.log2MaxMvLengthHori
   RVCE_CS(0x00000010); // bitstreamRestrictions.log2MaxMvLengthVert
   RVCE_CS(0x00000003); // bitstreamRestrictions.numReorderFrames
   RVCE_CS(0x00000003); // bitstreamRestrictions.maxDecFrameBuffering
   RVCE_END();
}

/**
 * Emit the configuration sequence.
 *
 * A task info packet with op 0x2 and feedback index 0xffffffff is followed by
 * the rate control, config extension, motion estimation, rdo and picture
 * control packets. The vui packet is inserted before picture control only
 * when enc->use_vui is set. Every packet is emitted through the encoder's
 * function pointers, not by calling this file's functions directly.
 */
static void config(struct rvce_encoder *enc)
{
   enc->task_info(enc, 0x00000002, 0, 0xffffffff, 0);
   enc->rate_control(enc);
   enc->config_extension(enc);
   enc->motion_estimation(enc);
   enc->rdo(enc);
   if (enc->use_vui)
      enc->vui(enc);
   enc->pic_control(enc);
}

/**
 * Emit the command sequence that encodes the current picture.
 *
 * In order: a task info packet with op 0x3, the context buffer packet
 * (enc->cpb), the video bitstream buffer packet (enc->bs_handle /
 * enc->bs_size) and the encode packet itself.
 *
 * The encode packet references the input picture planes inside enc->handle,
 * describes the picture type and reference list modification, and then lists
 * the reference pictures:
 *  - L0[0] is filled from si_l0_slot() for P and B pictures,
 *  - L0[1] is never used,
 *  - L1[0] is filled from si_l1_slot() for B pictures only.
 * Unused reference entries carry 0xffffffff as luma/chroma offset. The
 * reconstructed picture offsets come from si_current_slot().
 */
static void encode(struct rvce_encoder *enc)
{
   signed luma_offset, chroma_offset;
   int i;

   enc->task_info(enc, 0x00000003, 0, 0, 0);

   RVCE_BEGIN(0x05000001);                                        // context buffer
   RVCE_READWRITE(enc->cpb.res->buf, enc->cpb.res->domains, 0x0); // encodeContextAddressHi/Lo
   RVCE_END();

   RVCE_BEGIN(0x05000004);                             // video bitstream buffer
   RVCE_WRITE(enc->bs_handle, RADEON_DOMAIN_GTT, 0x0); // videoBitstreamRingAddressHi/Lo
   RVCE_CS(enc->bs_size);                              // videoBitstreamRingSize
   RVCE_END();

   RVCE_BEGIN(0x03000001); // encode
   RVCE_CS(0x00000000);    // insertHeaders
   RVCE_CS(0x00000000);    // pictureStructure
   RVCE_CS(enc->bs_size);  // allowedMaxBitstreamSize
   RVCE_CS(0x00000000);    // forceRefreshMap
   RVCE_CS(0x00000000);    // insertAUD
   RVCE_CS(0x00000000);    // endOfSequence
   RVCE_CS(0x00000000);    // endOfStream
   // Plane offsets are stored in units of 256 bytes; widen before scaling.
   RVCE_READ(enc->handle, RADEON_DOMAIN_VRAM,
             (uint64_t)enc->luma->u.legacy.level[0].offset_256B * 256); // inputPictureLumaAddressHi/Lo
   RVCE_READ(enc->handle, RADEON_DOMAIN_VRAM,
             (uint64_t)enc->chroma->u.legacy.level[0].offset_256B * 256);              // inputPictureChromaAddressHi/Lo
   RVCE_CS(align(enc->luma->u.legacy.level[0].nblk_y, 16));       // encInputFrameYPitch
   RVCE_CS(enc->luma->u.legacy.level[0].nblk_x * enc->luma->bpe); // encInputPicLumaPitch
   RVCE_CS(enc->chroma->u.legacy.level[0].nblk_x * enc->chroma->bpe); // encInputPicChromaPitch
   RVCE_CS(0x00000000);                                               // encInputPic(Addr|Array)Mode
   RVCE_CS(0x00000000);                                               // encInputPicTileConfig
   RVCE_CS(enc->pic.picture_type);                                    // encPicType
   RVCE_CS(enc->pic.picture_type == PIPE_H2645_ENC_PICTURE_TYPE_IDR); // encIdrFlag
   RVCE_CS(0x00000000);                                               // encIdrPicId
   RVCE_CS(0x00000000);                                               // encMGSKeyPic
   RVCE_CS(!enc->pic.not_referenced);                                 // encReferenceFlag
   RVCE_CS(0x00000000);                                               // encTemporalLayerIndex
   RVCE_CS(0x00000000); // num_ref_idx_active_override_flag
   RVCE_CS(0x00000000); // num_ref_idx_l0_active_minus1
   RVCE_CS(0x00000000); // num_ref_idx_l1_active_minus1

   // Distance between this picture's frame number and its first L0 reference.
   // A P picture whose reference is more than one frame back gets a reference
   // list modification entry; everything else gets an empty one.
   i = enc->pic.frame_num - enc->pic.ref_idx_l0_list[0];
   if (i > 1 && enc->pic.picture_type == PIPE_H2645_ENC_PICTURE_TYPE_P) {
      RVCE_CS(0x00000001); // encRefListModificationOp
      RVCE_CS(i - 1);      // encRefListModificationNum
   } else {
      RVCE_CS(0x00000000); // encRefListModificationOp
      RVCE_CS(0x00000000); // encRefListModificationNum
   }

   // Three further reference list modification entries, all empty.
   for (i = 0; i < 3; ++i) {
      RVCE_CS(0x00000000); // encRefListModificationOp
      RVCE_CS(0x00000000); // encRefListModificationNum
   }
   // Four decoded picture marking entries, all empty.
   for (i = 0; i < 4; ++i) {
      RVCE_CS(0x00000000); // encDecodedPictureMarkingOp
      RVCE_CS(0x00000000); // encDecodedPictureMarkingNum
      RVCE_CS(0x00000000); // encDecodedPictureMarkingIdx
      RVCE_CS(0x00000000); // encDecodedRefBasePictureMarkingOp
      RVCE_CS(0x00000000); // encDecodedRefBasePictureMarkingNum
   }

   // encReferencePictureL0[0]
   RVCE_CS(0x00000000); // pictureStructure
   if (enc->pic.picture_type == PIPE_H2645_ENC_PICTURE_TYPE_P ||
       enc->pic.picture_type == PIPE_H2645_ENC_PICTURE_TYPE_B) {
      struct rvce_cpb_slot *l0 = si_l0_slot(enc);
      si_vce_frame_offset(enc, l0, &luma_offset, &chroma_offset);
      RVCE_CS(l0->picture_type);  // encPicType
      RVCE_CS(l0->frame_num);     // frameNumber
      RVCE_CS(l0->pic_order_cnt); // pictureOrderCount
      RVCE_CS(luma_offset);       // lumaOffset
      RVCE_CS(chroma_offset);     // chromaOffset
   } else {
      RVCE_CS(0x00000000); // encPicType
      RVCE_CS(0x00000000); // frameNumber
      RVCE_CS(0x00000000); // pictureOrderCount
      RVCE_CS(0xffffffff); // lumaOffset
      RVCE_CS(0xffffffff); // chromaOffset
   }

   // encReferencePictureL0[1]
   RVCE_CS(0x00000000); // pictureStructure
   RVCE_CS(0x00000000); // encPicType
   RVCE_CS(0x00000000); // frameNumber
   RVCE_CS(0x00000000); // pictureOrderCount
   RVCE_CS(0xffffffff); // lumaOffset
   RVCE_CS(0xffffffff); // chromaOffset

   // encReferencePictureL1[0]
   RVCE_CS(0x00000000); // pictureStructure
   if (enc->pic.picture_type == PIPE_H2645_ENC_PICTURE_TYPE_B) {
      struct rvce_cpb_slot *l1 = si_l1_slot(enc);
      si_vce_frame_offset(enc, l1, &luma_offset, &chroma_offset);
      RVCE_CS(l1->picture_type);  // encPicType
      RVCE_CS(l1->frame_num);     // frameNumber
      RVCE_CS(l1->pic_order_cnt); // pictureOrderCount
      RVCE_CS(luma_offset);       // lumaOffset
      RVCE_CS(chroma_offset);     // chromaOffset
   } else {
      RVCE_CS(0x00000000); // encPicType
      RVCE_CS(0x00000000); // frameNumber
      RVCE_CS(0x00000000); // pictureOrderCount
      RVCE_CS(0xffffffff); // lumaOffset
      RVCE_CS(0xffffffff); // chromaOffset
   }

   // Offsets for the reconstructed picture come from the current slot.
   si_vce_frame_offset(enc, si_current_slot(enc), &luma_offset, &chroma_offset);
   RVCE_CS(luma_offset);            // encReconstructedLumaOffset
   RVCE_CS(chroma_offset);          // encReconstructedChromaOffset
   RVCE_CS(0x00000000);             // encColocBufferOffset
   RVCE_CS(0x00000000);             // encReconstructedRefBasePictureLumaOffset
   RVCE_CS(0x00000000);             // encReconstructedRefBasePictureChromaOffset
   RVCE_CS(0x00000000);             // encReferenceRefBasePictureLumaOffset
   RVCE_CS(0x00000000);             // encReferenceRefBasePictureChromaOffset
   RVCE_CS(0x00000000);             // pictureCount
   RVCE_CS(enc->pic.frame_num);     // frameNumber
   RVCE_CS(enc->pic.pic_order_cnt); // pictureOrderCount
   RVCE_CS(0x00000000);             // numIPicRemainInRCGOP
   RVCE_CS(0x00000000);             // numPPicRemainInRCGOP
   RVCE_CS(0x00000000);             // numBPicRemainInRCGOP
   RVCE_CS(0x00000000);             // numIRPicRemainInRCGOP
   RVCE_CS(0x00000000);             // enableIntraRefresh
   RVCE_END();
}

/**
 * Emit the destroy sequence: a task info packet with op 0x1, the feedback
 * buffer packet and the (payload-less) destroy command.
 *
 * Note that the feedback packet is emitted by calling this file's feedback()
 * directly rather than through enc->feedback.
 */
static void destroy(struct rvce_encoder *enc)
{
   enc->task_info(enc, 0x00000001, 0, 0, 0);

   feedback(enc);

   RVCE_BEGIN(0x02000001); // destroy
   RVCE_END();
}

/**
 * Picture parameter hook for this firmware interface.
 *
 * Intentionally does nothing: every emitter in this file reads its values
 * directly from enc->pic and enc->base when the command is written.
 */
void si_vce_40_2_2_get_param(struct rvce_encoder *enc, struct pipe_h264_enc_picture_desc *pic)
{
   (void)enc;
   (void)pic;
}

/**
 * Install this file's command emitters into the encoder's function pointers.
 */
void si_vce_40_2_2_init(struct rvce_encoder *enc)
{
   // Session setup and teardown.
   enc->session = session;
   enc->create = create;
   enc->destroy = destroy;

   // Packets shared by several sequences.
   enc->task_info = task_info;
   enc->feedback = feedback;

   // Configuration sequence and the packets it emits.
   enc->config = config;
   enc->rate_control = rate_control;
   enc->config_extension = config_extension;
   enc->motion_estimation = motion_estimation;
   enc->rdo = rdo;
   enc->vui = vui;
   enc->pic_control = pic_control;

   // Per-picture work.
   enc->encode = encode;
   enc->si_get_pic_param = si_vce_40_2_2_get_param;
}
