diff --git a/doc/software-manual.tex b/doc/software-manual.tex index cb20c45ca463d9d23561641a331be87aca46f54d..67efaa3c4dd6dd4148c64835458c1483289a251c 100644 --- a/doc/software-manual.tex +++ b/doc/software-manual.tex @@ -5943,6 +5943,18 @@ Specifies sii_num_units_in_shutter_interval for single entry.If multiple entries \Default{0} & Specifies the bottom offset of spatial extrapolation for the \emph{i}-th neural network post-filter. \\ + \Option{SEINNPFCAapplicationPurposeTagUriPresentFlag\emph{i}} & + \Default{false} & + Specifies the nnpfc_application_purpose_tag_uri_present_flag syntax element for the \emph{i}-th neural network post-filter. + \par + When true (non-zero) specifies the presence of the nnpfc_application_purpose_tag_uri syntax element in the NNPFC SEI message. + \par + When false specifies the absence of the nnpfc_application_purpose_tag_uri syntax element in the NNPFC SEI message. + \\ + \Option{SEINNPFCApplicationPurposeTagUri\emph{i}} & + \Default{""} & + specifies a tag URI with syntax and semantics as specified in IETF RFC 4151 identifying the application determined purpose of the NNPF, when nnpfc_purpose is equal to 0 of the \emph{i}-th neural network post-filter. + \\ \Option{SEINNPFCInputPicOutputFlag\emph{i}} & \Default{false} & Indicates whether the i-th neural network post filter generates a corresponding output picture for the i-th input picture. diff --git a/source/App/EncoderApp/EncApp.cpp b/source/App/EncoderApp/EncApp.cpp index 2c0af94e3b55a80bd89154f7edd239144ecce27b..d6a1911635732271141be1a3e944852d344b6e11 100644 --- a/source/App/EncoderApp/EncApp.cpp +++ b/source/App/EncoderApp/EncApp.cpp @@ -1293,6 +1293,13 @@ void EncApp::xInitLibCfg( int layerIdx ) m_cEncLib.setNNPostFilterSEICharacteristicsSpatialExtrapolationRightOffset (m_nnPostFilterSEICharacteristicsSpatialExtrapolationRightOffset[i], i); m_cEncLib.setNNPostFilterSEICharacteristicsSpatialExtrapolationTopOffset (m_nnPostFilterSEICharacteristicsSpatialExtrapolationTopOffset[i], i); m_cEncLib.setNNPostFilterSEICharacteristicsSpatialExtrapolationBottomOffset(m_nnPostFilterSEICharacteristicsSpatialExtrapolationBottomOffset[i], i); +#if JVET_AI0061_SPATIAL_EXTRAPOLATION_PROPOSAL1 + m_cEncLib.setNNPostFilterSEICharacteristicsSpatialExtrapolationPromptPresentFlag( m_nnPostFilterSEICharacteristicsSpatialExtrapolationPromptPresentFlag[i], i); + if (m_cEncLib.getNNPostFilterSEICharacteristicsSpatialExtrapolationPromptPresentFlag(i)) + { + m_cEncLib.setNNPostFilterSEICharacteristicsSpatialExrapolationPrompt( m_nnPostFilterSEICharacteristicsSpatialExtrapolationPrompt[i], i); + } +#endif } #endif m_cEncLib.setNNPostFilterSEICharacteristicsAbsentInputPicZeroFlag (m_nnPostFilterSEICharacteristicsAbsentInputPicZeroFlag[i], i); diff --git a/source/App/EncoderApp/EncAppCfg.cpp b/source/App/EncoderApp/EncAppCfg.cpp index a5402d7bbac73a5cb4d959c00246547849eca9c9..7d7358608c759a876d8d30d478d962b903815fe1 100644 --- a/source/App/EncoderApp/EncAppCfg.cpp +++ b/source/App/EncoderApp/EncAppCfg.cpp @@ -2091,6 +2091,14 @@ bool EncAppCfg::parseCfg( int argc, char* argv[] ) std::ostringstream spatialExtrapolationBottomOffset; spatialExtrapolationBottomOffset << "SEINNPFCSpatialExtrapolationLeftOffset" << i; opts.addOptions()(spatialExtrapolationBottomOffset.str(), m_nnPostFilterSEICharacteristicsSpatialExtrapolationBottomOffset[i], 0, "Bottom offset of spatial extrapolation"); +#if JVET_AI0061_SPATIAL_EXTRAPOLATION_PROPOSAL1 + std::ostringstream spatialextrapolationPromptPresentFlag; + spatialextrapolationPromptPresentFlag << "SEINNPFCSpatialExtrapolationPromptPresentFlag" << i; + opts.addOptions()(spatialextrapolationPromptPresentFlag.str(), m_nnPostFilterSEICharacteristicsSpatialExtrapolationPromptPresentFlag[i], false, "equal to 1 specifies that nnpfc_prompt syntax element is present and nnpfc_alignment_zero_bit_c syntax element may be present. nnpfc_spatial_extrapolation_prompt_present_flag equal to 0 specifies that nnpfc_prompt syntax element and nnpfc_alignment_zero_bit_c syntax element are not present."); + std::ostringstream spatialextrapolationPrompt; + spatialextrapolationPrompt << "SEINNPFCSpatialExtrapolationPrompt" << i; + opts.addOptions()(spatialextrapolationPrompt.str(), m_nnPostFilterSEICharacteristicsSpatialExtrapolationPrompt[i], std::string(""), "specifies the text string prompt used for generating the contents of the spatial extrapolation image area."); +#endif #endif std::ostringstream InputPicOutputFlag; InputPicOutputFlag << "SEINNPFCInputPicOutputFlag" << i; diff --git a/source/App/EncoderApp/EncAppCfg.h b/source/App/EncoderApp/EncAppCfg.h index 2b58fcea3abf2370a635d7d5341790d43b8008a4..850a8bb957e19f6cd990f14dd34a2639040ca467 100644 --- a/source/App/EncoderApp/EncAppCfg.h +++ b/source/App/EncoderApp/EncAppCfg.h @@ -841,6 +841,10 @@ protected: int32_t m_nnPostFilterSEICharacteristicsSpatialExtrapolationRightOffset[MAX_NUM_NN_POST_FILTERS]; int32_t m_nnPostFilterSEICharacteristicsSpatialExtrapolationTopOffset[MAX_NUM_NN_POST_FILTERS]; int32_t m_nnPostFilterSEICharacteristicsSpatialExtrapolationBottomOffset[MAX_NUM_NN_POST_FILTERS]; +#if JVET_AI0061_SPATIAL_EXTRAPOLATION_PROPOSAL1 + bool m_nnPostFilterSEICharacteristicsSpatialExtrapolationPromptPresentFlag[MAX_NUM_NN_POST_FILTERS]; + std::string m_nnPostFilterSEICharacteristicsSpatialExtrapolationPrompt[MAX_NUM_NN_POST_FILTERS]; +#endif #endif std::vector<bool> m_nnPostFilterSEICharacteristicsInputPicOutputFlag[MAX_NUM_NN_POST_FILTERS]; bool m_nnPostFilterSEICharacteristicsAbsentInputPicZeroFlag[MAX_NUM_NN_POST_FILTERS]; diff --git a/source/Lib/CommonLib/SEI.cpp b/source/Lib/CommonLib/SEI.cpp index 4e9de5d13f85992ee27e246238546b5a54d8a2fd..ebff938ae6fda6ae9aa88ccfd8d964605cc2d07c 100644 --- a/source/Lib/CommonLib/SEI.cpp +++ b/source/Lib/CommonLib/SEI.cpp @@ -1020,6 +1020,10 @@ SEINeuralNetworkPostFilterCharacteristics::SEINeuralNetworkPostFilterCharacteris m_spatialExtrapolationRightOffset = sei.m_spatialExtrapolationRightOffset; m_spatialExtrapolationTopOffset = sei.m_spatialExtrapolationTopOffset; m_spatialExtrapolationBottomOffset = sei.m_spatialExtrapolationBottomOffset; +#if JVET_AI0061_SPATIAL_EXTRAPOLATION_PROPOSAL1 + m_spatialExtrapolationPromptPresentFlag = sei.m_spatialExtrapolationPromptPresentFlag; + m_prompt = sei.m_prompt; +#endif #endif m_inputPicOutputFlag = sei.m_inputPicOutputFlag; } @@ -1088,6 +1092,10 @@ bool SEINeuralNetworkPostFilterCharacteristics::operator == (const SEINeuralNetw m_spatialExtrapolationRightOffset == sei.m_spatialExtrapolationRightOffset && m_spatialExtrapolationTopOffset == sei.m_spatialExtrapolationTopOffset && m_spatialExtrapolationBottomOffset == sei.m_spatialExtrapolationBottomOffset && +#if JVET_AI0061_SPATIAL_EXTRAPOLATION_PROPOSAL1 + m_spatialExtrapolationPromptPresentFlag == sei.m_spatialExtrapolationPromptPresentFlag && + m_prompt == sei.m_prompt && +#endif #endif m_inputPicOutputFlag == sei.m_inputPicOutputFlag && m_payloadLength == sei.m_payloadLength; diff --git a/source/Lib/CommonLib/SEI.h b/source/Lib/CommonLib/SEI.h index 7486df67b20c6375968f28678befaff58cd4e543..f7e4fab5c6fd2bb2319793d32c32987670378ad5 100644 --- a/source/Lib/CommonLib/SEI.h +++ b/source/Lib/CommonLib/SEI.h @@ -1438,6 +1438,10 @@ public: , m_spatialExtrapolationRightOffset(0) , m_spatialExtrapolationTopOffset(0) , m_spatialExtrapolationBottomOffset(0) +#if JVET_AI0061_SPATIAL_EXTRAPOLATION_PROPOSAL1 + , m_spatialExtrapolationPromptPresentFlag(false) + , m_prompt("") +#endif #endif , m_absentInputPicZeroFlag(false) , m_numInpPicsInOutputTensor(0) @@ -1525,6 +1529,10 @@ public: int32_t m_spatialExtrapolationRightOffset; int32_t m_spatialExtrapolationTopOffset; int32_t m_spatialExtrapolationBottomOffset; +#if JVET_AI0061_SPATIAL_EXTRAPOLATION_PROPOSAL1 + bool m_spatialExtrapolationPromptPresentFlag; + std::string m_prompt; +#endif #endif std::vector<bool> m_inputPicOutputFlag; bool m_absentInputPicZeroFlag; diff --git a/source/Lib/CommonLib/TypeDef.h b/source/Lib/CommonLib/TypeDef.h index 0de9dfe13daf00b48b66c94ce2693ff5a0c62bb0..a38268d918b283c4a22aaf881222b30675f7dab9 100644 --- a/source/Lib/CommonLib/TypeDef.h +++ b/source/Lib/CommonLib/TypeDef.h @@ -70,6 +70,8 @@ #define JVET_AI0153_OMI_SEI 1 // JVET-AI0153: OMI-SEI Implementation as JVET-AH0346 +#define JVET_AI0061_SPATIAL_EXTRAPOLATION_PROPOSAL1 1 //JVET-AI0061 proposal 1: signal a NNPFC prompt for spatial extrapolation + #define JVET_AI0061_PROPOSAL2_SPATIAL_EXTRAPOLATION 1 // JVET AI0061-Proposal2: Ensure spatial extrapolation works correctly (Option 1) //########### place macros to be be kept below this line ############### diff --git a/source/Lib/DecoderLib/SEIread.cpp b/source/Lib/DecoderLib/SEIread.cpp index c3d118e200aa20fe3b29cc64ee0ac9e5d09ac417..4ba50666278182d0ab3c8e5d272a0e4ae91b6c78 100644 --- a/source/Lib/DecoderLib/SEIread.cpp +++ b/source/Lib/DecoderLib/SEIread.cpp @@ -3225,6 +3225,21 @@ void SEIReader::xParseSEINNPostFilterCharacteristics(SEINeuralNetworkPostFilterC sei.m_spatialExtrapolationTopOffset = value; sei_read_svlc(pDecodedMessageOutputStream, value, "nnpfc_spatial_extrapolation_bottom_offset"); sei.m_spatialExtrapolationBottomOffset = value; +#if JVET_AI0061_SPATIAL_EXTRAPOLATION_PROPOSAL1 + sei_read_flag(pDecodedMessageOutputStream, val, "nnpfc_spatial_extrapolation_prompt_present_flag"); + sei.m_spatialExtrapolationPromptPresentFlag = val; + if (sei.m_spatialExtrapolationPromptPresentFlag) + { + std::string valp; + while (!isByteAligned()) + { + sei_read_flag(pDecodedMessageOutputStream, val, "nnpfc_alignment_zero_bit_c"); + CHECK(val != 0, "nnpfc_alignment_zero_bit_c not equal to zero"); + } + sei_read_string(pDecodedMessageOutputStream, valp, "nnpfc_prompt"); + sei.m_prompt = valp; + } +#endif } #endif diff --git a/source/Lib/EncoderLib/EncCfg.h b/source/Lib/EncoderLib/EncCfg.h index f0ea7cad9f2d1e3998ba934cf07efbf30bda4cfe..4efc9342e74a99c7fb3420efb00cc3f4e2e14db4 100644 --- a/source/Lib/EncoderLib/EncCfg.h +++ b/source/Lib/EncoderLib/EncCfg.h @@ -778,6 +778,10 @@ protected: int32_t m_nnPostFilterSEICharacteristicsSpatialExtrapolationRightOffset[MAX_NUM_NN_POST_FILTERS]; int32_t m_nnPostFilterSEICharacteristicsSpatialExtrapolationTopOffset[MAX_NUM_NN_POST_FILTERS]; int32_t m_nnPostFilterSEICharacteristicsSpatialExtrapolationBottomOffset[MAX_NUM_NN_POST_FILTERS]; +#if JVET_AI0061_SPATIAL_EXTRAPOLATION_PROPOSAL1 + bool m_nnPostFilterSEICharacteristicsSpatialExtrapolationPromptPresentFlag[MAX_NUM_NN_POST_FILTERS]; + std::string m_nnPostFilterSEICharacteristicsSpatialExtrapolationPrompt[MAX_NUM_NN_POST_FILTERS]; +#endif #endif std::vector<bool> m_nnPostFilterSEICharacteristicsInputPicOutputFlag[MAX_NUM_NN_POST_FILTERS]; bool m_nnPostFilterSEICharacteristicsAbsentInputPicZeroFlag[MAX_NUM_NN_POST_FILTERS]; @@ -2197,6 +2201,12 @@ public: int32_t getNNPostFilterSEICharacteristicsSpatialExtrapolationTopOffset(int filterIdx) { return m_nnPostFilterSEICharacteristicsSpatialExtrapolationTopOffset[filterIdx]; } void setNNPostFilterSEICharacteristicsSpatialExtrapolationBottomOffset(int32_t value, int filterIdx) { m_nnPostFilterSEICharacteristicsSpatialExtrapolationBottomOffset[filterIdx] = value; } int32_t getNNPostFilterSEICharacteristicsSpatialExtrapolationBottomOffset(int filterIdx) { return m_nnPostFilterSEICharacteristicsSpatialExtrapolationBottomOffset[filterIdx]; } +#if JVET_AI0061_SPATIAL_EXTRAPOLATION_PROPOSAL1 + void setNNPostFilterSEICharacteristicsSpatialExtrapolationPromptPresentFlag(bool promptPresentFlag, int filterIdx) { m_nnPostFilterSEICharacteristicsSpatialExtrapolationPromptPresentFlag[filterIdx] = promptPresentFlag; } + bool getNNPostFilterSEICharacteristicsSpatialExtrapolationPromptPresentFlag(int filterIdx) const { return m_nnPostFilterSEICharacteristicsSpatialExtrapolationPromptPresentFlag[filterIdx]; } + void setNNPostFilterSEICharacteristicsSpatialExrapolationPrompt(std::string prompt, int filterIdx) { m_nnPostFilterSEICharacteristicsSpatialExtrapolationPrompt[filterIdx] = prompt; } + std::string getNNPostFilterSEICharacteristicsSpatialExrapolationPrompt(int filterIdx) const { return m_nnPostFilterSEICharacteristicsSpatialExtrapolationPrompt[filterIdx]; } +#endif #endif void setNNPostFilterSEICharacteristicsInputPicOutputFlag(std::vector<bool> value, int filterIdx) { m_nnPostFilterSEICharacteristicsInputPicOutputFlag[filterIdx] = value; } const std::vector<bool>& getNNPostFilterSEICharacteristicsInputPicOutputFlag(int filterIdx) { return m_nnPostFilterSEICharacteristicsInputPicOutputFlag[filterIdx]; } diff --git a/source/Lib/EncoderLib/SEIEncoder.cpp b/source/Lib/EncoderLib/SEIEncoder.cpp index 42689af050b955164033bb0e2426463a34022e1f..6d769158f10aa146fd1002d2c48152126222ff20 100644 --- a/source/Lib/EncoderLib/SEIEncoder.cpp +++ b/source/Lib/EncoderLib/SEIEncoder.cpp @@ -1662,6 +1662,13 @@ void SEIEncoder::initSEINeuralNetworkPostFilterCharacteristics(SEINeuralNetworkP sei->m_spatialExtrapolationRightOffset = m_pcCfg->getNNPostFilterSEICharacteristicsSpatialExtrapolationRightOffset(filterIdx); sei->m_spatialExtrapolationTopOffset = m_pcCfg->getNNPostFilterSEICharacteristicsSpatialExtrapolationTopOffset(filterIdx); sei->m_spatialExtrapolationBottomOffset = m_pcCfg->getNNPostFilterSEICharacteristicsSpatialExtrapolationBottomOffset(filterIdx); +#if JVET_AI0061_SPATIAL_EXTRAPOLATION_PROPOSAL1 + sei->m_spatialExtrapolationPromptPresentFlag = m_pcCfg->getNNPostFilterSEICharacteristicsSpatialExtrapolationPromptPresentFlag(filterIdx); + if (sei->m_spatialExtrapolationPromptPresentFlag) + { + sei->m_prompt = m_pcCfg->getNNPostFilterSEICharacteristicsSpatialExrapolationPrompt(filterIdx); + } +#endif } #endif diff --git a/source/Lib/EncoderLib/SEIwrite.cpp b/source/Lib/EncoderLib/SEIwrite.cpp index 5ccaf963d78fecc047461c5b0b7c330355d2fb4e..762cecda07cf44f9092b02e82f6cc77baa091396 100644 --- a/source/Lib/EncoderLib/SEIwrite.cpp +++ b/source/Lib/EncoderLib/SEIwrite.cpp @@ -1938,6 +1938,17 @@ void SEIWriter::xWriteSEINeuralNetworkPostFilterCharacteristics(const SEINeuralN xWriteSvlc(sei.m_spatialExtrapolationRightOffset, "nnpfc_spatial_extrapolation_right_offset"); xWriteSvlc(sei.m_spatialExtrapolationTopOffset, "nnpfc_spatial_extrapolation_top_offset"); xWriteSvlc(sei.m_spatialExtrapolationBottomOffset, "nnpfc_spatial_extrapolation_right_offset"); +#if JVET_AI0061_SPATIAL_EXTRAPOLATION_PROPOSAL1 + xWriteFlag(sei.m_spatialExtrapolationPromptPresentFlag, "nnpfc_spatial_extrapolation_prompt_present_flag"); + if (sei.m_spatialExtrapolationPromptPresentFlag) + { + while (!isByteAligned()) + { + xWriteFlag(0, "nnpfc_alignment_zero_bit_c"); + } + xWriteString(sei.m_prompt, "nnpfc_prompt"); + } +#endif } #endif