[x265] [PATCH] Disable fall-back on traditional scenecut algorithm with --hist-scenecut
Aruna Matheswaran
aruna at multicorewareinc.com
Fri Jul 30 08:47:55 UTC 2021
On Thu, Jun 24, 2021 at 2:18 PM Pooja Venkatesan <pooja at multicorewareinc.com>
wrote:
> From f6c1b86d99ab3a0dd57204f930e526a07e28fed7 Mon Sep 17 00:00:00 2001
> From: Praveen Karadugattu <praveenkumar at multicorewareinc.com>
> Date: Sun, 20 Jun 2021 21:20:50 +0530
> Subject: [PATCH] Disable fall-back on traditional scenecut algorithm with
> --hist-scenecut
>
> ---
> doc/reST/cli.rst | 9 +++++++--
> source/CMakeLists.txt | 2 +-
> source/common/param.cpp | 8 +++++++-
> source/encoder/encoder.cpp | 17 ++++++++++++-----
> source/encoder/slicetype.cpp | 15 ++++++++++-----
> source/test/regression-tests.txt | 1 +
> source/x265.h | 4 ++++
> source/x265cli.h | 1 +
> 8 files changed, 43 insertions(+), 14 deletions(-)
>
> diff --git a/doc/reST/cli.rst b/doc/reST/cli.rst
> index 4154221af..280b734b3 100755
> --- a/doc/reST/cli.rst
> +++ b/doc/reST/cli.rst
> @@ -1470,7 +1470,8 @@ Slice decision options
> .. option:: --hist-scenecut, --no-hist-scenecut
>
> Indicates that scenecuts need to be detected using luma edge and chroma
> histograms.
> - :option:`--hist-scenecut` enables scenecut detection using the
> histograms and disables the default scene cut algorithm.
> + :option:`--hist-scenecut` enables scenecut detection using the
> histograms.
> + It also uses the intra and inter cost info to arrive at a scenecut
> decision from the default scenecut method.
> :option:`--no-hist-scenecut` disables histogram based scenecut algorithm.
>
> .. option:: --hist-threshold <0.0..1.0>
> @@ -1480,7 +1481,11 @@ Slice decision options
> greater than 0.2 against the previous frame as scenecut.
> Increasing the threshold reduces the number of scenecuts detected.
> Default 0.03.
> -
> +
> +.. option:: --disable-traditional-scenecut
> +
> + Indicates that the usage of traditional scenecut detection using intra
> and inter cost should be disabled when :option:`--hist-scenecut` is used.
> +
> .. option:: --radl <integer>
>
> Number of RADL pictures allowed infront of IDR. Requires closed gop
> interval.
> diff --git a/source/CMakeLists.txt b/source/CMakeLists.txt
> index b4e57b592..f4a9cb793 100755
> --- a/source/CMakeLists.txt
> +++ b/source/CMakeLists.txt
> @@ -29,7 +29,7 @@ option(NATIVE_BUILD "Target the build CPU" OFF)
> option(STATIC_LINK_CRT "Statically link C runtime for release builds" OFF)
> mark_as_advanced(FPROFILE_USE FPROFILE_GENERATE NATIVE_BUILD)
> # X265_BUILD must be incremented each time the public API is changed
> -set(X265_BUILD 200)
> +set(X265_BUILD 201)
> configure_file("${PROJECT_SOURCE_DIR}/x265.def.in"
> "${PROJECT_BINARY_DIR}/x265.def")
> configure_file("${PROJECT_SOURCE_DIR}/x265_config.h.in"
> diff --git a/source/common/param.cpp b/source/common/param.cpp
> index 8a27aaef3..3b84415c3 100755
> --- a/source/common/param.cpp
> +++ b/source/common/param.cpp
> @@ -172,6 +172,7 @@ void x265_param_default(x265_param* param)
> param->scenecutThreshold = 40; /* Magic number pulled in from x264 */
> param->edgeTransitionThreshold = 0.03;
> param->bHistBasedSceneCut = 0;
> + param->bDisableTradScdInHscd = 0;
> param->lookaheadSlices = 8;
> param->lookaheadThreads = 0;
> param->scenecutBias = 5.0;
> @@ -598,6 +599,7 @@ int x265_param_default_preset(x265_param* param, const
> char* preset, const char*
> param->lookaheadDepth = 0;
> param->scenecutThreshold = 0;
> param->bHistBasedSceneCut = 0;
> + param->bDisableTradScdInHscd = 0;
> param->rc.cuTree = 0;
> param->frameNumThreads = 1;
> }
> @@ -953,6 +955,7 @@ int x265_param_parse(x265_param* p, const char* name,
> const char* value)
> bError = false;
> p->scenecutThreshold = atoi(value);
> p->bHistBasedSceneCut = 0;
> + p->bDisableTradScdInHscd = 0;
> }
> }
> OPT("temporal-layers") p->bEnableTemporalSubLayers = atobool(value);
> @@ -1234,6 +1237,7 @@ int x265_param_parse(x265_param* p, const char*
> name, const char* value)
> }
> }
> OPT("hist-threshold") p->edgeTransitionThreshold = atof(value);
> + OPT("disable-traditional-scenecut") p->bDisableTradScdInHscd =
> atobool(value);
> OPT("rskip-edge-threshold") p->edgeVarThreshold =
> atoi(value)/100.0f;
> OPT("lookahead-threads") p->lookaheadThreads = atoi(value);
> OPT("opt-cu-delta-qp") p->bOptCUDeltaQP = atobool(value);
> @@ -2151,7 +2155,8 @@ char *x265_param2string(x265_param* p, int padx, int
> pady)
> s += sprintf(s, " rc-lookahead=%d", p->lookaheadDepth);
> s += sprintf(s, " lookahead-slices=%d", p->lookaheadSlices);
> s += sprintf(s, " scenecut=%d", p->scenecutThreshold);
> - s += sprintf(s, " hist-scenecut=%d", p->bHistBasedSceneCut);
> + BOOL(p->bHistBasedSceneCut, "hist-scenecut");
> + BOOL(p->bDisableTradScdInHscd, "disable-traditional-scenecut");
>
[AM] This will add invalid CLI option "no-disable-traditional-scenecut" to
info-sei. Please fix this.
> s += sprintf(s, " radl=%d", p->radl);
> BOOL(p->bEnableHRDConcatFlag, "splice");
> BOOL(p->bIntraRefresh, "intra-refresh");
> @@ -2467,6 +2472,7 @@ void x265_copy_params(x265_param* dst, x265_param*
> src)
> dst->lookaheadThreads = src->lookaheadThreads;
> dst->scenecutThreshold = src->scenecutThreshold;
> dst->bHistBasedSceneCut = src->bHistBasedSceneCut;
> + dst->bDisableTradScdInHscd = src->bDisableTradScdInHscd;
> dst->bIntraRefresh = src->bIntraRefresh;
> dst->maxCUSize = src->maxCUSize;
> dst->minCUSize = src->minCUSize;
> diff --git a/source/encoder/encoder.cpp b/source/encoder/encoder.cpp
> index c1e1cb46d..dfb872889 100644
> --- a/source/encoder/encoder.cpp
> +++ b/source/encoder/encoder.cpp
> @@ -3680,6 +3680,7 @@ void Encoder::configure(x265_param *p)
> p->keyframeMax = INT_MAX;
> p->scenecutThreshold = 0;
> p->bHistBasedSceneCut = 0;
> + p->bDisableTradScdInHscd = 0;
> }
> else if (p->keyframeMax <= 1)
> {
> @@ -3694,6 +3695,7 @@ void Encoder::configure(x265_param *p)
> p->bframes = 0;
> p->scenecutThreshold = 0;
> p->bHistBasedSceneCut = 0;
> + p->bDisableTradScdInHscd = 0;
> p->bFrameAdaptive = 0;
> p->rc.cuTree = 0;
> p->bEnableWeightedPred = 0;
> @@ -4421,12 +4423,17 @@ void Encoder::configure(x265_param *p)
> m_param->searchRange = m_param->hmeRange[2];
> }
>
> - if (p->bHistBasedSceneCut && !p->edgeTransitionThreshold)
> - {
> - p->edgeTransitionThreshold = 0.03;
> - x265_log(p, X265_LOG_WARNING, "using default threshold %.2lf for
> scene cut detection\n", p->edgeTransitionThreshold);
> - }
> + if (p->bHistBasedSceneCut && !p->edgeTransitionThreshold)
> + {
> + p->edgeTransitionThreshold = 0.03;
> + x265_log(p, X265_LOG_WARNING, "using default threshold %.2lf for
> scene cut detection.\n", p->edgeTransitionThreshold);
> + }
>
> + if (!p->bHistBasedSceneCut && p->bDisableTradScdInHscd)
> + {
> + p->bDisableTradScdInHscd = 0;
> + x265_log(p, X265_LOG_WARNING, "option
> --disable-traditional-scenecut requires --hist-scenecut to be enabled.\n");
> + }
> }
>
> void Encoder::readAnalysisFile(x265_analysis_data* analysis, int curPoc,
> const x265_picture* picIn, int paramBytes)
> diff --git a/source/encoder/slicetype.cpp b/source/encoder/slicetype.cpp
> index 0adb0d0db..ace3b5469 100644
> --- a/source/encoder/slicetype.cpp
> +++ b/source/encoder/slicetype.cpp
> @@ -2014,7 +2014,7 @@ void Lookahead::slicetypeAnalyse(Lowres **frames,
> bool bKeyframe)
> bool isScenecut = false;
>
> /* Temporal computations for scenecut detection */
> - if (m_param->bHistBasedSceneCut)
> + if (m_param->bHistBasedSceneCut && !m_param->bDisableTradScdInHscd)
> {
> for (int i = numFrames - 1; i > 0; i--)
> {
> @@ -2047,8 +2047,10 @@ void Lookahead::slicetypeAnalyse(Lowres **frames,
> bool bKeyframe)
> }
>
> /* When scenecut threshold is set, use scenecut detection for I frame
> placements */
> - if (!m_param->bHistBasedSceneCut || (m_param->bHistBasedSceneCut &&
> frames[1]->bScenecut))
> + if (!m_param->bHistBasedSceneCut || (m_param->bHistBasedSceneCut &&
> !m_param->bDisableTradScdInHscd && frames[1]->bScenecut))
> isScenecut = scenecut(frames, 0, 1, true, origNumFrames);
> + else if (m_param->bHistBasedSceneCut && frames[1]->bScenecut)
> + isScenecut = true;
>
> if (isScenecut && (m_param->bHistBasedSceneCut ||
> m_param->scenecutThreshold))
> {
> @@ -2061,14 +2063,17 @@ void Lookahead::slicetypeAnalyse(Lowres **frames,
> bool bKeyframe)
> m_extendGopBoundary = false;
> for (int i = m_param->bframes + 1; i < origNumFrames; i +=
> m_param->bframes + 1)
> {
> - if (!m_param->bHistBasedSceneCut ||
> (m_param->bHistBasedSceneCut && frames[i + 1]->bScenecut))
> + if (!m_param->bHistBasedSceneCut ||
> (m_param->bHistBasedSceneCut && !m_param->bDisableTradScdInHscd && frames[i
> + 1]->bScenecut))
> scenecut(frames, i, i + 1, true, origNumFrames);
>
> for (int j = i + 1; j <= X265_MIN(i + m_param->bframes + 1,
> origNumFrames); j++)
> {
> - if (frames[j]->bScenecut && scenecutInternal(frames, j -
> 1, j, true))
> + if (frames[j]->bScenecut)
> {
> - m_extendGopBoundary = true;
> + if (!m_param->bDisableTradScdInHscd)
> + m_extendGopBoundary = scenecutInternal(frames, j
> - 1, j, true);
> + else
> + m_extendGopBoundary = true;
> break;
> }
> }
> diff --git a/source/test/regression-tests.txt
> b/source/test/regression-tests.txt
> index 971c854df..828157cab 100644
> --- a/source/test/regression-tests.txt
> +++ b/source/test/regression-tests.txt
> @@ -160,6 +160,7 @@ Traffic_4096x2048_30p.y4m, --preset medium --frame-dup
> --dup-threshold 60 --hrd
> Kimono1_1920x1080_24_400.yuv,--preset superfast --qp 28 --zones 0,139,q=32
> sintel_trailer_2k_1920x1080_24.yuv, --preset medium --hist-scenecut
> --hist-threshold 0.02 --frame-dup --dup-threshold 60 --hrd --bitrate 10000
> --vbv-bufsize 15000 --vbv-maxrate 12000
> sintel_trailer_2k_1920x1080_24.yuv, --preset medium --hist-scenecut
> --hist-threshold 0.02
> +sintel_trailer_2k_1920x1080_24.yuv, --preset medium --hist-scenecut
> --hist-threshold 0.02 --disable-traditional-scenecut
> sintel_trailer_2k_1920x1080_24.yuv, --preset ultrafast --hist-scenecut
> --hist-threshold 0.02
> crowd_run_1920x1080_50.yuv, --preset faster --ctu 32 --rskip 2
> --rskip-edge-threshold 5
> crowd_run_1920x1080_50.yuv, --preset fast --ctu 64 --rskip 2
> --rskip-edge-threshold 5 --aq-mode 4
> diff --git a/source/x265.h b/source/x265.h
> index 324f3163f..3a65fdda6 100644
> --- a/source/x265.h
> +++ b/source/x265.h
> @@ -1963,6 +1963,10 @@ typedef struct x265_param
> /* Flag indicating whether the encoder should emit an End of Sequence
> * NAL at the end of every Coded Video Sequence. Default false */
> int bEnableEndOfSequence;
> +
> + /* Flag to turn off traditional scenecut detection in histogram based
> scenecut detection so that
> + * only spatial properties are used for scenecut detection. Default
> false */
> + int bDisableTradScdInHscd;
> } x265_param;
>
> /* x265_param_alloc:
> diff --git a/source/x265cli.h b/source/x265cli.h
> index 46a2b68ae..86136fbfb 100644
> --- a/source/x265cli.h
> +++ b/source/x265cli.h
> @@ -144,6 +144,7 @@ static const struct option long_options[] =
> { "hist-scenecut", no_argument, NULL, 0},
> { "no-hist-scenecut", no_argument, NULL, 0},
> { "hist-threshold", required_argument, NULL, 0},
> + { "disable-traditional-scenecut", no_argument, NULL, 0},
> { "fades", no_argument, NULL, 0 },
> { "no-fades", no_argument, NULL, 0 },
> { "scenecut-aware-qp", required_argument, NULL, 0 },
> --
> 2.24.0.windows.2
>
> Regards,
> *Pooja Venkatesan*,
> Video Codec Engineer,
> Media & AI analytics BU
>
> _______________________________________________
> x265-devel mailing list
> x265-devel at videolan.org
> https://mailman.videolan.org/listinfo/x265-devel
>
--
Regards,
*Aruna Matheswaran,*
Video Codec Engineer,
Media & AI analytics BU,
-------------- next part --------------
An HTML attachment was scrubbed...
URL: <http://mailman.videolan.org/pipermail/x265-devel/attachments/20210730/8bcd4778/attachment-0001.html>
More information about the x265-devel
mailing list