1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
use std::sync::Arc;

use crate::{
  api::lookahead::{
    estimate_importance_block_difference, estimate_inter_costs,
    estimate_intra_costs,
  },
  frame::Frame,
  me::FrameMEStats,
};
use v_frame::{math::Fixed, pixel::Pixel};

use super::{SceneChangeDetector, ScenecutResult};

impl<T: Pixel> SceneChangeDetector<T> {
  /// Run a comparison between two frames to determine if they qualify for a scenecut.
  ///
  /// We gather both intra and inter costs for the frames,
  /// as well as an importance-block-based difference,
  /// and use all three metrics.
  pub(super) fn cost_scenecut(
    &mut self, frame1: Arc<Frame<T>>, frame2: Arc<Frame<T>>,
    input_frameno: u64,
  ) -> ScenecutResult {
    let frame2_inter_ref = Arc::clone(&frame2);
    let frame1_imp_ref = Arc::clone(&frame1);
    let frame2_imp_ref = Arc::clone(&frame2);

    let mut intra_cost = 0.0;
    let mut mv_inter_cost = 0.0;
    let mut imp_block_cost = 0.0;

    let cols = 2 * self.encoder_config.width.align_power_of_two_and_shift(3);
    let rows = 2 * self.encoder_config.height.align_power_of_two_and_shift(3);

    let buffer = if let Some(buffer) = &self.frame_me_stats_buffer {
      Arc::clone(buffer)
    } else {
      let frame_me_stats = FrameMEStats::new_arc_array(cols, rows);
      let clone = Arc::clone(&frame_me_stats);
      self.frame_me_stats_buffer = Some(frame_me_stats);
      clone
    };

    rayon::scope(|s| {
      s.spawn(|_| {
        let temp_plane =
          self.temp_plane.get_or_insert_with(|| frame2.planes[0].clone());

        let intra_costs =
          self.intra_costs.entry(input_frameno).or_insert_with(|| {
            estimate_intra_costs(
              temp_plane,
              &*frame2,
              self.bit_depth,
              self.cpu_feature_level,
            )
          });

        intra_cost = intra_costs.iter().map(|&cost| cost as u64).sum::<u64>()
          as f64
          / intra_costs.len() as f64;
        // If we're not using temporal RDO, we won't need these costs later,
        // so remove them from the cache to avoid a memory leak
        if !self.encoder_config.temporal_rdo() {
          self.intra_costs.remove(&input_frameno);
        };
      });
      s.spawn(|_| {
        mv_inter_cost = estimate_inter_costs(
          frame2_inter_ref,
          frame1,
          self.bit_depth,
          self.encoder_config.clone(),
          self.sequence.clone(),
          buffer,
        );
      });
      s.spawn(|_| {
        imp_block_cost =
          estimate_importance_block_difference(frame2_imp_ref, frame1_imp_ref);
      });
    });

    // `BIAS` determines how likely we are
    // to choose a keyframe, between 0.0-1.0.
    // Higher values mean we are more likely to choose a keyframe.
    // This value was chosen based on trials using the new
    // adaptive scenecut code.
    const BIAS: f64 = 0.7;
    let threshold = intra_cost * (1.0 - BIAS);

    ScenecutResult {
      inter_cost: mv_inter_cost,
      imp_block_cost,
      threshold,
      backward_adjusted_cost: 0.0,
      forward_adjusted_cost: 0.0,
    }
  }
}