2022-05-01 00:33:22 -05:00

287 lines
9.4 KiB
C#

using System;
using System.Collections.Generic;
using System.Threading;
using System.Threading.Tasks;
using MediaBrowser.Model.Tasks;
using Microsoft.Extensions.Logging;
namespace ConfusedPolarBear.Plugin.IntroSkipper;
/// <summary>
/// Scheduled task that fingerprints the audio of every queued episode and compares episodes
/// pairwise (within a season) to locate the introduction sequence they share.
/// </summary>
public class FingerprinterTask : IScheduledTask
{
    /// <summary>
    /// Minimum time (in seconds) for a contiguous time range to be considered an introduction.
    /// </summary>
    private const int MINIMUM_INTRO_DURATION = 18;

    /// <summary>
    /// Maximum number of bits (out of 32 total) that can be different between segments before they are considered dissimilar.
    /// </summary>
    private const double MAXIMUM_DIFFERENCES = 5;

    /// <summary>
    /// Maximum time permitted between timestamps before they are considered non-contiguous.
    /// </summary>
    private const double MAXIMUM_DISTANCE = 3.25;

    /// <summary>
    /// Seconds of audio in one number from the fingerprint. Defined by Chromaprint.
    /// </summary>
    private const double SAMPLES_TO_SECONDS = 0.128;

    private readonly ILogger<FingerprinterTask> _logger;

    /// <summary>
    /// Initializes a new instance of the <see cref="FingerprinterTask"/> class.
    /// </summary>
    /// <param name="logger">Logger used for all diagnostics emitted by this task.</param>
    public FingerprinterTask(ILogger<FingerprinterTask> logger)
    {
        _logger = logger;
        _logger.LogInformation("Fingerprinting Task Scheduled!");
    }

    /// <summary>
    /// Gets the task name.
    /// </summary>
    public string Name => "Analyze episodes";

    /// <summary>
    /// Gets the task category.
    /// </summary>
    public string Category => "Intro Skipper";

    /// <summary>
    /// Gets the task description.
    /// </summary>
    public string Description => "Analyzes the audio of all television episodes to find introduction sequences.";

    /// <summary>
    /// Gets the unique task key.
    /// </summary>
    public string Key => "CPBIntroSkipperRunFingerprinter";

    /// <summary>
    /// Analyze all episodes in the queue, two at a time, season by season.
    /// </summary>
    /// <param name="progress">Receives the completion percentage (0-100).</param>
    /// <param name="cancellationToken">Cancellation token, checked before each pair of episodes is analyzed.</param>
    /// <returns>A completed task; all work is performed synchronously.</returns>
    /// <exception cref="OperationCanceledException">Cancellation was requested.</exception>
    public Task ExecuteAsync(IProgress<double> progress, CancellationToken cancellationToken)
    {
        var queue = Plugin.Instance!.AnalysisQueue;
        var totalProcessed = 0;

        foreach (var season in queue)
        {
            // Work on a copy: padding the list below must not leave a duplicate in the shared queue.
            var episodes = new List<QueuedEpisode>(season.Value);
            if (episodes.Count == 0)
            {
                continue;
            }

            var first = episodes[0];
            var uniqueCount = episodes.Count;

            _logger.LogDebug(
                "Fingerprinting {Count} episodes from {Name} season {Season}",
                uniqueCount,
                first.SeriesName,
                first.SeasonNumber);

            // An introduction is found by comparing two episodes, so a lone episode can't be analyzed.
            if (uniqueCount == 1)
            {
                _logger.LogDebug(
                    "Skipping {Name} season {Season}: at least two episodes are required",
                    first.SeriesName,
                    first.SeasonNumber);

                totalProcessed += 1;
                ReportProgress(progress, totalProcessed);
                continue;
            }

            // Ensure there are an even number of episodes by pairing the last one with its predecessor.
            if (episodes.Count % 2 != 0)
            {
                episodes.Add(episodes[episodes.Count - 2]);
            }

            var processedBeforeSeason = totalProcessed;

            for (var i = 0; i < episodes.Count; i += 2)
            {
                cancellationToken.ThrowIfCancellationRequested();

                var lhs = episodes[i];
                var rhs = episodes[i + 1];

                try
                {
                    // FIXME: add retry logic
                    var alreadyDone = Plugin.Instance!.Intros;
                    if (alreadyDone.ContainsKey(lhs.EpisodeId) && alreadyDone.ContainsKey(rhs.EpisodeId))
                    {
                        _logger.LogDebug(
                            "Episodes {LHS} and {RHS} have both already been fingerprinted",
                            lhs.EpisodeId,
                            rhs.EpisodeId);

                        continue;
                    }

                    FingerprintEpisodes(lhs, rhs);
                }
                catch (FingerprintException ex)
                {
                    _logger.LogError("Caught fingerprint error: {Ex}", ex);
                }
                finally
                {
                    // Count only real episodes: the padded duplicate must not push progress past the total.
                    totalProcessed = processedBeforeSeason + Math.Min(i + 2, uniqueCount);
                    ReportProgress(progress, totalProcessed);
                }
            }

            // TODO: after every season completes, serialize fingerprints to disk somewhere
        }

        return Task.CompletedTask;
    }

    /// <summary>
    /// Get the default task triggers: once per day.
    /// </summary>
    /// <returns>The default triggers for this task.</returns>
    public IEnumerable<TaskTriggerInfo> GetDefaultTriggers()
    {
        return new[]
        {
            new TaskTriggerInfo
            {
                Type = TaskTriggerInfo.TriggerDaily,

                // Midnight. The previous value, TimeSpan.FromDays(24), was 24 *days* worth of ticks,
                // which is not a time of day. NOTE(review): assumes TimeOfDayTicks is an offset from midnight.
                TimeOfDayTicks = TimeSpan.Zero.Ticks
            }
        };
    }

    /// <summary>
    /// Report the overall completion percentage, clamped to 100 and guarded against an empty total.
    /// </summary>
    /// <param name="progress">Progress sink.</param>
    /// <param name="totalProcessed">Number of episodes handled so far.</param>
    private static void ReportProgress(IProgress<double> progress, int totalProcessed)
    {
        var totalQueued = Plugin.Instance!.TotalQueued;
        if (totalQueued <= 0)
        {
            return;
        }

        progress.Report(Math.Min(100.0, (totalProcessed * 100.0) / totalQueued));
    }

    /// <summary>
    /// Store the detected introduction for an episode.
    /// </summary>
    /// <param name="episode">Episode id.</param>
    /// <param name="introStart">Introduction start, in seconds.</param>
    /// <param name="introEnd">Introduction end, in seconds. Zero indicates that no introduction was found.</param>
    private static void StoreIntro(Guid episode, double introStart, double introEnd)
    {
        // Recommend that the skip button appears 5 seconds ahead of the intro
        // and that it disappears 10 seconds after the intro begins.
        Plugin.Instance!.Intros[episode] = new Intro()
        {
            // Starts within the first 5 seconds are snapped to exactly 0 by the caller, so only the
            // end timestamp can distinguish a real introduction from the (0, 0) "not found" marker.
            Valid = introEnd > 0,
            IntroStart = introStart,
            IntroEnd = introEnd,

            // Clamp at zero so the prompt is never scheduled before the episode begins.
            ShowSkipPromptAt = Math.Max(0, introStart - 5),
            HideSkipPromptAt = introStart + 10
        };
    }

    /// <summary>
    /// Count the number of bits that are set in a 32 bit value.
    /// </summary>
    /// <param name="number">Value to inspect.</param>
    /// <returns>Number of set bits (0-32).</returns>
    private static int CountBits(uint number)
    {
        return System.Numerics.BitOperations.PopCount(number);
    }

    /// <summary>
    /// Fingerprint two episodes, compare the fingerprints at every possible shift and store the
    /// longest shared range as the introduction of both episodes.
    /// </summary>
    /// <param name="lhsEpisode">First episode.</param>
    /// <param name="rhsEpisode">Second episode.</param>
    private void FingerprintEpisodes(QueuedEpisode lhsEpisode, QueuedEpisode rhsEpisode)
    {
        var lhs = FPCalc.Fingerprint(lhsEpisode);
        var rhs = FPCalc.Fingerprint(rhsEpisode);

        var lhsRanges = new List<TimeRange>();
        var rhsRanges = new List<TimeRange>();

        // Compare all elements of the shortest fingerprint to the other fingerprint.
        var high = Math.Min(lhs.Count, rhs.Count);

        // TODO: see if bailing out early results in false positives.
        for (var amount = -1 * high; amount < high; amount++)
        {
            var leftOffset = 0;
            var rightOffset = 0;

            // Calculate the offsets for the left and right hand sides.
            if (amount < 0)
            {
                leftOffset -= amount;
            }
            else
            {
                rightOffset += amount;
            }

            // Store similar times for both LHS and RHS.
            var lhsTimes = new List<double>();
            var rhsTimes = new List<double>();

            // XOR all elements in LHS and RHS, using the shift amount from above.
            for (var i = 0; i < high - Math.Abs(amount); i++)
            {
                // XOR both samples at the current position.
                var lhsPosition = i + leftOffset;
                var rhsPosition = i + rightOffset;
                var diff = lhs[lhsPosition] ^ rhs[rhsPosition];

                // Only samples that differ in at most MAXIMUM_DIFFERENCES of their 32 bits are similar.
                if (CountBits(diff) > MAXIMUM_DIFFERENCES)
                {
                    continue;
                }

                lhsTimes.Add(lhsPosition * SAMPLES_TO_SECONDS);
                rhsTimes.Add(rhsPosition * SAMPLES_TO_SECONDS);
            }

            // Ensure the last timestamp is checked
            lhsTimes.Add(double.MaxValue);
            rhsTimes.Add(double.MaxValue);

            // Now that both fingerprints have been compared at this shift, see if there's a contiguous time range.
            var lContiguous = TimeRangeHelpers.FindContiguous(lhsTimes.ToArray(), MAXIMUM_DISTANCE);
            if (lContiguous is null || lContiguous.Duration < MINIMUM_INTRO_DURATION)
            {
                continue;
            }

            // Since LHS had a contiguous time range, RHS must have one also
            // (both time lists were filled in lockstep and differ only by the shift).
            var rContiguous = TimeRangeHelpers.FindContiguous(rhsTimes.ToArray(), MAXIMUM_DISTANCE)!;

            // Tweak the end timestamps just a bit to ensure as little content as possible is skipped over.
            if (lContiguous.Duration >= 90)
            {
                lContiguous.End -= 6;
                rContiguous.End -= 6;
            }
            else if (lContiguous.Duration >= 35)
            {
                lContiguous.End -= 3;
                rContiguous.End -= 3;
            }

            // Store the ranges for later.
            lhsRanges.Add(lContiguous);
            rhsRanges.Add(rContiguous);
        }

        if (lhsRanges.Count == 0)
        {
            _logger.LogDebug(
                "Unable to find a shared introduction sequence between {LHS} and {RHS}",
                lhsEpisode.Path,
                rhsEpisode.Path);

            // TODO: if an episode fails but others in the season succeed, reanalyze it against two that succeeded.

            // TODO: is this the optimal way to indicate that an intro couldn't be found?
            // the goal here is to not waste time every task run reprocessing episodes that we know will fail.
            StoreIntro(lhsEpisode.EpisodeId, 0, 0);
            StoreIntro(rhsEpisode.EpisodeId, 0, 0);

            return;
        }

        // After comparing both episodes at all possible shift positions, store the longest time range as the intro.
        // NOTE(review): relies on TimeRange's comparison ordering the longest range first - confirm.
        lhsRanges.Sort();
        rhsRanges.Sort();

        var lhsIntro = lhsRanges[0];
        var rhsIntro = rhsRanges[0];

        // Do a tiny bit of post processing and store the results:
        // an intro that starts within the first 5 seconds is treated as starting at the very beginning.
        if (lhsIntro.Start <= 5)
        {
            lhsIntro.Start = 0;
        }

        if (rhsIntro.Start <= 5)
        {
            rhsIntro.Start = 0;
        }

        StoreIntro(lhsEpisode.EpisodeId, lhsIntro.Start, lhsIntro.End);
        StoreIntro(rhsEpisode.EpisodeId, rhsIntro.Start, rhsIntro.End);
    }
}