Implement inverted indexes
This commit is contained in:
parent
3a4e688376
commit
749ca9dcda
@ -2,6 +2,8 @@
|
|||||||
* which supports both chromaprint and the "-fp_format raw" flag.
|
* which supports both chromaprint and the "-fp_format raw" flag.
|
||||||
*/
|
*/
|
||||||
|
|
||||||
|
using System.Collections.Generic;
|
||||||
|
using System.Collections.ObjectModel;
|
||||||
using Xunit;
|
using Xunit;
|
||||||
using Microsoft.Extensions.Logging;
|
using Microsoft.Extensions.Logging;
|
||||||
|
|
||||||
@ -61,6 +63,26 @@ public class TestAudioFingerprinting
|
|||||||
Assert.Equal(expected, actual);
|
Assert.Equal(expected, actual);
|
||||||
}
|
}
|
||||||
|
|
||||||
|
[Fact]
|
||||||
|
public void TestIndexGeneration()
|
||||||
|
{
|
||||||
|
// 0 1 2 3 4 5 6 7
|
||||||
|
var fpr = new List<uint>(new uint[] { 1, 2, 3, 1, 5, 77, 42, 2 }).AsReadOnly();
|
||||||
|
var expected = new Dictionary<uint, Collection<uint>>()
|
||||||
|
{
|
||||||
|
{1, new Collection<uint>{ 0, 3 } },
|
||||||
|
{2, new Collection<uint>{ 1, 7 } },
|
||||||
|
{3, new Collection<uint>{ 2 } },
|
||||||
|
{5, new Collection<uint>{ 4 } },
|
||||||
|
{42, new Collection<uint>{ 6 } },
|
||||||
|
{77, new Collection<uint>{ 5 } },
|
||||||
|
};
|
||||||
|
|
||||||
|
var actual = Chromaprint.CreateInvertedIndex(fpr);
|
||||||
|
|
||||||
|
Assert.Equal(expected, actual);
|
||||||
|
}
|
||||||
|
|
||||||
[Fact]
|
[Fact]
|
||||||
public void TestIntroDetection()
|
public void TestIntroDetection()
|
||||||
{
|
{
|
||||||
@ -76,8 +98,8 @@ public class TestAudioFingerprinting
|
|||||||
Assert.Equal(17.792, lhs.IntroEnd);
|
Assert.Equal(17.792, lhs.IntroEnd);
|
||||||
|
|
||||||
Assert.True(rhs.Valid);
|
Assert.True(rhs.Valid);
|
||||||
Assert.Equal(0, rhs.IntroStart);
|
Assert.Equal(5.12, rhs.IntroStart);
|
||||||
Assert.Equal(22.656, rhs.IntroEnd);
|
Assert.Equal(22.912, rhs.IntroEnd);
|
||||||
}
|
}
|
||||||
|
|
||||||
private QueuedEpisode queueEpisode(string path)
|
private QueuedEpisode queueEpisode(string path)
|
||||||
|
@ -109,6 +109,30 @@ public static class Chromaprint
|
|||||||
return results.AsReadOnly();
|
return results.AsReadOnly();
|
||||||
}
|
}
|
||||||
|
|
||||||
|
/// <summary>
|
||||||
|
/// Transforms a Chromaprint into an inverted index of fingerprint points to the indexes they appeared at.
|
||||||
|
/// </summary>
|
||||||
|
/// <param name="fingerprint">Chromaprint fingerprint.</param>
|
||||||
|
/// <returns>Inverted index.</returns>
|
||||||
|
public static Dictionary<uint, Collection<uint>> CreateInvertedIndex(ReadOnlyCollection<uint> fingerprint)
|
||||||
|
{
|
||||||
|
var invIndex = new Dictionary<uint, Collection<uint>>();
|
||||||
|
|
||||||
|
for (int i = 0; i < fingerprint.Count; i++)
|
||||||
|
{
|
||||||
|
// Get the current point.
|
||||||
|
var point = fingerprint[i];
|
||||||
|
|
||||||
|
// Create a new collection for points of this value if it doesn't exist already.
|
||||||
|
invIndex.TryAdd(point, new Collection<uint>());
|
||||||
|
|
||||||
|
// Append the current sample's timecode to the collection for this point.
|
||||||
|
invIndex[point].Add((uint)i);
|
||||||
|
}
|
||||||
|
|
||||||
|
return invIndex;
|
||||||
|
}
|
||||||
|
|
||||||
/// <summary>
|
/// <summary>
|
||||||
/// Runs ffmpeg and returns standard output.
|
/// Runs ffmpeg and returns standard output.
|
||||||
/// </summary>
|
/// </summary>
|
||||||
|
@ -106,7 +106,7 @@
|
|||||||
</div>
|
</div>
|
||||||
|
|
||||||
<details id="statistics">
|
<details id="statistics">
|
||||||
<summary>Analysis Statistics</summary>
|
<summary>Analysis Statistics (experimental)</summary>
|
||||||
|
|
||||||
<pre id="statisticsText" style="font-size: larger"></p>
|
<pre id="statisticsText" style="font-size: larger"></p>
|
||||||
</details>
|
</details>
|
||||||
@ -239,7 +239,7 @@
|
|||||||
|
|
||||||
// Blank any old statistics
|
// Blank any old statistics
|
||||||
const text = document.querySelector("pre#statisticsText");
|
const text = document.querySelector("pre#statisticsText");
|
||||||
text.textContent = "";
|
text.textContent = "All CPU times are displayed as seconds.\n\n";
|
||||||
|
|
||||||
Dashboard.showLoadingMsg();
|
Dashboard.showLoadingMsg();
|
||||||
|
|
||||||
@ -247,14 +247,15 @@
|
|||||||
let stats = await getJson("Intros/Statistics");
|
let stats = await getJson("Intros/Statistics");
|
||||||
|
|
||||||
// Select which fields to print and label them with more friendly descriptions
|
// Select which fields to print and label them with more friendly descriptions
|
||||||
let fields = "TotalCPUTime,FingerprintCPUTime,FirstPassCPUTime,SecondPassCPUTime,QuickScans,FullScans," +
|
let fields = "TotalCPUTime,FingerprintCPUTime,FirstPassCPUTime,SecondPassCPUTime,IndexSearches," +
|
||||||
"TotalQueuedEpisodes";
|
"QuickScans,FullScans,TotalQueuedEpisodes";
|
||||||
|
|
||||||
let friendlyNames = {
|
let friendlyNames = {
|
||||||
TotalCPUTime: "Total CPU time (ms)",
|
TotalCPUTime: "Total CPU time",
|
||||||
FingerprintCPUTime: "Fingerprint time (ms)",
|
FingerprintCPUTime: "Fingerprint CPU time",
|
||||||
FirstPassCPUTime: "First pass (ms)",
|
FirstPassCPUTime: "First pass CPU time",
|
||||||
SecondPassCPUTime: "Second pass (ms)",
|
SecondPassCPUTime: "Second pass CPU time",
|
||||||
|
IndexSearches: "Index searches",
|
||||||
QuickScans: "Quick scans",
|
QuickScans: "Quick scans",
|
||||||
FullScans: "Full scans",
|
FullScans: "Full scans",
|
||||||
TotalQueuedEpisodes: "Episodes queued",
|
TotalQueuedEpisodes: "Episodes queued",
|
||||||
@ -262,9 +263,25 @@
|
|||||||
|
|
||||||
// Print all friendly names and data points
|
// Print all friendly names and data points
|
||||||
for (var f of fields.split(",")) {
|
for (var f of fields.split(",")) {
|
||||||
text.textContent += friendlyNames[f].padEnd(25) + stats[f] + "\n";
|
let name = friendlyNames[f].padEnd(25);
|
||||||
|
let value = stats[f];
|
||||||
|
|
||||||
|
// If this statistic is a measure of CPU time, divide by 1,000 to turn milliseconds into seconds.
|
||||||
|
if (name.includes("time"))
|
||||||
|
{
|
||||||
|
value = Math.round(value / 1000);
|
||||||
}
|
}
|
||||||
|
|
||||||
|
text.textContent += name + value + "\n";
|
||||||
|
}
|
||||||
|
|
||||||
|
// Calculate the percentage of time (to two decimal places) spent waiting for fingerprints
|
||||||
|
const percentWait = Math.round((stats.FingerprintCPUTime * 10_000) / stats.TotalCPUTime) / 100;
|
||||||
|
|
||||||
|
// Breakdown CPU time by analysis component
|
||||||
|
text.textContent += "\nCPU time breakdown:\n";
|
||||||
|
text.textContent += "Fingerprint generation " + percentWait + "%\n";
|
||||||
|
|
||||||
Dashboard.hideLoadingMsg();
|
Dashboard.hideLoadingMsg();
|
||||||
}
|
}
|
||||||
|
|
||||||
|
@ -20,6 +20,11 @@ public class AnalysisStatistics
|
|||||||
/// </summary>
|
/// </summary>
|
||||||
public int TotalQueuedEpisodes { get; set; }
|
public int TotalQueuedEpisodes { get; set; }
|
||||||
|
|
||||||
|
/// <summary>
|
||||||
|
/// Gets the number of times an index search successfully located a pair of introductions.
|
||||||
|
/// </summary>
|
||||||
|
public ThreadSafeInteger IndexSearches { get; } = new ThreadSafeInteger();
|
||||||
|
|
||||||
/// <summary>
|
/// <summary>
|
||||||
/// Gets the number of times a quick scan successfully located a pair of introductions.
|
/// Gets the number of times a quick scan successfully located a pair of introductions.
|
||||||
/// </summary>
|
/// </summary>
|
||||||
@ -89,6 +94,11 @@ public class ThreadSafeInteger
|
|||||||
/// <param name="start">Start time.</param>
|
/// <param name="start">Start time.</param>
|
||||||
public void AddDuration(DateTime start)
|
public void AddDuration(DateTime start)
|
||||||
{
|
{
|
||||||
|
if (start == DateTime.MinValue)
|
||||||
|
{
|
||||||
|
return;
|
||||||
|
}
|
||||||
|
|
||||||
var elapsed = DateTime.Now.Subtract(start);
|
var elapsed = DateTime.Now.Subtract(start);
|
||||||
Add((int)elapsed.TotalMilliseconds);
|
Add((int)elapsed.TotalMilliseconds);
|
||||||
}
|
}
|
||||||
|
@ -392,7 +392,8 @@ public class FingerprinterTask : IScheduledTask
|
|||||||
lhsEpisode.EpisodeId,
|
lhsEpisode.EpisodeId,
|
||||||
lhsFingerprint,
|
lhsFingerprint,
|
||||||
rhsEpisode.EpisodeId,
|
rhsEpisode.EpisodeId,
|
||||||
rhsFingerprint);
|
rhsFingerprint,
|
||||||
|
true);
|
||||||
}
|
}
|
||||||
|
|
||||||
/// <summary>
|
/// <summary>
|
||||||
@ -402,53 +403,86 @@ public class FingerprinterTask : IScheduledTask
|
|||||||
/// <param name="lhsPoints">First episode fingerprint points.</param>
|
/// <param name="lhsPoints">First episode fingerprint points.</param>
|
||||||
/// <param name="rhsId">Second episode id.</param>
|
/// <param name="rhsId">Second episode id.</param>
|
||||||
/// <param name="rhsPoints">Second episode fingerprint points.</param>
|
/// <param name="rhsPoints">Second episode fingerprint points.</param>
|
||||||
|
/// <param name="isFirstPass">If this was called as part of the first analysis pass, add the elapsed time to the statistics.</param>
|
||||||
/// <returns>Intros for the first and second episodes.</returns>
|
/// <returns>Intros for the first and second episodes.</returns>
|
||||||
public (Intro Lhs, Intro Rhs) FingerprintEpisodes(
|
public (Intro Lhs, Intro Rhs) FingerprintEpisodes(
|
||||||
Guid lhsId,
|
Guid lhsId,
|
||||||
ReadOnlyCollection<uint> lhsPoints,
|
ReadOnlyCollection<uint> lhsPoints,
|
||||||
Guid rhsId,
|
Guid rhsId,
|
||||||
ReadOnlyCollection<uint> rhsPoints)
|
ReadOnlyCollection<uint> rhsPoints,
|
||||||
|
bool isFirstPass)
|
||||||
{
|
{
|
||||||
var start = DateTime.Now;
|
// If this isn't running as part of the first analysis pass, don't count this CPU time as first pass time.
|
||||||
var lhsRanges = new List<TimeRange>();
|
var start = isFirstPass ? DateTime.Now : DateTime.MinValue;
|
||||||
var rhsRanges = new List<TimeRange>();
|
|
||||||
|
|
||||||
// Compare all elements of the shortest fingerprint to the other fingerprint.
|
// ===== Method 1: Inverted indexes =====
|
||||||
var limit = Math.Min(lhsPoints.Count, rhsPoints.Count);
|
// Creates an inverted fingerprint point index for both episodes.
|
||||||
|
// For every point which is a 100% match, search for an introduction at that point.
|
||||||
|
var (lhsRanges, rhsRanges) = SearchInvertedIndex(lhsPoints, rhsPoints);
|
||||||
|
|
||||||
// First, test if an intro can be found within the first 5 seconds of the episodes (±5/0.128 = ±40 samples).
|
if (lhsRanges.Count > 0)
|
||||||
var (lhsContiguous, rhsContiguous) = ShiftEpisodes(lhsPoints, rhsPoints, -40, 40);
|
|
||||||
lhsRanges.AddRange(lhsContiguous);
|
|
||||||
rhsRanges.AddRange(rhsContiguous);
|
|
||||||
|
|
||||||
// If no valid ranges were found, re-analyze the episodes considering all possible shifts.
|
|
||||||
if (lhsRanges.Count == 0)
|
|
||||||
{
|
{
|
||||||
_logger.LogTrace("quick scan unsuccessful, falling back to full scan (±{Limit})", limit);
|
_logger.LogTrace("Index search successful");
|
||||||
analysisStatistics.FullScans.Increment();
|
analysisStatistics.IndexSearches.Increment();
|
||||||
|
analysisStatistics.FirstPassCPUTime.AddDuration(start);
|
||||||
|
|
||||||
(lhsContiguous, rhsContiguous) = ShiftEpisodes(lhsPoints, rhsPoints, -1 * limit, limit);
|
return GetLongestTimeRange(lhsId, lhsRanges, rhsId, rhsRanges);
|
||||||
lhsRanges.AddRange(lhsContiguous);
|
|
||||||
rhsRanges.AddRange(rhsContiguous);
|
|
||||||
}
|
}
|
||||||
else
|
|
||||||
|
// ===== Method 2: Quick scan =====
|
||||||
|
// Tests if an intro can be found within the first 5 seconds of the episodes. ±5/0.128 = ±40 samples.
|
||||||
|
(lhsRanges, rhsRanges) = ShiftEpisodes(lhsPoints, rhsPoints, -40, 40);
|
||||||
|
|
||||||
|
if (lhsRanges.Count > 0)
|
||||||
{
|
{
|
||||||
_logger.LogTrace("quick scan successful");
|
_logger.LogTrace("Quick scan successful");
|
||||||
analysisStatistics.QuickScans.Increment();
|
analysisStatistics.QuickScans.Increment();
|
||||||
|
analysisStatistics.FirstPassCPUTime.AddDuration(start);
|
||||||
|
|
||||||
|
return GetLongestTimeRange(lhsId, lhsRanges, rhsId, rhsRanges);
|
||||||
}
|
}
|
||||||
|
|
||||||
if (lhsRanges.Count == 0)
|
// ===== Method 3: Full scan =====
|
||||||
|
// Compares all elements of the shortest fingerprint to the other fingerprint.
|
||||||
|
var limit = Math.Min(lhsPoints.Count, rhsPoints.Count);
|
||||||
|
(lhsRanges, rhsRanges) = ShiftEpisodes(lhsPoints, rhsPoints, -1 * limit, limit);
|
||||||
|
|
||||||
|
if (lhsRanges.Count > 0)
|
||||||
{
|
{
|
||||||
|
_logger.LogTrace("Full scan successful");
|
||||||
|
analysisStatistics.FullScans.Increment();
|
||||||
|
analysisStatistics.FirstPassCPUTime.AddDuration(start);
|
||||||
|
|
||||||
|
return GetLongestTimeRange(lhsId, lhsRanges, rhsId, rhsRanges);
|
||||||
|
}
|
||||||
|
|
||||||
|
// No method was able to find an introduction, return nothing.
|
||||||
|
|
||||||
_logger.LogTrace(
|
_logger.LogTrace(
|
||||||
"Unable to find a shared introduction sequence between {LHS} and {RHS}",
|
"Unable to find a shared introduction sequence between {LHS} and {RHS}",
|
||||||
lhsId,
|
lhsId,
|
||||||
rhsId);
|
rhsId);
|
||||||
|
|
||||||
analysisStatistics.FirstPassCPUTime.AddDuration(start);
|
analysisStatistics.FirstPassCPUTime.AddDuration(start);
|
||||||
|
|
||||||
return (new Intro(lhsId), new Intro(rhsId));
|
return (new Intro(lhsId), new Intro(rhsId));
|
||||||
}
|
}
|
||||||
|
|
||||||
// After comparing both episodes at all possible shift positions, store the longest time range as the intro.
|
/// <summary>
|
||||||
|
/// Locates the longest range of similar audio and returns an Intro class for each range.
|
||||||
|
/// </summary>
|
||||||
|
/// <param name="lhsId">First episode id.</param>
|
||||||
|
/// <param name="lhsRanges">First episode shared timecodes.</param>
|
||||||
|
/// <param name="rhsId">Second episode id.</param>
|
||||||
|
/// <param name="rhsRanges">Second episode shared timecodes.</param>
|
||||||
|
/// <returns>Intros for the first and second episodes.</returns>
|
||||||
|
private (Intro Lhs, Intro Rhs) GetLongestTimeRange(
|
||||||
|
Guid lhsId,
|
||||||
|
List<TimeRange> lhsRanges,
|
||||||
|
Guid rhsId,
|
||||||
|
List<TimeRange> rhsRanges)
|
||||||
|
{
|
||||||
|
// Store the longest time range as the introduction.
|
||||||
lhsRanges.Sort();
|
lhsRanges.Sort();
|
||||||
rhsRanges.Sort();
|
rhsRanges.Sort();
|
||||||
|
|
||||||
@ -466,10 +500,54 @@ public class FingerprinterTask : IScheduledTask
|
|||||||
rhsIntro.Start = 0;
|
rhsIntro.Start = 0;
|
||||||
}
|
}
|
||||||
|
|
||||||
analysisStatistics.FirstPassCPUTime.AddDuration(start);
|
// Create Intro classes for each time range.
|
||||||
return (new Intro(lhsId, lhsIntro), new Intro(rhsId, rhsIntro));
|
return (new Intro(lhsId, lhsIntro), new Intro(rhsId, rhsIntro));
|
||||||
}
|
}
|
||||||
|
|
||||||
|
/// <summary>
|
||||||
|
/// Search for a shared introduction sequence using inverted indexes.
|
||||||
|
/// </summary>
|
||||||
|
/// <param name="lhsPoints">Left episode fingerprint points.</param>
|
||||||
|
/// <param name="rhsPoints">Right episode fingerprint points.</param>
|
||||||
|
/// <returns>List of shared TimeRanges between the left and right episodes.</returns>
|
||||||
|
private (List<TimeRange> Lhs, List<TimeRange> Rhs) SearchInvertedIndex(
|
||||||
|
ReadOnlyCollection<uint> lhsPoints,
|
||||||
|
ReadOnlyCollection<uint> rhsPoints)
|
||||||
|
{
|
||||||
|
var lhsRanges = new List<TimeRange>();
|
||||||
|
var rhsRanges = new List<TimeRange>();
|
||||||
|
|
||||||
|
// Generate inverted indexes for the left and right episodes.
|
||||||
|
var lhsIndex = Chromaprint.CreateInvertedIndex(lhsPoints);
|
||||||
|
var rhsIndex = Chromaprint.CreateInvertedIndex(rhsPoints);
|
||||||
|
var indexShifts = new HashSet<int>();
|
||||||
|
|
||||||
|
// For all audio points in the left episode, check if the right episode has a point which matches exactly.
|
||||||
|
// If an exact match is found, calculate the shift that must be used to align the points.
|
||||||
|
foreach (var kvp in lhsIndex)
|
||||||
|
{
|
||||||
|
var point = kvp.Key;
|
||||||
|
|
||||||
|
if (rhsIndex.ContainsKey(point))
|
||||||
|
{
|
||||||
|
// TODO: consider all timecodes before falling back
|
||||||
|
var lhsFirst = (int)lhsIndex[point][0];
|
||||||
|
var rhsFirst = (int)rhsIndex[point][0];
|
||||||
|
indexShifts.Add(rhsFirst - lhsFirst);
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
// Use all discovered shifts to compare the episodes.
|
||||||
|
foreach (var shift in indexShifts)
|
||||||
|
{
|
||||||
|
var (lhsIndexContiguous, rhsIndexContiguous) = ShiftEpisodes(lhsPoints, rhsPoints, shift, shift);
|
||||||
|
lhsRanges.AddRange(lhsIndexContiguous);
|
||||||
|
rhsRanges.AddRange(rhsIndexContiguous);
|
||||||
|
}
|
||||||
|
|
||||||
|
return (lhsRanges, rhsRanges);
|
||||||
|
}
|
||||||
|
|
||||||
/// <summary>
|
/// <summary>
|
||||||
/// Shifts a pair of episodes through the range of provided shift amounts and returns discovered contiguous time ranges.
|
/// Shifts a pair of episodes through the range of provided shift amounts and returns discovered contiguous time ranges.
|
||||||
/// </summary>
|
/// </summary>
|
||||||
|
Loading…
x
Reference in New Issue
Block a user