You can not select more than 25 topics
Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
146 lines
4.5 KiB
146 lines
4.5 KiB
using System;
|
|
using System.Collections.Generic;
|
|
using System.Text.RegularExpressions;
|
|
using NzbDrone.Common.Extensions;
|
|
using NzbDrone.Core.Movies;
|
|
|
|
namespace NzbDrone.Core.MetadataSource
|
|
{
|
|
public class SearchMovieComparer : IComparer<Movie>
|
|
{
|
|
private static readonly Regex RegexCleanPunctuation = new Regex("[-._:]", RegexOptions.Compiled);
|
|
private static readonly Regex RegexCleanCountryYearPostfix = new Regex(@"(?<=.+)( \([A-Z]{2}\)| \(\d{4}\)| \([A-Z]{2}\) \(\d{4}\))$", RegexOptions.Compiled);
|
|
private static readonly Regex ArticleRegex = new Regex(@"^(a|an|the)\s", RegexOptions.IgnoreCase | RegexOptions.Compiled);
|
|
|
|
public string SearchQuery { get; private set; }
|
|
|
|
private readonly string _searchQueryWithoutYear;
|
|
private int? _year;
|
|
|
|
public SearchMovieComparer(string searchQuery)
|
|
{
|
|
SearchQuery = searchQuery;
|
|
|
|
var match = Regex.Match(SearchQuery, @"^(?<query>.+)\s+(?:\((?<year>\d{4})\)|(?<year>\d{4}))$");
|
|
if (match.Success)
|
|
{
|
|
_searchQueryWithoutYear = match.Groups["query"].Value.ToLowerInvariant();
|
|
_year = int.Parse(match.Groups["year"].Value);
|
|
}
|
|
else
|
|
{
|
|
_searchQueryWithoutYear = searchQuery.ToLowerInvariant();
|
|
}
|
|
}
|
|
|
|
public int Compare(Movie x, Movie y)
|
|
{
|
|
int result = 0;
|
|
|
|
// Prefer exact matches
|
|
result = Compare(x, y, s => CleanPunctuation(s.Title).Equals(CleanPunctuation(SearchQuery)));
|
|
if (result != 0)
|
|
{
|
|
return -result;
|
|
}
|
|
|
|
// Remove Articles (a/an/the)
|
|
result = Compare(x, y, s => CleanArticles(s.Title).Equals(CleanArticles(SearchQuery)));
|
|
if (result != 0)
|
|
{
|
|
return -result;
|
|
}
|
|
|
|
// Prefer close matches
|
|
result = Compare(x, y, s => CleanPunctuation(s.Title).LevenshteinDistance(CleanPunctuation(SearchQuery)) <= 1);
|
|
if (result != 0)
|
|
{
|
|
return -result;
|
|
}
|
|
|
|
// Compare clean matches by year "Battlestar Galactica 1978"
|
|
result = CompareWithYear(x, y, s => CleanTitle(s.Title).LevenshteinDistance(_searchQueryWithoutYear) <= 1);
|
|
if (result != 0)
|
|
{
|
|
return -result;
|
|
}
|
|
|
|
// Compare prefix matches by year "(CSI: ..."
|
|
result = CompareWithYear(x, y, s => s.Title.ToLowerInvariant().StartsWith(_searchQueryWithoutYear + ":"));
|
|
if (result != 0)
|
|
{
|
|
return -result;
|
|
}
|
|
|
|
return Compare(x, y, s => SearchQuery.LevenshteinDistanceClean(s.Title) - GetYearFactor(s));
|
|
}
|
|
|
|
public int Compare<T>(Movie x, Movie y, Func<Movie, T> keySelector)
|
|
where T : IComparable<T>
|
|
{
|
|
var keyX = keySelector(x);
|
|
var keyY = keySelector(y);
|
|
|
|
return keyX.CompareTo(keyY);
|
|
}
|
|
|
|
public int CompareWithYear(Movie x, Movie y, Predicate<Movie> canMatch)
|
|
{
|
|
var matchX = canMatch(x);
|
|
var matchY = canMatch(y);
|
|
|
|
if (matchX && matchY)
|
|
{
|
|
if (_year.HasValue)
|
|
{
|
|
var result = Compare(x, y, s => s.Year == _year.Value);
|
|
if (result != 0)
|
|
{
|
|
return result;
|
|
}
|
|
}
|
|
|
|
return Compare(x, y, s => s.Year);
|
|
}
|
|
|
|
return matchX.CompareTo(matchY);
|
|
}
|
|
|
|
private string CleanPunctuation(string title)
|
|
{
|
|
title = RegexCleanPunctuation.Replace(title, "");
|
|
|
|
return title.ToLowerInvariant();
|
|
}
|
|
|
|
private string CleanTitle(string title)
|
|
{
|
|
title = RegexCleanPunctuation.Replace(title, "");
|
|
title = RegexCleanCountryYearPostfix.Replace(title, "");
|
|
|
|
return title.ToLowerInvariant();
|
|
}
|
|
|
|
private string CleanArticles(string title)
|
|
{
|
|
title = ArticleRegex.Replace(title, "");
|
|
|
|
return title.Trim().ToLowerInvariant();
|
|
}
|
|
|
|
private int GetYearFactor(Movie movie)
|
|
{
|
|
if (_year.HasValue)
|
|
{
|
|
var offset = Math.Abs(movie.Year - _year.Value);
|
|
if (offset <= 1)
|
|
{
|
|
return 20 - (10 * offset);
|
|
}
|
|
}
|
|
|
|
return 0;
|
|
}
|
|
}
|
|
}
|