mejortorrent: remove non-english alphanumeric characters. resolves #13716 (#13720)

This commit is contained in:
ilike2burnthing
2022-11-15 21:44:33 +00:00
committed by GitHub
parent 75b96ae2ea
commit 6f10bcf138

View File

@@ -417,23 +417,23 @@ namespace Jackett.Common.Indexers
private static TorznabQuery ParseQuery(TorznabQuery query) private static TorznabQuery ParseQuery(TorznabQuery query)
{ {
// Eg. Marco.Polo.2014.S02E08 // Eg. Doctor.Who.2005.(Доктор.Кто).S02E08
// the season/episode part is already parsed by Jackett // the season/episode part is already parsed by Jackett
// query.SanitizedSearchTerm = Marco.Polo.2014. // query.GetQueryString = Doctor.Who.2005.(Доктор.Кто).
// query.Season = 2 // query.Season = 2
// query.Episode = 8 // query.Episode = 8
var searchTerm = query.SanitizedSearchTerm; var searchTerm = query.GetQueryString();
// replace punctuation symbols with spaces // replace non-english alphanumeric characters with spaces
// searchTerm = Marco Polo 2014 // searchTerm = Doctor Who 2005
searchTerm = Regex.Replace(searchTerm, @"[-._\(\)@/\\\[\]\+\%]", " "); searchTerm = Regex.Replace(searchTerm, @"[^a-zA-Z0-9]+", " ");
searchTerm = Regex.Replace(searchTerm, @"\s+", " "); searchTerm = Regex.Replace(searchTerm, @"\s+", " ");
searchTerm = searchTerm.Trim(); searchTerm = searchTerm.Trim();
// we parse the year and remove it from search // we parse the year and remove it from search
// searchTerm = Marco Polo // searchTerm = Doctor Who
// query.Year = 2014 // query.Year = 2005
var r = new Regex("([ ]+([0-9]{4}))$", RegexOptions.IgnoreCase); var r = new Regex("([ ]+([0-9]{4}))$", RegexOptions.IgnoreCase);
var m = r.Match(searchTerm); var m = r.Match(searchTerm);
if (m.Success) if (m.Success)