2010-10-21 04:49:23 +03:00
|
|
|
using System;
|
|
|
|
using System.Collections.Generic;
|
|
|
|
using System.IO;
|
|
|
|
using System.Linq;
|
|
|
|
using System.Text;
|
|
|
|
using System.Text.RegularExpressions;
|
|
|
|
using NLog;
|
|
|
|
using NzbDrone.Core.Model;
|
|
|
|
using NzbDrone.Core.Providers;
|
|
|
|
using NzbDrone.Core.Repository.Quality;
|
|
|
|
|
|
|
|
namespace NzbDrone.Core
|
|
|
|
{
|
|
|
|
internal static class Parser
|
|
|
|
{
|
|
|
|
// Options shared by every expression declared below.
private const RegexOptions ParserRegexOptions = RegexOptions.IgnoreCase | RegexOptions.Compiled;

// Logger for this class, obtained from NLog.
private static readonly Logger Logger = LogManager.GetCurrentClassLogger();

// Expressions for episode report titles. Each one exposes the named groups
// "title", "year", "season" and "episode".
private static readonly Regex[] ReportTitleRegex = new Regex[]
{
    new Regex(@"(?<title>.+?)?\W?(?<year>\d+?)?\WS?(?<season>\d+)(?:\-|\.|[a-z])(?<episode>\d+)\W(?!\\)", ParserRegexOptions),
    new Regex(@"(?<title>.+?)?\W?(?<year>\d+?)?\WS?(?<season>\d+)(?<episode>\d{2})\W(?!\\)", ParserRegexOptions) //Supports 103/113 naming
};

// Expressions for season report titles. Exposes the named groups
// "title", "year" and "season" (there is no "episode" group).
private static readonly Regex[] SeasonReportTitleRegex = new Regex[]
{
    new Regex(@"(?<title>.+?)?\W?(?<year>\d{4}?)?\W(?:S|Season)?\W?(?<season>\d+)(?!\\)", ParserRegexOptions),
};

// Matches a whitespace-delimited "the" or "and", or any single character that is not a letter a-z
// (case-insensitive).
private static readonly Regex NormalizeRegex = new Regex(@"((\s|^)the(\s|$))|((\s|^)and(\s|$))|[^a-z]", ParserRegexOptions);
|
|
|
|
|
|
|
|
/// <summary>
/// Parses a post title into the episodes it contains.
/// </summary>
/// <param name="title">Title of the report</param>
/// <returns>
/// The result built from the first expression in ReportTitleRegex that matches and yields a
/// usable season number; null when no expression does.
/// </returns>
internal static EpisodeParseResult ParseEpisodeInfo(string title)
{
    Logger.Trace("Parsing string '{0}'", title);

    foreach (var regex in ReportTitleRegex)
    {
        var matches = regex.Matches(title);

        if (matches.Count == 0)
        {
            continue;
        }

        var firstMatch = matches[0];

        // \d matches any Unicode decimal digit and the run length is unbounded, so the capture
        // is not guaranteed to fit an Int32. Treat an unusable season as "no match" for this
        // expression instead of letting a Format/Overflow exception escape.
        int seasonNumber;
        if (!Int32.TryParse(firstMatch.Groups["season"].Value, out seasonNumber))
        {
            continue;
        }

        // The year group is optional; TryParse leaves 0 when it is empty or unparsable.
        int year;
        Int32.TryParse(firstMatch.Groups["year"].Value, out year);

        // Discard values that cannot plausibly be a year.
        if (year < 1900 || year > DateTime.Now.Year + 1)
        {
            year = 0;
        }

        var parsedEpisode = new EpisodeParseResult
        {
            Proper = ParseProper(title),
            SeriesTitle = NormalizeTitle(firstMatch.Groups["title"].Value),
            SeasonNumber = seasonNumber,
            Year = year,
            Episodes = new List<int>()
        };

        // Every match of the expression contributes one episode number.
        foreach (Match episodeMatch in matches)
        {
            int episodeNumber;
            if (Int32.TryParse(episodeMatch.Groups["episode"].Value, out episodeNumber))
            {
                parsedEpisode.Episodes.Add(episodeNumber);
            }
        }

        parsedEpisode.Quality = ParseQuality(title);

        Logger.Trace("Episode Parsed. {0}", parsedEpisode);

        return parsedEpisode;
    }

    Logger.Warn("Unable to parse text into episode info. {0}", title);
    return null;
}
|
|
|
|
|
2011-03-25 06:15:02 +02:00
|
|
|
/// <summary>
/// Parses a post title into the season it contains.
/// </summary>
/// <param name="title">Title of the report</param>
/// <returns>
/// Season information built from the first expression in SeasonReportTitleRegex that matches
/// and yields a usable season number; null when no expression does.
/// </returns>
internal static SeasonParseResult ParseSeasonInfo(string title)
{
    Logger.Trace("Parsing string '{0}'", title);

    // Use the season expressions: the episode expressions in ReportTitleRegex require an
    // "episode" group and therefore cannot match a title that names only a season.
    foreach (var regex in SeasonReportTitleRegex)
    {
        var match = regex.Match(title);

        if (!match.Success)
        {
            continue;
        }

        // \d matches any Unicode decimal digit and the run length is unbounded, so the capture
        // is not guaranteed to fit an Int32. Skip this expression rather than throw.
        int seasonNumber;
        if (!Int32.TryParse(match.Groups["season"].Value, out seasonNumber))
        {
            continue;
        }

        // The year group is optional; TryParse leaves 0 when it is empty or unparsable.
        int year;
        Int32.TryParse(match.Groups["year"].Value, out year);

        // Discard values that cannot plausibly be a year.
        if (year < 1900 || year > DateTime.Now.Year + 1)
        {
            year = 0;
        }

        var result = new SeasonParseResult
        {
            SeriesTitle = NormalizeTitle(match.Groups["title"].Value),
            SeasonNumber = seasonNumber,
            Year = year
        };

        result.Quality = ParseQuality(title);

        Logger.Trace("Season Parsed. {0}", result);
        return result;
    }

    return null; //Nothing matched
}
|
|
|
|
|
2011-03-03 10:50:33 +02:00
|
|
|
/// <summary>
/// Parses a post title to find the series that relates to it.
/// </summary>
/// <param name="title">Title of the report</param>
/// <returns>
/// The normalized series name taken from the "title" group of the first expression in
/// ReportTitleRegex that matches; an empty string when none matches.
/// </returns>
internal static string ParseSeriesName(string title)
{
    Logger.Trace("Parsing string '{0}'", title);

    foreach (var regex in ReportTitleRegex)
    {
        // Only the first match is needed, so there is no reason to enumerate all of them.
        var match = regex.Match(title);

        if (match.Success)
        {
            var seriesName = NormalizeTitle(match.Groups["title"].Value);

            Logger.Trace("Series Parsed. {0}", seriesName);
            return seriesName;
        }
    }

    return String.Empty;
}
|
|
|
|
|
2010-10-21 04:49:23 +03:00
|
|
|
/// <summary>
/// Parses proper status out of a report title.
/// </summary>
/// <param name="title">Title of the report</param>
/// <returns>true when the title contains "proper" in any letter casing; otherwise false</returns>
internal static bool ParseProper(string title)
{
    // Ordinal, case-insensitive search: independent of the thread culture and does not
    // allocate a lower-cased copy of the title.
    return title.IndexOf("proper", StringComparison.OrdinalIgnoreCase) >= 0;
}
|
|
|
|
|
2011-04-05 01:46:07 +03:00
|
|
|
/// <summary>
/// Determines the quality of a report from tokens in its name, falling back to the
/// file extension when no token is recognised.
/// </summary>
/// <param name="name">Report title or file name</param>
/// <returns>The detected quality, or QualityTypes.Unknown when nothing is recognised</returns>
private static QualityTypes ParseQuality(string name)
{
    Logger.Trace("Trying to parse quality for {0}", name);

    // All checks below compare against lower-case tokens.
    name = name.ToLowerInvariant();

    if (name.Contains("dvd"))
    {
        return QualityTypes.DVD;
    }

    if (name.Contains("bdrip") || name.Contains("brrip"))
    {
        return QualityTypes.BDRip;
    }

    if (name.Contains("xvid") || name.Contains("divx"))
    {
        if (name.Contains("bluray"))
        {
            return QualityTypes.BDRip;
        }

        return QualityTypes.TV;
    }

    if (name.Contains("bluray"))
    {
        if (name.Contains("720p"))
        {
            return QualityTypes.Bluray720;
        }

        if (name.Contains("1080p"))
        {
            return QualityTypes.Bluray1080;
        }

        // No resolution token: treated as 720.
        return QualityTypes.Bluray720;
    }

    if (name.Contains("web-dl"))
    {
        return QualityTypes.WEBDL;
    }

    if (name.Contains("x264") || name.Contains("h264") || name.Contains("720p"))
    {
        return QualityTypes.HDTV;
    }

    //Based on extension
    // The extension is taken with plain string operations: building a FileInfo from a
    // report title throws when the title contains characters that are illegal in paths.
    var result = QualityTypes.Unknown;
    var lastDot = name.LastIndexOf('.');
    var extension = lastDot < 0 ? String.Empty : name.Substring(lastDot);

    switch (extension)
    {
        case ".avi":
        case ".xvid":
        case ".wmv":
            {
                result = QualityTypes.TV;
                break;
            }
        case ".mkv":
            {
                result = QualityTypes.HDTV;
                break;
            }
    }

    Logger.Trace("Quality Parsed:{0} Title:{1}", result, name);
    return result;
}
|
|
|
|
|
|
|
|
/// <summary>
/// Normalizes the title by removing everything NormalizeRegex matches (whitespace-delimited
/// 'the' and 'and', and every character that is not a letter a-z) and lower-casing the rest.
/// </summary>
/// <param name="title">title</param>
/// <returns>The normalized, lower-case title</returns>
internal static string NormalizeTitle(string title)
{
    // Invariant lower-casing keeps the result independent of the thread culture
    // (e.g. under a Turkish culture ToLower() maps 'I' to a dotless 'ı').
    return NormalizeRegex.Replace(title, String.Empty).ToLowerInvariant();
}
|
2010-10-24 10:46:58 +03:00
|
|
|
|
2010-11-06 18:01:46 +02:00
|
|
|
//Note: changing case on path is a problem for running on mono/*nix
//Not going to change the casing any more... Looks Ugly in UI anyways :P
/// <summary>
/// Returns the full form of a path with trailing separators and spaces removed.
/// </summary>
/// <param name="path">Path to normalize</param>
/// <returns>The full path without trailing '/', '\' or ' ' characters</returns>
/// <exception cref="ArgumentException">path is null or empty</exception>
public static string NormalizePath(string path)
{
    if (String.IsNullOrEmpty(path))
    {
        throw new ArgumentException("Path can not be null or empty");
    }

    // Only the end is trimmed. Leading characters are significant: a UNC path starts
    // with "\\" and a rooted *nix path starts with "/", and stripping either would turn
    // the result into a different (relative) path.
    return new FileInfo(path).FullName.TrimEnd('/', '\\', ' ');
}
|
2011-01-29 08:10:22 +02:00
|
|
|
|
|
|
|
|
2010-10-21 04:49:23 +03:00
|
|
|
}
|
2011-04-05 05:48:46 +03:00
|
|
|
}
|