2011-04-22 02:23:31 +00:00
|
|
|
using System;
|
2011-04-24 22:32:08 +00:00
|
|
|
using System.Collections.Generic;
|
2011-09-04 03:05:44 +00:00
|
|
|
using System.Linq;
|
2011-04-25 20:21:52 +00:00
|
|
|
using System.Net;
|
2011-04-21 01:29:41 +00:00
|
|
|
using System.ServiceModel.Syndication;
|
2011-07-03 22:32:36 +00:00
|
|
|
using System.Text.RegularExpressions;
|
2011-04-04 03:50:12 +00:00
|
|
|
using NLog;
|
2012-02-11 00:48:20 +00:00
|
|
|
using NzbDrone.Common;
|
2011-04-04 03:50:12 +00:00
|
|
|
using NzbDrone.Core.Model;
|
2011-04-04 07:21:07 +00:00
|
|
|
using NzbDrone.Core.Providers.Core;
|
2011-04-04 03:50:12 +00:00
|
|
|
|
2013-02-21 07:07:34 +00:00
|
|
|
namespace NzbDrone.Core.Indexers.Providers
|
2011-04-04 03:50:12 +00:00
|
|
|
{
|
2011-05-20 04:21:18 +00:00
|
|
|
/// <summary>
/// Base class for feed-based indexers. Derived classes supply the indexer name, feed URLs,
/// search URL builders and NZB link builders; this class downloads the feeds, parses each
/// item into an EpisodeParseResult and logs failures.
/// </summary>
public abstract class IndexerBase
|
2011-04-04 03:50:12 +00:00
|
|
|
{
|
2011-04-22 06:23:29 +00:00
|
|
|
// Logger named after the concrete runtime type; only assigned by the constructor that takes providers.
protected readonly Logger _logger;
|
2012-12-21 08:35:20 +00:00
|
|
|
// Used by Fetch to download the content of each feed URL.
protected readonly HttpProvider _httpProvider;
|
2011-05-20 03:47:07 +00:00
|
|
|
// Stored by the constructor for derived indexers; not read anywhere in this base class.
protected readonly ConfigProvider _configProvider;
|
2011-04-19 00:12:06 +00:00
|
|
|
|
2012-09-06 15:37:38 +00:00
|
|
|
// Matches any single non-word character; GetQueryTitle replaces each match with '+'.
protected static readonly Regex TitleSearchRegex = new Regex(@"[\W]", RegexOptions.IgnoreCase | RegexOptions.Compiled);
|
2012-02-27 05:33:24 +00:00
|
|
|
// Matches a leading "the" followed by one whitespace character (case-insensitive); GetQueryTitle strips it.
protected static readonly Regex RemoveThe = new Regex(@"^the\s", RegexOptions.IgnoreCase | RegexOptions.Compiled);
|
2011-07-03 22:32:36 +00:00
|
|
|
|
2011-05-26 04:25:59 +00:00
|
|
|
/// <summary>
/// Creates the indexer with its collaborators and a logger named after the concrete runtime type.
/// </summary>
/// <param name="httpProvider">Provider stored for downloading feed content.</param>
/// <param name="configProvider">Configuration provider stored for derived indexers.</param>
protected IndexerBase(HttpProvider httpProvider, ConfigProvider configProvider)
{
    // The logger name is the runtime type, so each derived indexer logs under its own name
    var loggerName = GetType().ToString();
    _logger = LogManager.GetLogger(loggerName);

    _configProvider = configProvider;
    _httpProvider = httpProvider;
}
|
|
|
|
|
2011-05-27 03:54:28 +00:00
|
|
|
/// <summary>
/// Parameterless constructor. It performs no initialization, so the logger and provider
/// fields stay unassigned.
/// NOTE(review): presumably present for proxy/mocking scenarios - confirm before relying on it.
/// </summary>
public IndexerBase() { }
|
|
|
|
|
2011-04-04 03:50:12 +00:00
|
|
|
/// <summary>
/// Gets the name of this indexer. It appears in log messages and is used as the
/// indexer label on parsed results that do not already carry one.
/// </summary>
public abstract string Name { get; }
|
2011-04-04 03:50:12 +00:00
|
|
|
|
2011-04-04 06:53:22 +00:00
|
|
|
/// <summary>
/// Gets the feed URLs that FetchRss downloads and parses.
/// </summary>
protected abstract string[] Urls { get; }
|
2011-04-04 06:53:22 +00:00
|
|
|
|
2012-02-01 01:37:36 +00:00
|
|
|
/// <summary>
/// Gets whether the indexer is configured; when false, Fetch logs a warning and returns no results.
/// </summary>
public abstract bool IsConfigured { get; }
|
|
|
|
|
2012-04-14 22:33:58 +00:00
|
|
|
/// <summary>
/// Indicates whether the indexer should be enabled by default.
/// The base implementation answers <c>false</c>; derived indexers may override it.
/// </summary>
public virtual bool EnabledByDefault
{
    get
    {
        return false;
    }
}
|
2012-02-01 01:37:36 +00:00
|
|
|
|
2011-05-27 02:12:28 +00:00
|
|
|
/// <summary>
/// Gets the network credentials handed to the HTTP provider when a feed is downloaded.
/// The base implementation supplies none (<c>null</c>).
/// </summary>
protected virtual NetworkCredential Credentials
{
    get
    {
        return null;
    }
}
|
|
|
|
|
2011-11-29 06:49:38 +00:00
|
|
|
/// <summary>
/// Builds the URLs queried by FetchEpisode.
/// </summary>
/// <param name="seriesTitle">Series title already cleaned by GetQueryTitle.</param>
/// <param name="seasonNumber">Season being searched.</param>
/// <param name="episodeNumber">Episode being searched.</param>
/// <returns>URLs that are passed to Fetch.</returns>
protected abstract IList<string> GetEpisodeSearchUrls(string seriesTitle, int seasonNumber, int episodeNumber);

/// <summary>
/// Builds the URLs queried by FetchDailyEpisode.
/// </summary>
/// <param name="seriesTitle">Series title already cleaned by GetQueryTitle.</param>
/// <param name="date">Air date being searched.</param>
/// <returns>URLs that are passed to Fetch.</returns>
protected abstract IList<string> GetDailyEpisodeSearchUrls(string seriesTitle, DateTime date);

/// <summary>
/// Builds the URLs queried by FetchSeason.
/// </summary>
/// <param name="seriesTitle">Series title already cleaned by GetQueryTitle.</param>
/// <param name="seasonNumber">Season being searched.</param>
/// <returns>URLs that are passed to Fetch.</returns>
protected abstract IList<string> GetSeasonSearchUrls(string seriesTitle, int seasonNumber);

/// <summary>
/// Builds the URLs queried by FetchPartialSeason.
/// </summary>
/// <param name="seriesTitle">Series title already cleaned by GetQueryTitle.</param>
/// <param name="seasonNumber">Season being searched.</param>
/// <param name="episodeWildcard">
/// The episode prefix supplied to FetchPartialSeason.
/// NOTE(review): presumably the leading digit(s) of the episode numbers to match - confirm with implementers.
/// </param>
/// <returns>URLs that are passed to Fetch.</returns>
protected abstract IList<string> GetPartialSeasonSearchUrls(string seriesTitle, int seasonNumber, int episodeWildcard);
|
2011-05-26 04:25:59 +00:00
|
|
|
|
2011-04-25 20:21:52 +00:00
|
|
|
/// <summary>
/// Extension point for indexer-specific parsing; ParseFeed calls it as its last step.
/// The base implementation hands <paramref name="currentResult"/> back untouched.
/// </summary>
/// <param name="item">Feed item being parsed.</param>
/// <param name="currentResult">Result of the built-in title parse; null when the title could not be parsed.</param>
/// <returns>The parse result to use for the item.</returns>
protected virtual EpisodeParseResult CustomParser(SyndicationItem item, EpisodeParseResult currentResult)
{
    var unchanged = currentResult;
    return unchanged;
}
|
|
|
|
|
2012-04-14 23:37:36 +00:00
|
|
|
/// <summary>
/// Extension point that produces the title string handed to the parser.
/// The base implementation uses the text of the feed item's title as-is.
/// </summary>
/// <param name="item">Feed item whose title is about to be parsed.</param>
/// <returns>The title text to parse.</returns>
protected virtual string TitlePreParser(SyndicationItem item)
{
    var feedTitle = item.Title;
    return feedTitle.Text;
}
|
|
|
|
|
2011-05-27 02:12:28 +00:00
|
|
|
/// <summary>
/// Produces the direct NZB download link for a feed item; Fetch stores it on the parsed result.
/// </summary>
/// <param name="item">Feed item to build the link for.</param>
/// <returns>The download URL.</returns>
protected abstract string NzbDownloadUrl(SyndicationItem item);
|
2011-04-04 06:53:22 +00:00
|
|
|
|
2012-05-02 19:02:39 +00:00
|
|
|
/// <summary>
/// Produces the link to the NZB's information page at the indexer; Fetch stores it on the parsed result.
/// </summary>
/// <param name="item">Feed item to build the link for.</param>
/// <returns>The info page URL.</returns>
protected abstract string NzbInfoUrl(SyndicationItem item);
|
|
|
|
|
2011-04-04 06:53:22 +00:00
|
|
|
/// <summary>
/// Downloads every URL in Urls and parses the feed items found there.
/// </summary>
/// <returns>Whatever Fetch returns for the configured feed URLs.</returns>
public virtual IList<EpisodeParseResult> FetchRss()
{
    _logger.Debug("Fetching feeds from " + Name);

    // Fetch builds its own result list, so no placeholder list is allocated here
    var result = Fetch(Urls);

    _logger.Debug("Finished processing feeds from " + Name);
    return result;
}
|
|
|
|
|
2011-08-28 05:45:36 +00:00
|
|
|
/// <summary>
/// Searches this indexer for a whole season of a series.
/// </summary>
/// <param name="seriesTitle">Series title; cleaned with GetQueryTitle before the search URLs are built.</param>
/// <param name="seasonNumber">Season to search for.</param>
/// <returns>Parse results fetched from the season search URLs.</returns>
public virtual IList<EpisodeParseResult> FetchSeason(string seriesTitle, int seasonNumber)
{
    _logger.Debug("Searching {0} for {1} Season {2}", Name, seriesTitle, seasonNumber);

    var queryTitle = GetQueryTitle(seriesTitle);
    var reports = Fetch(GetSeasonSearchUrls(queryTitle, seasonNumber));

    _logger.Info("Finished searching {0} for {1} Season {2}, Found {3}", Name, seriesTitle, seasonNumber, reports.Count);
    return reports;
}
|
2011-05-26 04:25:59 +00:00
|
|
|
|
2011-09-01 06:58:54 +00:00
|
|
|
/// <summary>
/// Searches this indexer for part of a season, selected by an episode prefix.
/// </summary>
/// <param name="seriesTitle">Series title; cleaned with GetQueryTitle before the search URLs are built.</param>
/// <param name="seasonNumber">Season to search for.</param>
/// <param name="episodePrefix">Episode prefix forwarded to GetPartialSeasonSearchUrls.</param>
/// <returns>Parse results fetched from the partial-season search URLs.</returns>
public virtual IList<EpisodeParseResult> FetchPartialSeason(string seriesTitle, int seasonNumber, int episodePrefix)
{
    _logger.Debug("Searching {0} for {1} Season {2}, Prefix: {3}", Name, seriesTitle, seasonNumber, episodePrefix);

    var searchUrls = GetPartialSeasonSearchUrls(GetQueryTitle(seriesTitle), seasonNumber, episodePrefix);
    var result = Fetch(searchUrls);

    // Include the prefix so this line matches the start message and is distinguishable from a full-season search
    _logger.Info("Finished searching {0} for {1} Season {2}, Prefix: {3}, Found {4}", Name, seriesTitle, seasonNumber, episodePrefix, result.Count);
    return result;
}
|
|
|
|
|
2011-05-27 03:54:28 +00:00
|
|
|
/// <summary>
/// Searches this indexer for a single episode identified by season and episode number.
/// </summary>
/// <param name="seriesTitle">Series title; cleaned with GetQueryTitle before the search URLs are built.</param>
/// <param name="seasonNumber">Season of the episode.</param>
/// <param name="episodeNumber">Number of the episode within the season.</param>
/// <returns>Parse results fetched from the episode search URLs.</returns>
public virtual IList<EpisodeParseResult> FetchEpisode(string seriesTitle, int seasonNumber, int episodeNumber)
{
    _logger.Debug("Searching {0} for {1}-S{2:00}E{3:00}", Name, seriesTitle, seasonNumber, episodeNumber);

    var queryTitle = GetQueryTitle(seriesTitle);
    var reports = Fetch(GetEpisodeSearchUrls(queryTitle, seasonNumber, episodeNumber));

    _logger.Info("Finished searching {0} for {1} S{2:00}E{3:00}, Found {4}", Name, seriesTitle, seasonNumber, episodeNumber, reports.Count);
    return reports;
}
|
2011-04-04 03:50:12 +00:00
|
|
|
|
2011-11-26 06:13:47 +00:00
|
|
|
/// <summary>
/// Searches this indexer for an episode identified by its air date.
/// </summary>
/// <param name="seriesTitle">Series title; cleaned with GetQueryTitle before the search URLs are built.</param>
/// <param name="airDate">Air date of the episode.</param>
/// <returns>Parse results fetched from the daily-episode search URLs.</returns>
public virtual IList<EpisodeParseResult> FetchDailyEpisode(string seriesTitle, DateTime airDate)
{
    _logger.Debug("Searching {0} for {1}-{2}", Name, seriesTitle, airDate.ToShortDateString());

    var queryTitle = GetQueryTitle(seriesTitle);
    var reports = Fetch(GetDailyEpisodeSearchUrls(queryTitle, airDate));

    _logger.Info("Finished searching {0} for {1}-{2}, Found {3}", Name, seriesTitle, airDate.ToShortDateString(), reports.Count);
    return reports;
}
|
|
|
|
|
2012-12-21 08:35:20 +00:00
|
|
|
/// <summary>
/// Downloads each feed URL, parses every item in it and collects the items that parsed successfully.
/// Failures are logged and skipped: a failing item does not stop the rest of its feed, and a
/// failing feed does not stop the remaining URLs.
/// </summary>
/// <param name="urls">Feed URLs to download; a null sequence is treated as empty.</param>
/// <returns>The parsed results; empty when the indexer is not configured or nothing could be parsed.</returns>
protected virtual List<EpisodeParseResult> Fetch(IEnumerable<string> urls)
{
    var result = new List<EpisodeParseResult>();

    if (!IsConfigured)
    {
        _logger.Warn("Indexer '{0}' isn't configured correctly. please reconfigure the indexer in settings page.", Name);
        return result;
    }

    if (urls == null)
    {
        return result;
    }

    foreach (var url in urls)
    {
        try
        {
            _logger.Trace("Downloading RSS " + url);

            List<SyndicationItem> feedItems;

            // Release the download and the reader as soon as the feed is in memory, even when loading throws
            using (var stream = _httpProvider.DownloadStream(url, Credentials))
            using (var reader = new SyndicationFeedXmlReader(stream))
            {
                feedItems = SyndicationFeed.Load(reader).Items.ToList();
            }

            foreach (var item in feedItems)
            {
                try
                {
                    var parsedEpisode = ParseFeed(item);
                    if (parsedEpisode != null)
                    {
                        parsedEpisode.NzbUrl = NzbDownloadUrl(item);
                        parsedEpisode.NzbInfoUrl = NzbInfoUrl(item);
                        parsedEpisode.Indexer = String.IsNullOrWhiteSpace(parsedEpisode.Indexer) ? Name : parsedEpisode.Indexer;
                        result.Add(parsedEpisode);
                    }
                }
                catch (Exception itemEx)
                {
                    // Store plain strings through the indexer: on .NET Framework Exception.Data rejects
                    // non-serializable values, and Add() throws when the key is already present. Either
                    // failure here would escape to the feed-level handler and drop the remaining items.
                    itemEx.Data["FeedUrl"] = url;
                    itemEx.Data["Item"] = item.Title == null ? null : item.Title.Text;
                    _logger.ErrorException("An error occurred while processing feed item", itemEx);
                }
            }
        }
        catch (WebException webException)
        {
            // Prefer the actual HTTP status; keep the message probe for responses that carry no status object
            var httpResponse = webException.Response as HttpWebResponse;
            var serviceUnavailable = (httpResponse != null && httpResponse.StatusCode == HttpStatusCode.ServiceUnavailable)
                                     || webException.Message.Contains("503");

            if (serviceUnavailable)
            {
                _logger.Warn("{0} server is currently unavailable.{1} {2}", Name,url, webException.Message);
            }
            else
            {
                webException.Data["FeedUrl"] = url;
                _logger.ErrorException("An error occurred while processing feed. " + url, webException);
            }
        }
        catch (Exception feedEx)
        {
            feedEx.Data["FeedUrl"] = url;
            _logger.ErrorException("An error occurred while processing feed. " + url, feedEx);
        }
    }

    return result;
}
|
2011-04-19 00:12:06 +00:00
|
|
|
|
2011-04-21 01:26:13 +00:00
|
|
|
/// <summary>
/// Parses a single feed item: pre-processes its title, runs the built-in title parser,
/// fills in age, original string and scene-source flag, then gives CustomParser the final say.
/// </summary>
/// <param name="item">RSS feed item to parse.</param>
/// <returns>Whatever CustomParser returns; the base CustomParser passes through the built-in result, which is null when the title could not be parsed.</returns>
public EpisodeParseResult ParseFeed(SyndicationItem item)
{
    var title = TitlePreParser(item);

    var episodeParseResult = Parser.ParseTitle(title);
    if (episodeParseResult != null)
    {
        // PublishDate.Date is expressed in the feed's own UTC offset; convert to local time first so
        // both calendar dates are in the same zone and the day difference is not off by one
        episodeParseResult.Age = DateTime.Now.Date.Subtract(item.PublishDate.LocalDateTime.Date).Days;
        episodeParseResult.OriginalString = title;
        episodeParseResult.SceneSource = true;
    }

    // Log the string that was actually parsed; this also avoids dereferencing item.Title a second time
    _logger.Trace("Parsed: {0} from: {1}", episodeParseResult, title);

    return CustomParser(item, episodeParseResult);
}
|
2011-05-27 06:03:57 +00:00
|
|
|
|
2012-02-11 08:09:28 +00:00
|
|
|
/// <summary>
/// Turns a series title into a search query term: drops a leading "the", replaces every
/// non-word character with '+', trims '+' from both ends and collapses repeated '+'.
/// Can be overridden to provide indexer-specific title cleaning.
/// </summary>
/// <param name="title">Title that needs to be cleaned.</param>
/// <returns>The cleaned title, with words separated by single '+' characters.</returns>
public virtual string GetQueryTitle(string title)
{
    title = RemoveThe.Replace(title, string.Empty);

    var cleanTitle = TitleSearchRegex.Replace(title, "+").Trim('+', ' ');

    // Collapse every run of two or more '+' into one, however long the run is
    cleanTitle = Regex.Replace(cleanTitle, @"\+{2,}", "+");
    return cleanTitle;
}
|
2011-04-04 03:50:12 +00:00
|
|
|
}
|
2011-04-10 02:44:01 +00:00
|
|
|
}
|