Jackett/src/Jackett.Common/Indexers/HDTorrents.cs

262 lines
12 KiB
C#

using System;
using System.Collections.Generic;
using System.Collections.Specialized;
using System.Diagnostics.CodeAnalysis;
using System.Globalization;
using System.Linq;
using System.Text;
using System.Text.RegularExpressions;
using System.Threading.Tasks;
using AngleSharp.Html.Parser;
using Jackett.Common.Models;
using Jackett.Common.Models.IndexerConfig;
using Jackett.Common.Services.Interfaces;
using Jackett.Common.Utils;
using Jackett.Common.Utils.Clients;
using Newtonsoft.Json.Linq;
using NLog;
namespace Jackett.Common.Indexers
{
[ExcludeFromCodeCoverage]
public class HDTorrents : BaseWebIndexer
{
private string SearchUrl => SiteLink + "torrents.php?";
private string LoginUrl => SiteLink + "login.php";
private readonly Regex _posterRegex = new Regex(@"src=\\'./([^']+)\\'", RegexOptions.IgnoreCase);
private readonly HashSet<string> _freeleechRanks = new HashSet<string>(StringComparer.OrdinalIgnoreCase)
{
"VIP",
"Uploader",
"HD Internal",
"Moderator",
"Administrator",
"Owner"
};
public override string[] AlternativeSiteLinks { get; protected set; } =
{
"https://hdts.ru/",
"https://hd-torrents.org/",
"https://hd-torrents.me/"
};
public override string[] LegacySiteLinks { get; protected set; } = {
"https://hd-torrents.net/"
};
private new ConfigurationDataBasicLogin configData => (ConfigurationDataBasicLogin)base.configData;
public HDTorrents(IIndexerConfigurationService configService, WebClient w, Logger l, IProtectionService ps,
ICacheService cs)
: base(id: "hdtorrents",
name: "HD-Torrents",
description: "HD-Torrents is a private torrent website with HD torrents and strict rules on their content.",
link: "https://hdts.ru/", // Domain https://hdts.ru/ seems more reliable
caps: new TorznabCapabilities
{
TvSearchParams = new List<TvSearchParam>
{
TvSearchParam.Q, TvSearchParam.Season, TvSearchParam.Ep, TvSearchParam.ImdbId
},
MovieSearchParams = new List<MovieSearchParam>
{
MovieSearchParam.Q, MovieSearchParam.ImdbId
},
MusicSearchParams = new List<MusicSearchParam>
{
MusicSearchParam.Q
}
},
configService: configService,
client: w,
logger: l,
p: ps,
cacheService: cs,
configData: new ConfigurationDataBasicLogin(
"For best results, change the <b>Torrents per page:</b> setting to <b>100</b> on your account profile."))
{
Encoding = Encoding.UTF8;
Language = "en-US";
Type = "private";
// Movie
AddCategoryMapping("70", TorznabCatType.MoviesUHD, "Movie/UHD/Blu-Ray");
AddCategoryMapping("1", TorznabCatType.MoviesHD, "Movie/Blu-Ray");
AddCategoryMapping("71", TorznabCatType.MoviesUHD, "Movie/UHD/Remux");
AddCategoryMapping("2", TorznabCatType.MoviesHD, "Movie/Remux");
AddCategoryMapping("5", TorznabCatType.MoviesHD, "Movie/1080p/i");
AddCategoryMapping("3", TorznabCatType.MoviesHD, "Movie/720p");
AddCategoryMapping("64", TorznabCatType.MoviesUHD, "Movie/2160p");
AddCategoryMapping("63", TorznabCatType.Audio, "Movie/Audio Track");
// TV Show
AddCategoryMapping("72", TorznabCatType.TVUHD, "TV Show/UHD/Blu-ray");
AddCategoryMapping("59", TorznabCatType.TVHD, "TV Show/Blu-ray");
AddCategoryMapping("73", TorznabCatType.TVUHD, "TV Show/UHD/Remux");
AddCategoryMapping("60", TorznabCatType.TVHD, "TV Show/Remux");
AddCategoryMapping("30", TorznabCatType.TVHD, "TV Show/1080p/i");
AddCategoryMapping("38", TorznabCatType.TVHD, "TV Show/720p");
AddCategoryMapping("65", TorznabCatType.TVUHD, "TV Show/2160p");
// Music
AddCategoryMapping("44", TorznabCatType.Audio, "Music/Album");
AddCategoryMapping("61", TorznabCatType.AudioVideo, "Music/Blu-Ray");
AddCategoryMapping("62", TorznabCatType.AudioVideo, "Music/Remux");
AddCategoryMapping("57", TorznabCatType.AudioVideo, "Music/1080p/i");
AddCategoryMapping("45", TorznabCatType.AudioVideo, "Music/720p");
AddCategoryMapping("66", TorznabCatType.AudioVideo, "Music/2160p");
// XXX
AddCategoryMapping("58", TorznabCatType.XXX, "XXX/Blu-ray");
AddCategoryMapping("74", TorznabCatType.XXX, "XXX/UHD/Blu-ray");
AddCategoryMapping("48", TorznabCatType.XXX, "XXX/1080p/i");
AddCategoryMapping("47", TorznabCatType.XXX, "XXX/720p");
AddCategoryMapping("67", TorznabCatType.XXX, "XXX/2160p");
}
public override async Task<IndexerConfigurationStatus> ApplyConfiguration(JToken configJson)
{
LoadValuesFromJson(configJson);
var loginPage = await RequestWithCookiesAsync(LoginUrl, string.Empty);
var pairs = new Dictionary<string, string> {
{ "uid", configData.Username.Value },
{ "pwd", configData.Password.Value }
};
var result = await RequestLoginAndFollowRedirect(LoginUrl, pairs, loginPage.Cookies, true, null, LoginUrl);
await ConfigureIfOK(
result.Cookies, result.ContentString?.Contains("If your browser doesn't have javascript enabled") == true,
() => throw new ExceptionWithConfigData("Couldn't login", configData));
return IndexerConfigurationStatus.RequiresTesting;
}
protected override async Task<IEnumerable<ReleaseInfo>> PerformQuery(TorznabQuery query)
{
var releases = new List<ReleaseInfo>();
var searchUrl = SearchUrl + string.Join(
string.Empty, MapTorznabCapsToTrackers(query).Select(cat => $"category[]={cat}&"));
var queryCollection = new NameValueCollection
{
{"search", query.ImdbID ?? query.GetQueryString()},
{"active", "0"},
{"options", "0"}
};
// manually url encode parenthesis to prevent "hacking" detection, remove . as not used in titles
searchUrl += queryCollection.GetQueryString().Replace("(", "%28").Replace(")", "%29").Replace(".", " ");
var results = await RequestWithCookiesAndRetryAsync(searchUrl);
try
{
var parser = new HtmlParser();
var dom = parser.ParseDocument(results.ContentString);
var userInfo = dom.QuerySelector("table.navus tr");
var userRank = userInfo.Children[1].TextContent.Replace("Rank:", string.Empty).Trim();
var hasFreeleech = _freeleechRanks.Contains(userRank);
var rows = dom.QuerySelectorAll("table.mainblockcontenttt tr:has(td.mainblockcontent)");
foreach (var row in rows.Skip(1))
{
if (row.Children.Length == 2)
continue; // fix bug with search: cohen
var mainLink = row.Children[2].QuerySelector("a");
var title = mainLink.TextContent;
var details = new Uri(SiteLink + mainLink.GetAttribute("href"));
var posterMatch = _posterRegex.Match(mainLink.GetAttribute("onmouseover"));
var poster = posterMatch.Success ? new Uri(SiteLink + posterMatch.Groups[1].Value.Replace("\\", "/")) : null;
var link = new Uri(SiteLink + row.Children[4].FirstElementChild.GetAttribute("href"));
var description = row.Children[2].QuerySelector("span").TextContent;
var size = ReleaseInfo.GetBytes(row.Children[7].TextContent);
var dateTag = row.Children[6].FirstElementChild;
var dateString = string.Join(" ", dateTag.Attributes.Select(attr => attr.Name));
var publishDate = DateTime.ParseExact(dateString, "dd MMM yyyy HH:mm:ss zz00", CultureInfo.InvariantCulture).ToLocalTime();
var catStr = row.FirstElementChild.FirstElementChild.GetAttribute("href").Split('=')[1];
var cat = MapTrackerCatToNewznab(catStr);
// Sometimes the uploader column is missing, so seeders, leechers, and grabs may be at a different index.
// There's room for improvement, but this works for now.
var endIndex = row.Children.Length;
//Maybe use row.Children.Index(Node) after searching for an element instead?
if (row.Children[endIndex - 1].TextContent == "Edit")
endIndex -= 1;
// moderators get additional delete, recommend and like links
else if (row.Children[endIndex - 4].TextContent == "Edit")
endIndex -= 4;
int? seeders = null;
int? peers = null;
if (ParseUtil.TryCoerceInt(row.Children[endIndex - 3].TextContent, out var rSeeders))
{
seeders = rSeeders;
if (ParseUtil.TryCoerceInt(row.Children[endIndex - 2].TextContent, out var rLeechers))
peers = rLeechers + rSeeders;
}
var grabs = ParseUtil.TryCoerceLong(row.Children[endIndex - 1].TextContent, out var rGrabs)
? (long?)rGrabs
: null;
var dlVolumeFactor = 1.0;
var upVolumeFactor = 1.0;
if (row.QuerySelector("img[src$=\"no_ratio.png\"]") != null)
{
dlVolumeFactor = 0;
upVolumeFactor = 0;
}
else if (hasFreeleech || row.QuerySelector("img[src$=\"free.png\"]") != null)
dlVolumeFactor = 0;
else if (row.QuerySelector("img[src$=\"50.png\"]") != null)
dlVolumeFactor = 0.5;
else if (row.QuerySelector("img[src$=\"25.png\"]") != null)
dlVolumeFactor = 0.75;
else if (row.QuerySelector("img[src$=\"75.png\"]") != null)
dlVolumeFactor = 0.25;
var imdbLink = row.QuerySelector("a[href*=\"www.imdb.com/title/\"]")?.GetAttribute("href");
var imdb = !string.IsNullOrWhiteSpace(imdbLink) ? ParseUtil.GetLongFromString(imdbLink) : null;
var release = new ReleaseInfo
{
Title = title,
Details = details,
Guid = details,
Link = link,
PublishDate = publishDate,
Category = cat,
Description = description,
Poster = poster,
Imdb = imdb,
Size = size,
Grabs = grabs,
Seeders = seeders,
Peers = peers,
DownloadVolumeFactor = dlVolumeFactor,
UploadVolumeFactor = upVolumeFactor,
MinimumRatio = 1,
MinimumSeedTime = 172800 // 48 hours
};
releases.Add(release);
}
}
catch (Exception ex)
{
OnParseError(results.ContentString, ex);
}
return releases;
}
}
}