Jackett/src/Jackett.Common/Indexers/BakaBT.cs

280 lines
12 KiB
C#
Raw Normal View History

2020-02-09 02:35:16 +00:00
using System;
2016-09-04 08:25:33 +00:00
using System.Collections.Generic;
using System.Diagnostics.CodeAnalysis;
2016-09-04 08:25:33 +00:00
using System.Globalization;
using System.Linq;
using System.Net;
2016-09-04 08:25:33 +00:00
using System.Text;
using System.Text.RegularExpressions;
2016-09-04 08:25:33 +00:00
using System.Threading.Tasks;
using AngleSharp.Dom;
using AngleSharp.Html.Parser;
using Jackett.Common.Models;
using Jackett.Common.Models.IndexerConfig.Bespoke;
using Jackett.Common.Services.Interfaces;
using Jackett.Common.Utils.Clients;
using Newtonsoft.Json.Linq;
using NLog;
2016-09-04 08:25:33 +00:00
namespace Jackett.Common.Indexers
2016-09-04 08:25:33 +00:00
{
[ExcludeFromCodeCoverage]
public class BakaBT : BaseWebIndexer
2016-09-04 08:25:33 +00:00
{
private string SearchUrl => SiteLink + "browse.php?only=0&hentai=1&incomplete=1&lossless=1&hd=1&multiaudio=1&bonus=1&reorder=1&q=";
private string LoginUrl => SiteLink + "login.php";
private readonly string LogoutStr = "<a href=\"logout.php\">Logout</a>";
private bool AddRomajiTitle => configData.AddRomajiTitle.Value;
private bool AppendSeason => configData.AppendSeason.Value;
2016-09-04 08:25:33 +00:00
private readonly List<int> defaultCategories = new List<int> { TorznabCatType.TVAnime.ID };
private new ConfigurationDataBakaBT configData
2016-09-04 08:25:33 +00:00
{
get => (ConfigurationDataBakaBT)base.configData;
set => base.configData = value;
2016-09-04 08:25:33 +00:00
}
public BakaBT(IIndexerConfigurationService configService, Utils.Clients.WebClient wc, Logger l, IProtectionService ps)
: base(id: "bakabt",
name: "BakaBT",
description: "Anime Comunity",
link: "https://bakabt.me/",
caps: new TorznabCapabilities
{
// TODO: add music and book search
TvSearchParams = new List<TvSearchParam>
{
TvSearchParam.Q, TvSearchParam.Season, TvSearchParam.Ep
}
},
configService: configService,
client: wc,
logger: l,
p: ps,
configData: new ConfigurationDataBakaBT("To prevent 0-results-error, Enable the " +
"Show-Adult-Content option in your BakaBT account Settings."))
2016-09-04 08:25:33 +00:00
{
2016-12-09 17:20:58 +00:00
Encoding = Encoding.UTF8;
Language = "en-us";
Type = "private";
AddCategoryMapping(1, TorznabCatType.TVAnime, "Anime Series");
AddCategoryMapping(2, TorznabCatType.TVAnime, "OVA");
AddCategoryMapping(3, TorznabCatType.AudioOther, "Soundtrack");
AddCategoryMapping(4, TorznabCatType.BooksComics, "Manga");
AddCategoryMapping(5, TorznabCatType.TVAnime, "Anime Movie");
AddCategoryMapping(6, TorznabCatType.TVOTHER, "Live Action");
AddCategoryMapping(7, TorznabCatType.BooksOther, "Artbook");
AddCategoryMapping(8, TorznabCatType.AudioVideo, "Music Video");
AddCategoryMapping(9, TorznabCatType.BooksEbook, "Light Novel");
2016-09-04 08:25:33 +00:00
}
public override async Task<IndexerConfigurationStatus> ApplyConfiguration(JToken configJson)
2016-09-04 08:25:33 +00:00
{
LoadValuesFromJson(configJson);
await DoLogin();
return IndexerConfigurationStatus.RequiresTesting;
}
2016-09-04 08:25:33 +00:00
private async Task DoLogin()
{
var loginForm = await webclient.GetResultAsync(new Utils.Clients.WebRequest()
{
Url = LoginUrl,
Type = RequestType.GET
});
2016-09-04 08:25:33 +00:00
var pairs = new Dictionary<string, string> {
{ "username", configData.Username.Value },
{ "password", configData.Password.Value },
{ "returnto", "/index.php" }
};
var parser = new HtmlParser();
var dom = parser.ParseDocument(loginForm.ContentString);
var loginKey = dom.QuerySelector("input[name=\"loginKey\"]");
if (loginKey != null)
pairs["loginKey"] = loginKey.GetAttribute("value");
2016-09-04 08:25:33 +00:00
var response = await RequestLoginAndFollowRedirect(LoginUrl, pairs, loginForm.Cookies, true, null, SiteLink);
var responseContent = response.ContentString;
await ConfigureIfOK(response.Cookies, responseContent.Contains(LogoutStr), () =>
{
var parser = new HtmlParser();
var dom = parser.ParseDocument(responseContent);
var messageEl = dom.QuerySelectorAll(".error").First();
var errorMessage = messageEl.Text().Trim();
throw new ExceptionWithConfigData(errorMessage, configData);
});
2016-09-04 08:25:33 +00:00
}
protected override async Task<IEnumerable<ReleaseInfo>> PerformQuery(TorznabQuery query)
2016-09-04 08:25:33 +00:00
{
var searchString = query.SanitizedSearchTerm;
var match = Regex.Match(query.SanitizedSearchTerm, @".*(?=\s(?:[Ee]\d+|\d+)$)");
if (match.Success)
searchString = match.Value;
2016-09-04 08:25:33 +00:00
var releases = new List<ReleaseInfo>();
var episodeSearchUrl = SearchUrl + WebUtility.UrlEncode(searchString);
var response = await RequestWithCookiesAndRetryAsync(episodeSearchUrl);
if (!response.ContentString.Contains(LogoutStr))
{
//Cookie appears to expire after a period of time or logging in to the site via browser
await DoLogin();
response = await RequestWithCookiesAndRetryAsync(episodeSearchUrl);
}
2016-09-04 08:25:33 +00:00
try
{
var parser = new HtmlParser();
var dom = parser.ParseDocument(response.ContentString);
var rows = dom.QuerySelectorAll(".torrents tr.torrent, .torrents tr.torrent_alt");
ICollection<int> currentCategories = new List<int> { TorznabCatType.TVAnime.ID };
2016-09-04 08:25:33 +00:00
foreach (var row in rows)
{
var qTitleLink = row.QuerySelector("a.title, a.alt_title");
if (qTitleLink == null)
continue;
var title = qTitleLink.TextContent.Trim();
2016-09-04 08:25:33 +00:00
// Insert before the release info
var taidx = title.IndexOf('(');
var tbidx = title.IndexOf('[');
if (taidx == -1)
taidx = title.Length;
if (tbidx == -1)
tbidx = title.Length;
var titleSplit = Math.Min(taidx, tbidx);
var titleSeries = title.Substring(0, titleSplit);
var releaseInfo = title.Substring(titleSplit);
currentCategories = GetNextCategory(row, currentCategories);
var stringSeparator = new string[] { " | " };
var titles = titleSeries.Split(stringSeparator, StringSplitOptions.RemoveEmptyEntries);
if (titles.Count() > 1 && !AddRomajiTitle)
titles = titles.Skip(1).ToArray();
foreach (var name in titles)
2016-09-04 08:25:33 +00:00
{
var release = new ReleaseInfo();
release.Title = (name + releaseInfo).Trim();
// Ensure the season is defined as this tracker only deals with full seasons
if (release.Title.IndexOf("Season") == -1 && AppendSeason)
2016-09-04 08:25:33 +00:00
{
// Insert before the release info
var aidx = release.Title.IndexOf('(');
var bidx = release.Title.IndexOf('[');
if (aidx == -1)
aidx = release.Title.Length;
if (bidx == -1)
bidx = release.Title.Length;
var insertPoint = Math.Min(aidx, bidx);
release.Title = release.Title.Substring(0, insertPoint) + " Season 1 " + release.Title.Substring(insertPoint);
2016-09-04 08:25:33 +00:00
}
release.Category = currentCategories;
release.Description = row.QuerySelector("span.tags")?.TextContent;
release.Guid = new Uri(SiteLink + qTitleLink.GetAttribute("href"));
2016-09-04 08:25:33 +00:00
release.Comments = release.Guid;
release.Link = new Uri(SiteLink + row.QuerySelector(".peers a").GetAttribute("href"));
2018-12-28 17:19:27 +00:00
var grabs = row.QuerySelectorAll(".peers")[0].FirstChild.NodeValue.TrimEnd().TrimEnd('/').TrimEnd();
2018-12-28 17:19:27 +00:00
grabs = grabs.Replace("k", "000");
release.Grabs = int.Parse(grabs);
release.Seeders = int.Parse(row.QuerySelectorAll(".peers a")[0].TextContent);
release.Peers = release.Seeders + int.Parse(row.QuerySelectorAll(".peers a")[1].TextContent);
2016-09-04 08:25:33 +00:00
release.MinimumRatio = 1;
release.MinimumSeedTime = 172800; // 48 hours
2016-09-04 08:25:33 +00:00
var size = row.QuerySelector(".size").TextContent;
2016-09-04 08:25:33 +00:00
release.Size = ReleaseInfo.GetBytes(size);
//22 Jul 15
var dateStr = row.QuerySelector(".added").TextContent.Replace("'", string.Empty);
2016-09-04 08:25:33 +00:00
if (dateStr.Split(' ')[0].Length == 1)
dateStr = "0" + dateStr;
if (string.Equals(dateStr, "yesterday", StringComparison.InvariantCultureIgnoreCase))
release.PublishDate = DateTime.Now.AddDays(-1);
else if (string.Equals(dateStr, "today", StringComparison.InvariantCultureIgnoreCase))
release.PublishDate = DateTime.Now;
else
release.PublishDate = DateTime.ParseExact(dateStr, "dd MMM yy", CultureInfo.InvariantCulture);
release.DownloadVolumeFactor = row.QuerySelector("span.freeleech") != null ? 0 : 1;
2018-12-28 17:09:59 +00:00
release.UploadVolumeFactor = 1;
2016-09-04 08:25:33 +00:00
releases.Add(release);
}
2016-09-04 08:25:33 +00:00
}
}
catch (Exception ex)
{
OnParseError(response.ContentString, ex);
2016-09-04 08:25:33 +00:00
}
return releases;
}
private ICollection<int> GetNextCategory(IElement row, ICollection<int> currentCategories)
{
string nextCategoryName = GetCategoryName(row);
if (nextCategoryName != null)
{
currentCategories = MapTrackerCatDescToNewznab(nextCategoryName);
if (currentCategories.Count == 0)
return defaultCategories;
}
return currentCategories;
}
private string GetCategoryName(IElement row)
{
var categoryElement = row.QuerySelector("td.category span");
if (categoryElement == null)
{
return null;
}
var categoryName = categoryElement.GetAttribute("title");
if (!string.IsNullOrWhiteSpace(categoryName))
{
return categoryName;
}
return null;
}
2016-09-04 08:25:33 +00:00
public override async Task<byte[]> Download(Uri link)
{
var downloadPage = await RequestWithCookiesAsync(link.ToString());
var parser = new HtmlParser();
var dom = parser.ParseDocument(downloadPage.ContentString);
var downloadLink = dom.QuerySelectorAll(".download_link").First().GetAttribute("href");
2016-09-04 08:25:33 +00:00
if (string.IsNullOrWhiteSpace(downloadLink))
throw new Exception("Unable to find download link.");
var response = await RequestWithCookiesAsync(SiteLink + downloadLink);
return response.ContentBytes;
2016-09-04 08:25:33 +00:00
}
}
2020-02-09 02:35:16 +00:00
}