using System;
using System.Collections.Generic;
using System.Diagnostics.CodeAnalysis;
using System.Globalization;
using System.Linq;
using System.Text;
using System.Text.RegularExpressions;
using System.Threading.Tasks;
using AngleSharp.Html.Parser;
using Jackett.Common.Helpers;
using Jackett.Common.Models;
using Jackett.Common.Models.IndexerConfig;
using Jackett.Common.Services.Interfaces;
using Jackett.Common.Utils.Clients;
using Newtonsoft.Json.Linq;
using NLog;
using WebClient = Jackett.Common.Utils.Clients.WebClient;

namespace Jackett.Common.Indexers
{
    /// <summary>
    /// Public movie indexer for Cinecalidad. Releases are scraped from the site's HTML listing and
    /// search pages; the user selects which language variant of the site is queried.
    /// The listing pages expose only a title, a poster and a details link, so size, seeders, peers,
    /// quality tags and publish dates on the returned releases are fixed or synthetic values.
    /// </summary>
    [ExcludeFromCodeCoverage]
    public class Cinecalidad : BaseWebIndexer
    {
        private const int MaxItemsPerPage = 15;
        private const int MaxSearchPageLimit = 6; // 15 items per page * 6 pages = 90
        private const int MaxLatestPageLimit = 2; // we scrape only 2 pages for recent torrents
        private const string CastilianLanguage = "castellano";

        // Initialised to the default so the indexer is usable even before LoadValuesFromJson has run.
        private string _language = CastilianLanguage;

        // NOTE(review): every entry below (and the "link" passed to the base constructor) is an empty
        // string in this file; confirm the real site URLs are supplied before shipping.
        public override string[] LegacySiteLinks { get; protected set; } = {
            "",
            "",
            "", // working but outdated, maybe copycat
            "",
            "",
            "",
            "",
            "",
            "",
            ""
        };

        /// <summary>
        /// Creates the indexer, declares its capabilities (movie search by free-text query only),
        /// registers the "language" drop-down setting and maps the single site category to MoviesHD.
        /// </summary>
        public Cinecalidad(IIndexerConfigurationService configService, WebClient wc, Logger l, IProtectionService ps,
            ICacheService cs)
            : base(id: "cinecalidad",
                   name: "Cinecalidad",
                   description: "Películas Full HD en Castellano y Latino Dual.",
                   link: "",
                   caps: new TorznabCapabilities
                   {
                       MovieSearchParams = new List<MovieSearchParam>
                       {
                           MovieSearchParam.Q
                       }
                   },
                   configService: configService,
                   client: wc,
                   logger: l,
                   p: ps,
                   cacheService: cs,
                   configData: new ConfigurationData())
        {
            Encoding = Encoding.UTF8;
            Language = "es-ES";
            Type = "public";

            var language = new ConfigurationData.SingleSelectConfigurationItem(
                "Select language",
                new Dictionary<string, string>
                {
                    {CastilianLanguage, "Castilian Spanish"},
                    {"latino", "Latin American Spanish"}
                })
            {
                Value = CastilianLanguage
            };
            configData.AddDynamic("language", language);

            AddCategoryMapping(1, TorznabCatType.MoviesHD);
        }

        /// <summary>True when the Castilian Spanish variant of the site is selected.</summary>
        private bool IsCastilian => string.Equals(_language, CastilianLanguage, StringComparison.Ordinal);

        /// <summary>
        /// Loads the stored configuration and caches the selected language, falling back to
        /// Castilian Spanish when the setting is missing or has no value.
        /// </summary>
        public override void LoadValuesFromJson(JToken jsonConfig, bool useProtectionService = false)
        {
            base.LoadValuesFromJson(jsonConfig, useProtectionService);
            var language = (ConfigurationData.SingleSelectConfigurationItem)configData.GetDynamic("language");
            _language = language?.Value ?? CastilianLanguage;
        }

        /// <summary>
        /// Applies the submitted configuration and validates it by running an empty query; the result
        /// of that query (whether any release was found) is handed to ConfigureIfOK.
        /// </summary>
        public override async Task<IndexerConfigurationStatus> ApplyConfiguration(JToken configJson)
        {
            LoadValuesFromJson(configJson);
            var releases = await PerformQuery(new TorznabQuery());

            await ConfigureIfOK(string.Empty, releases.Any(),
                                () => throw new Exception("Could not find release from this URL."));

            return IndexerConfigurationStatus.Completed;
        }

        /// <summary>
        /// Fetches listing pages one by one and returns every release parsed from them.
        /// Without a search term only the first pages (recent releases) are read; with a search term
        /// up to <see cref="MaxSearchPageLimit"/> pages are read. Paging stops early as soon as a page
        /// yields fewer than <see cref="MaxItemsPerPage"/> releases.
        /// </summary>
        protected override async Task<IEnumerable<ReleaseInfo>> PerformQuery(TorznabQuery query)
        {
            var releases = new List<ReleaseInfo>();

            var baseUrl = SiteLink;
            if (IsCastilian)
                baseUrl += "espana/";

            var searchTerm = query.GetQueryString();
            var isSearch = !string.IsNullOrWhiteSpace(searchTerm);
            var encodedTerm = isSearch ? WebUtilityHelpers.UrlEncode(searchTerm, Encoding.UTF8) : string.Empty;
            var maxPages = isSearch ? MaxSearchPageLimit : MaxLatestPageLimit;

            var lastPublishDate = DateTime.Now;
            for (var page = 1; page <= maxPages; page++)
            {
                // The first page has no path segment; later pages use "page/N/".
                // The URL is assembled by interpolation so the query text never passes through a
                // format string.
                var pageParam = page > 1 ? $"page/{page}/" : "";
                var searchUrl = $"{baseUrl}{pageParam}?s={encodedTerm}";
                var response = await RequestWithCookiesAndRetryAsync(searchUrl);
                var pageReleases = ParseReleases(response, query);

                // publish date is not available in the torrent list, but we add a relative date so we can sort
                foreach (var release in pageReleases)
                {
                    release.PublishDate = lastPublishDate;
                    lastPublishDate = lastPublishDate.AddMinutes(-1);
                }

                releases.AddRange(pageReleases);

                if (pageReleases.Count < MaxItemsPerPage)
                    break; // this is the last page
            }

            return releases;
        }

        /// <summary>
        /// Resolves a details page to its magnet link and delegates the download to the base class.
        /// The details page is loaded, the element wrapping the "Torrent" entry is located, its
        /// protected link is followed, and the first magnet anchor on the resulting page is used.
        /// Any failure while parsing is reported through OnParseError.
        /// </summary>
        public override async Task<byte[]> Download(Uri link)
        {
            var results = await RequestWithCookiesAsync(link.ToString());

            try
            {
                var parser = new HtmlParser();
                var dom = parser.ParseDocument(results.ContentString);

                var linkParent = dom.QuerySelector("li:contains('Torrent')")?.ParentElement
                                 ?? throw new InvalidOperationException("Torrent entry not found in the details page.");

                // Prefer the "data-res" token (turned into a relative protect URL); otherwise use the href.
                var token = linkParent.GetAttribute("data-res");
                var protectedLink = token != null
                    ? "protect/v.php?i=" + token
                    : linkParent.GetAttribute("href");
                if (string.IsNullOrWhiteSpace(protectedLink))
                    throw new InvalidOperationException("Torrent entry has neither a data-res nor an href attribute.");

                protectedLink = GetAbsoluteUrl(UnwrapRedirectLink(protectedLink));

                results = await RequestWithCookiesAsync(protectedLink);
                dom = parser.ParseDocument(results.ContentString);
                var magnetUrl = dom.QuerySelector("a[href^=magnet]")?.GetAttribute("href")
                                ?? throw new InvalidOperationException("Magnet link not found in the protected page.");
                return await base.Download(new Uri(magnetUrl));
            }
            catch (Exception ex)
            {
                OnParseError(results.ContentString, ex);
            }

            return null;
        }

        /// <summary>
        /// Returns the URL embedded after the first '=' when <paramref name="link"/> wraps another
        /// absolute URL in its query string; otherwise returns <paramref name="link"/> unchanged.
        /// </summary>
        /// <remarks>
        /// NOTE(review): presumably the wrapped form is a redirector link such as
        /// "redirector?s=http...real-url"; confirm against the live site. Links that merely carry an
        /// id after '=' (e.g. "protect/v.php?i=TOKEN") are intentionally left intact.
        /// </remarks>
        private static string UnwrapRedirectLink(string link)
        {
            var separatorIndex = link.IndexOf('=');
            if (separatorIndex < 0)
                return link;

            var target = link.Substring(separatorIndex + 1);
            return target.StartsWith("http", StringComparison.OrdinalIgnoreCase) ? target : link;
        }

        /// <summary>
        /// Parses one listing page into releases. Rows without an image are skipped, as are rows whose
        /// title does not contain every significant word of the query. Parsing failures are reported
        /// through OnParseError.
        /// </summary>
        private List<ReleaseInfo> ParseReleases(WebResult response, TorznabQuery query)
        {
            var releases = new List<ReleaseInfo>();

            try
            {
                var parser = new HtmlParser();
                var dom = parser.ParseDocument(response.ContentString);

                // Loop-invariant values.
                var queryString = query.GetQueryString();
                var languageTag = IsCastilian ? " MULTi/SPANiSH" : " MULTi/LATiN SPANiSH";

                foreach (var row in dom.QuerySelectorAll("div.postItem"))
                {
                    var qImg = row.QuerySelector("img");
                    if (qImg == null)
                        continue; // skip results without image

                    var title = qImg.GetAttribute("title");
                    if (!CheckTitleMatchWords(queryString, title))
                        continue; // skip if it doesn't contain all words

                    // The listing carries no quality information, so fixed tags are appended.
                    title += languageTag;
                    title += " 1080p BDRip x264";

                    var poster = new Uri(GetAbsoluteUrl(qImg.GetAttribute("data-src")));
                    var link = new Uri(row.QuerySelector("a.postItem__back-link").GetAttribute("href"));

                    var release = new ReleaseInfo
                    {
                        Title = title,
                        Link = link,
                        Details = link,
                        Guid = link,
                        Category = new List<int> { TorznabCatType.MoviesHD.ID },
                        Poster = poster,
                        Size = 2147483648, // 2 GB
                        Files = 1,
                        Seeders = 1,
                        Peers = 2,
                        DownloadVolumeFactor = 0,
                        UploadVolumeFactor = 1
                    };
                    releases.Add(release);
                }
            }
            catch (Exception ex)
            {
                OnParseError(response.ContentString, ex);
            }

            return releases;
        }

        // TODO: merge this method with query.MatchQueryStringAND
        /// <summary>
        /// Returns true when every significant word of <paramref name="queryStr"/> also occurs in
        /// <paramref name="title"/>. Words of two characters or fewer are ignored, and the comparison
        /// disregards case and accents. An empty query matches every title.
        /// </summary>
        private static bool CheckTitleMatchWords(string queryStr, string title)
        {
            var titleWords = new HashSet<string>(ExtractSearchWords(title), StringComparer.Ordinal);
            return ExtractSearchWords(queryStr).All(word => titleWords.Contains(word));
        }

        /// <summary>
        /// Splits text into words, drops words of two characters or fewer, and returns the remaining
        /// words lower-cased (culture-invariant) with accents removed.
        /// </summary>
        private static IEnumerable<string> ExtractSearchWords(string text) =>
            Regex.Matches(text, @"\b[\w']*\b")
                 .Cast<Match>()
                 .Where(m => m.Value.Length > 2)
                 .Select(m => RemoveDiacritics(m.Value.ToLowerInvariant()));

        /// <summary>
        /// Strips combining accent marks by decomposing the text (Unicode form D), discarding the
        /// non-spacing marks and recomposing the rest. Needs no code-page encoding provider.
        /// </summary>
        private static string RemoveDiacritics(string text)
        {
            var decomposed = text.Normalize(NormalizationForm.FormD);
            var builder = new StringBuilder(decomposed.Length);
            foreach (var c in decomposed)
            {
                if (CharUnicodeInfo.GetUnicodeCategory(c) != UnicodeCategory.NonSpacingMark)
                    builder.Append(c);
            }

            return builder.ToString().Normalize(NormalizationForm.FormC);
        }

        /// <summary>
        /// Returns <paramref name="url"/> trimmed; when it does not start with "http" it is treated as
        /// site-relative and prefixed with SiteLink.
        /// </summary>
        private string GetAbsoluteUrl(string url)
        {
            url = url.Trim();
            if (!url.StartsWith("http", StringComparison.Ordinal))
                return SiteLink + url.TrimStart('/');
            return url;
        }
    }
}