using System.Net; using System.Text.RegularExpressions; using HtmlAgilityPack; using Logging; using Tranga.TrangaTasks; namespace Tranga.Connectors; public class Manganato : Connector { public override string name { get; } public Manganato(string downloadLocation, string imageCachePath, Logger? logger) : base(downloadLocation, imageCachePath, logger) { this.name = "Manganato"; this.downloadClient = new DownloadClient(new Dictionary() { {(byte)1, 60} }, logger); } public override Publication[] GetPublications(string publicationTitle = "") { logger?.WriteLine(this.GetType().ToString(), $"Getting Publications (title={publicationTitle})"); string sanitizedTitle = string.Concat(Regex.Matches(publicationTitle, "[A-z]* *")).ToLower().Replace(' ', '_'); string requestUrl = $"https://manganato.com/search/story/{sanitizedTitle}"; DownloadClient.RequestResult requestResult = downloadClient.MakeRequest(requestUrl, (byte)1); if (requestResult.statusCode != HttpStatusCode.OK) return Array.Empty(); return ParsePublicationsFromHtml(requestResult.result); } private Publication[] ParsePublicationsFromHtml(Stream html) { StreamReader reader = new (html); string htmlString = reader.ReadToEnd(); HtmlDocument document = new (); document.LoadHtml(htmlString); IEnumerable searchResults = document.DocumentNode.Descendants("div").Where(n => n.HasClass("search-story-item")); List urls = new(); foreach (HtmlNode mangaResult in searchResults) { urls.Add(mangaResult.Descendants("a").First(n => n.HasClass("item-title")).GetAttributes() .First(a => a.Name == "href").Value); } HashSet ret = new(); foreach (string url in urls) { DownloadClient.RequestResult requestResult = downloadClient.MakeRequest(url, (byte)1); if (requestResult.statusCode != HttpStatusCode.OK) return Array.Empty(); ret.Add(ParseSinglePublicationFromHtml(requestResult.result, url.Split('/')[^1])); } return ret.ToArray(); } private Publication ParseSinglePublicationFromHtml(Stream html, string publicationId) { StreamReader reader = new (html); string htmlString = reader.ReadToEnd(); HtmlDocument document = new (); document.LoadHtml(htmlString); string status = ""; Dictionary altTitles = new(); Dictionary? links = null; HashSet tags = new(); string? author = null, originalLanguage = null; int? year = DateTime.Now.Year; HtmlNode infoNode = document.DocumentNode.Descendants("div").First(d => d.HasClass("story-info-right")); string sortName = infoNode.Descendants("h1").First().InnerText; HtmlNode infoTable = infoNode.Descendants().First(d => d.Name == "table"); foreach (HtmlNode row in infoTable.Descendants("tr")) { string key = row.SelectNodes("td").First().InnerText.ToLower(); string value = row.SelectNodes("td").Last().InnerText; string keySanitized = string.Concat(Regex.Matches(key, "[a-z]")); switch (keySanitized) { case "alternative": string[] alts = value.Split(" ; "); for(int i = 0; i < alts.Length; i++) altTitles.Add(i.ToString(), alts[i]); break; case "authors": author = value; break; case "status": status = value; break; case "genres": string[] genres = value.Split(" - "); tags = genres.ToHashSet(); break; default: break; } } string posterUrl = document.DocumentNode.Descendants("span").First(s => s.HasClass("info-image")).Descendants("img").First() .GetAttributes().First(a => a.Name == "src").Value; string coverFileNameInCache = SaveCoverImageToCache(posterUrl, 1); string description = document.DocumentNode.Descendants("div").First(d => d.HasClass("panel-story-info-description")) .InnerText.Replace("Description :", ""); while (description.StartsWith('\n')) description = description.Substring(1); string yearString = document.DocumentNode.Descendants("li").Last(li => li.HasClass("a-h")).Descendants("span") .First(s => s.HasClass("chapter-time")).InnerText; year = Convert.ToInt32(yearString.Split(',')[^1]) + 2000; return new Publication(sortName, author, description, altTitles, tags.ToArray(), posterUrl, coverFileNameInCache, links, year, originalLanguage, status, publicationId); } public override Chapter[] GetChapters(Publication publication, string language = "") { logger?.WriteLine(this.GetType().ToString(), $"Getting Chapters for {publication.sortName} {publication.internalId} (language={language})"); string requestUrl = $"https://chapmanganato.com/{publication.publicationId}"; DownloadClient.RequestResult requestResult = downloadClient.MakeRequest(requestUrl, (byte)1); if (requestResult.statusCode != HttpStatusCode.OK) return Array.Empty(); return ParseChaptersFromHtml(requestResult.result); } private Chapter[] ParseChaptersFromHtml(Stream html) { StreamReader reader = new (html); string htmlString = reader.ReadToEnd(); HtmlDocument document = new (); document.LoadHtml(htmlString); List ret = new(); HtmlNode chapterList = document.DocumentNode.Descendants("ul").First(l => l.HasClass("row-content-chapter")); foreach (HtmlNode chapterInfo in chapterList.Descendants("li")) { string fullString = chapterInfo.Descendants("a").First(d => d.HasClass("chapter-name")).InnerText; string? volumeNumber = fullString.Contains("Vol.") ? fullString.Replace("Vol.", "").Split(' ')[0] : null; string? chapterNumber = fullString.Split(':')[0].Split("Chapter ")[1].Replace('-','.'); string chapterName = string.Concat(fullString.Split(':')[1..]); string url = chapterInfo.Descendants("a").First(d => d.HasClass("chapter-name")) .GetAttributeValue("href", ""); ret.Add(new Chapter(chapterName, volumeNumber, chapterNumber, url)); } ret.Reverse(); return ret.ToArray(); } public override void DownloadChapter(Publication publication, Chapter chapter, DownloadChapterTask parentTask) { logger?.WriteLine(this.GetType().ToString(), $"Downloading Chapter-Info {publication.sortName} {publication.internalId} {chapter.volumeNumber}-{chapter.chapterNumber}"); string requestUrl = chapter.url; DownloadClient.RequestResult requestResult = downloadClient.MakeRequest(requestUrl, (byte)1); if (requestResult.statusCode != HttpStatusCode.OK) return; string[] imageUrls = ParseImageUrlsFromHtml(requestResult.result); string comicInfoPath = Path.GetTempFileName(); File.WriteAllText(comicInfoPath, GetComicInfoXmlString(publication, chapter, logger)); DownloadChapterImages(imageUrls, GetArchiveFilePath(publication, chapter), (byte)1, parentTask, comicInfoPath, "https://chapmanganato.com/"); } private string[] ParseImageUrlsFromHtml(Stream html) { StreamReader reader = new (html); string htmlString = reader.ReadToEnd(); HtmlDocument document = new (); document.LoadHtml(htmlString); List ret = new(); HtmlNode imageContainer = document.DocumentNode.Descendants("div").First(i => i.HasClass("container-chapter-reader")); foreach(HtmlNode imageNode in imageContainer.Descendants("img")) ret.Add(imageNode.GetAttributeValue("src", "")); return ret.ToArray(); } }