mirror of
https://github.com/C9Glax/tranga.git
synced 2025-01-12 11:27:32 +01:00
Merge branch 'refs/heads/cuttingedge-merge-ServerV2' into cuttingedge
This commit is contained in:
commit
811a183af2
@ -85,6 +85,7 @@ That is why I wanted to create my own project, in a language I understand, and t
|
|||||||
- Newtonsoft.JSON
|
- Newtonsoft.JSON
|
||||||
- [PuppeteerSharp](https://www.puppeteersharp.com/)
|
- [PuppeteerSharp](https://www.puppeteersharp.com/)
|
||||||
- [Html Agility Pack (HAP)](https://html-agility-pack.net/)
|
- [Html Agility Pack (HAP)](https://html-agility-pack.net/)
|
||||||
|
- [Soenneker.Utils.String.NeedlemanWunsch](https://github.com/soenneker/soenneker.utils.string.needlemanwunsch)
|
||||||
- 💙 Blåhaj 🦈
|
- 💙 Blåhaj 🦈
|
||||||
|
|
||||||
<p align="right">(<a href="#readme-top">back to top</a>)</p>
|
<p align="right">(<a href="#readme-top">back to top</a>)</p>
|
||||||
|
@ -4,6 +4,7 @@ using System.Text.RegularExpressions;
|
|||||||
using System.Xml.Linq;
|
using System.Xml.Linq;
|
||||||
using HtmlAgilityPack;
|
using HtmlAgilityPack;
|
||||||
using Newtonsoft.Json;
|
using Newtonsoft.Json;
|
||||||
|
using Soenneker.Utils.String.NeedlemanWunsch;
|
||||||
using Tranga.Jobs;
|
using Tranga.Jobs;
|
||||||
|
|
||||||
namespace Tranga.MangaConnectors;
|
namespace Tranga.MangaConnectors;
|
||||||
@ -41,14 +42,6 @@ public class Mangasee : MangaConnector
|
|||||||
SearchResult[] filteredResults = FilteredResults(publicationTitle, searchResults);
|
SearchResult[] filteredResults = FilteredResults(publicationTitle, searchResults);
|
||||||
Log($"Total available manga: {searchResults.Length} Filtered down to: {filteredResults.Length}");
|
Log($"Total available manga: {searchResults.Length} Filtered down to: {filteredResults.Length}");
|
||||||
|
|
||||||
/*
|
|
||||||
Dictionary<SearchResult, int> levenshteinRelation = filteredResults.ToDictionary(result => result,
|
|
||||||
result =>
|
|
||||||
{
|
|
||||||
Log($"Levenshtein {result.s}");
|
|
||||||
return LevenshteinDistance(publicationTitle.Replace(" ", "").ToLower(), result.s.Replace(" ", "").ToLower());
|
|
||||||
});
|
|
||||||
Log($"After levenshtein: {levenshteinRelation.Count}");*/
|
|
||||||
|
|
||||||
string[] urls = filteredResults.Select(result => $"https://mangasee123.com/manga/{result.i}").ToArray();
|
string[] urls = filteredResults.Select(result => $"https://mangasee123.com/manga/{result.i}").ToArray();
|
||||||
List<Manga> searchResultManga = new();
|
List<Manga> searchResultManga = new();
|
||||||
@ -70,42 +63,19 @@ public class Mangasee : MangaConnector
|
|||||||
|
|
||||||
private SearchResult[] FilteredResults(string publicationTitle, SearchResult[] unfilteredSearchResults)
|
private SearchResult[] FilteredResults(string publicationTitle, SearchResult[] unfilteredSearchResults)
|
||||||
{
|
{
|
||||||
string[] bannedStrings = {"a", "the", "of", "as", "to", "no", "for", "on", "with", "be", "and", "in", "wa", "at"};
|
Dictionary<SearchResult, int> similarity = new();
|
||||||
string[] cleanSplitPublicationTitle = publicationTitle.Split(' ')
|
foreach (SearchResult sr in unfilteredSearchResults)
|
||||||
.Where(part => part.Length > 0 && !bannedStrings.Contains(part.ToLower())).ToArray();
|
|
||||||
|
|
||||||
return unfilteredSearchResults.Where(usr =>
|
|
||||||
{
|
{
|
||||||
string cleanSearchResultString = string.Join(' ', usr.s.Split(' ').Where(part => part.Length > 0 && !bannedStrings.Contains(part.ToLower())));
|
List<int> scores = new();
|
||||||
foreach(string splitPublicationTitlePart in cleanSplitPublicationTitle)
|
foreach (string se in sr.a)
|
||||||
if (cleanSearchResultString.Contains(splitPublicationTitlePart, StringComparison.InvariantCultureIgnoreCase) ||
|
scores.Add(NeedlemanWunschStringUtil.CalculateSimilarity(se.ToLower(), publicationTitle.ToLower()));
|
||||||
cleanSearchResultString.Contains(splitPublicationTitlePart, StringComparison.InvariantCultureIgnoreCase))
|
scores.Add(NeedlemanWunschStringUtil.CalculateSimilarity(sr.s.ToLower(), publicationTitle.ToLower()));
|
||||||
return true;
|
similarity.Add(sr, scores.Sum() / scores.Count);
|
||||||
return false;
|
|
||||||
}).ToArray();
|
|
||||||
}
|
|
||||||
|
|
||||||
private int LevenshteinDistance(string a, string b)
|
|
||||||
{
|
|
||||||
if (b.Length == 0)
|
|
||||||
return a.Length;
|
|
||||||
if (a.Length == 0)
|
|
||||||
return b.Length;
|
|
||||||
if (a[0] == b[0])
|
|
||||||
return LevenshteinDistance(a[1..], b[1..]);
|
|
||||||
|
|
||||||
int case1 = LevenshteinDistance(a, b[1..]);
|
|
||||||
int case2 = LevenshteinDistance(a[1..], b[1..]);
|
|
||||||
int case3 = LevenshteinDistance(a[1..], b);
|
|
||||||
|
|
||||||
if (case1 < case2)
|
|
||||||
{
|
|
||||||
return 1 + (case1 < case3 ? case1 : case3);
|
|
||||||
}
|
|
||||||
else
|
|
||||||
{
|
|
||||||
return 1 + (case2 < case3 ? case2 : case3);
|
|
||||||
}
|
}
|
||||||
|
|
||||||
|
SearchResult[] similarity90 = similarity.Where(s => s.Value < 10).Select(s => s.Key).ToArray();
|
||||||
|
|
||||||
|
return similarity90;
|
||||||
}
|
}
|
||||||
|
|
||||||
public override Manga? GetMangaFromId(string publicationId)
|
public override Manga? GetMangaFromId(string publicationId)
|
||||||
|
@ -11,6 +11,7 @@
|
|||||||
<PackageReference Include="HtmlAgilityPack" Version="1.11.46" />
|
<PackageReference Include="HtmlAgilityPack" Version="1.11.46" />
|
||||||
<PackageReference Include="Newtonsoft.Json" Version="13.0.3" />
|
<PackageReference Include="Newtonsoft.Json" Version="13.0.3" />
|
||||||
<PackageReference Include="PuppeteerSharp" Version="10.0.0" />
|
<PackageReference Include="PuppeteerSharp" Version="10.0.0" />
|
||||||
|
<PackageReference Include="Soenneker.Utils.String.NeedlemanWunsch" Version="2.1.301" />
|
||||||
</ItemGroup>
|
</ItemGroup>
|
||||||
|
|
||||||
<ItemGroup>
|
<ItemGroup>
|
||||||
|
Loading…
x
Reference in New Issue
Block a user