mirror of
				https://github.com/Kareadita/Kavita.git
				synced 2025-10-26 16:22:28 -04:00 
			
		
		
		
	Co-authored-by: Copilot Autofix powered by AI <62310815+github-advanced-security[bot]@users.noreply.github.com>
		
			
				
	
	
		
			373 lines
		
	
	
		
			14 KiB
		
	
	
	
		
			C#
		
	
	
	
	
	
			
		
		
	
	
			373 lines
		
	
	
		
			14 KiB
		
	
	
	
		
			C#
		
	
	
	
	
	
| using System;
 | |
| using System.Collections.Generic;
 | |
| using System.IO;
 | |
| using System.Linq;
 | |
| using System.Threading.Tasks;
 | |
| using API.Constants;
 | |
| using API.Data.Repositories;
 | |
| using API.Entities;
 | |
| using API.Entities.Enums;
 | |
| using API.Extensions;
 | |
| using EasyCaching.Core;
 | |
| using Flurl;
 | |
| using Flurl.Http;
 | |
| using HtmlAgilityPack;
 | |
| using Kavita.Common;
 | |
| using Microsoft.Extensions.Hosting;
 | |
| using Microsoft.Extensions.Logging;
 | |
| using NetVips;
 | |
| 
 | |
| namespace API.Services.Tasks.Metadata;
 | |
| 
 | |
| public interface ICoverDbService
 | |
| {
 | |
|     Task<string> DownloadFaviconAsync(string url, EncodeFormat encodeFormat);
 | |
|     Task<string> DownloadPublisherImageAsync(string publisherName, EncodeFormat encodeFormat);
 | |
|     Task<string?> DownloadPersonImageAsync(Person person, EncodeFormat encodeFormat);
 | |
| }
 | |
| 
 | |
| 
 | |
| public class CoverDbService : ICoverDbService
 | |
| {
 | |
|     private readonly ILogger<CoverDbService> _logger;
 | |
|     private readonly IDirectoryService _directoryService;
 | |
|     private readonly IEasyCachingProviderFactory _cacheFactory;
 | |
|     private readonly IHostEnvironment _env;
 | |
| 
 | |
|     private const string NewHost = "https://www.kavitareader.com/CoversDB/";
 | |
| 
 | |
|     private static readonly string[] ValidIconRelations = {
 | |
|         "icon",
 | |
|         "apple-touch-icon",
 | |
|         "apple-touch-icon-precomposed",
 | |
|         "apple-touch-icon icon-precomposed" // ComicVine has it combined
 | |
|     };
 | |
| 
 | |
|     /// <summary>
 | |
|     /// A mapping of urls that need to get the icon from another url, due to strangeness (like app.plex.tv loading a black icon)
 | |
|     /// </summary>
 | |
|     private static readonly Dictionary<string, string> FaviconUrlMapper = new()
 | |
|     {
 | |
|         ["https://app.plex.tv"] = "https://plex.tv"
 | |
|     };
 | |
| 
 | |
|     public CoverDbService(ILogger<CoverDbService> logger, IDirectoryService directoryService,
 | |
|         IEasyCachingProviderFactory cacheFactory, IHostEnvironment env)
 | |
|     {
 | |
|         _logger = logger;
 | |
|         _directoryService = directoryService;
 | |
|         _cacheFactory = cacheFactory;
 | |
|         _env = env;
 | |
|     }
 | |
| 
 | |
|     public async Task<string> DownloadFaviconAsync(string url, EncodeFormat encodeFormat)
 | |
|     {
 | |
|         // Parse the URL to get the domain (including subdomain)
 | |
|         var uri = new Uri(url);
 | |
|         var domain = uri.Host.Replace(Environment.NewLine, string.Empty);
 | |
|         var baseUrl = uri.Scheme + "://" + uri.Host;
 | |
| 
 | |
| 
 | |
|         var provider = _cacheFactory.GetCachingProvider(EasyCacheProfiles.Favicon);
 | |
|         var res = await provider.GetAsync<string>(baseUrl);
 | |
|         if (res.HasValue)
 | |
|         {
 | |
|             var sanitizedBaseUrl = baseUrl.Sanitize();
 | |
|             _logger.LogInformation("Kavita has already tried to fetch from {BaseUrl} and failed. Skipping duplicate check", sanitizedBaseUrl);
 | |
|             throw new KavitaException($"Kavita has already tried to fetch from {sanitizedBaseUrl} and failed. Skipping duplicate check");
 | |
|         }
 | |
| 
 | |
|         await provider.SetAsync(baseUrl, string.Empty, TimeSpan.FromDays(10));
 | |
|         if (FaviconUrlMapper.TryGetValue(baseUrl, out var value))
 | |
|         {
 | |
|             url = value;
 | |
|         }
 | |
| 
 | |
|         var correctSizeLink = string.Empty;
 | |
| 
 | |
|         try
 | |
|         {
 | |
|             var htmlContent = url.GetStringAsync().Result;
 | |
|             var htmlDocument = new HtmlDocument();
 | |
|             htmlDocument.LoadHtml(htmlContent);
 | |
| 
 | |
|             var pngLinks = htmlDocument.DocumentNode.Descendants("link")
 | |
|                 .Where(link => ValidIconRelations.Contains(link.GetAttributeValue("rel", string.Empty)))
 | |
|                 .Select(link => link.GetAttributeValue("href", string.Empty))
 | |
|                 .Where(href => href.Split("?")[0].EndsWith(".png", StringComparison.InvariantCultureIgnoreCase))
 | |
|                 .ToList();
 | |
| 
 | |
|             correctSizeLink = (pngLinks?.Find(pngLink => pngLink.Contains("32")) ?? pngLinks?.FirstOrDefault());
 | |
|         }
 | |
|         catch (Exception ex)
 | |
|         {
 | |
|             _logger.LogError(ex, "Error downloading favicon.png for {Domain}, will try fallback methods", domain);
 | |
|         }
 | |
| 
 | |
|         try
 | |
|         {
 | |
|             if (string.IsNullOrEmpty(correctSizeLink))
 | |
|             {
 | |
|                 correctSizeLink = await FallbackToKavitaReaderFavicon(baseUrl);
 | |
|             }
 | |
|             if (string.IsNullOrEmpty(correctSizeLink))
 | |
|             {
 | |
|                 throw new KavitaException($"Could not grab favicon from {baseUrl}");
 | |
|             }
 | |
| 
 | |
|             var finalUrl = correctSizeLink;
 | |
| 
 | |
|             // If starts with //, it's coming usually from an offsite cdn
 | |
|             if (correctSizeLink.StartsWith("//"))
 | |
|             {
 | |
|                 finalUrl = "https:" + correctSizeLink;
 | |
|             }
 | |
|             else if (!correctSizeLink.StartsWith(uri.Scheme))
 | |
|             {
 | |
|                 finalUrl = Url.Combine(baseUrl, correctSizeLink);
 | |
|             }
 | |
| 
 | |
|             _logger.LogTrace("Fetching favicon from {Url}", finalUrl);
 | |
|             // Download the favicon.ico file using Flurl
 | |
|             var faviconStream = await finalUrl
 | |
|                 .AllowHttpStatus("2xx,304")
 | |
|                 .GetStreamAsync();
 | |
| 
 | |
|             // Create the destination file path
 | |
|             using var image = Image.PngloadStream(faviconStream);
 | |
|             var filename = ImageService.GetWebLinkFormat(baseUrl, encodeFormat);
 | |
|             switch (encodeFormat)
 | |
|             {
 | |
|                 case EncodeFormat.PNG:
 | |
|                     image.Pngsave(Path.Combine(_directoryService.FaviconDirectory, filename));
 | |
|                     break;
 | |
|                 case EncodeFormat.WEBP:
 | |
|                     image.Webpsave(Path.Combine(_directoryService.FaviconDirectory, filename));
 | |
|                     break;
 | |
|                 case EncodeFormat.AVIF:
 | |
|                     image.Heifsave(Path.Combine(_directoryService.FaviconDirectory, filename));
 | |
|                     break;
 | |
|                 default:
 | |
|                     throw new ArgumentOutOfRangeException(nameof(encodeFormat), encodeFormat, null);
 | |
|             }
 | |
| 
 | |
| 
 | |
|             _logger.LogDebug("Favicon for {Domain} downloaded and saved successfully", domain);
 | |
|             return filename;
 | |
|         } catch (Exception ex)
 | |
|         {
 | |
|             _logger.LogError(ex, "Error downloading favicon for {Domain}", domain);
 | |
|             throw;
 | |
|         }
 | |
|     }
 | |
| 
 | |
|     public async Task<string> DownloadPublisherImageAsync(string publisherName, EncodeFormat encodeFormat)
 | |
|     {
 | |
|         try
 | |
|         {
 | |
|             var publisherLink = await FallbackToKavitaReaderPublisher(publisherName);
 | |
|             if (string.IsNullOrEmpty(publisherLink))
 | |
|             {
 | |
|                 throw new KavitaException($"Could not grab publisher image for {publisherName}");
 | |
|             }
 | |
| 
 | |
|             _logger.LogTrace("Fetching publisher image from {Url}", publisherLink.Sanitize());
 | |
|             // Download the publisher file using Flurl
 | |
|             var publisherStream = await publisherLink
 | |
|                 .AllowHttpStatus("2xx,304")
 | |
|                 .GetStreamAsync();
 | |
| 
 | |
|             // Create the destination file path
 | |
|             using var image = Image.NewFromStream(publisherStream);
 | |
|             var filename = ImageService.GetPublisherFormat(publisherName, encodeFormat);
 | |
|             switch (encodeFormat)
 | |
|             {
 | |
|                 case EncodeFormat.PNG:
 | |
|                     image.Pngsave(Path.Combine(_directoryService.PublisherDirectory, filename));
 | |
|                     break;
 | |
|                 case EncodeFormat.WEBP:
 | |
|                     image.Webpsave(Path.Combine(_directoryService.PublisherDirectory, filename));
 | |
|                     break;
 | |
|                 case EncodeFormat.AVIF:
 | |
|                     image.Heifsave(Path.Combine(_directoryService.PublisherDirectory, filename));
 | |
|                     break;
 | |
|                 default:
 | |
|                     throw new ArgumentOutOfRangeException(nameof(encodeFormat), encodeFormat, null);
 | |
|             }
 | |
| 
 | |
| 
 | |
|             _logger.LogDebug("Publisher image for {PublisherName} downloaded and saved successfully", publisherName.Sanitize());
 | |
|             return filename;
 | |
|         } catch (Exception ex)
 | |
|         {
 | |
|             _logger.LogError(ex, "Error downloading image for {PublisherName}", publisherName.Sanitize());
 | |
|             throw;
 | |
|         }
 | |
|     }
 | |
| 
 | |
|     /// <summary>
 | |
|     /// Attempts to download the Person image from CoverDB while matching against metadata within the Person
 | |
|     /// </summary>
 | |
|     /// <param name="person"></param>
 | |
|     /// <param name="encodeFormat"></param>
 | |
|     /// <returns>Person image (in correct directory) or null if not found/error</returns>
 | |
|     public async Task<string?> DownloadPersonImageAsync(Person person, EncodeFormat encodeFormat)
 | |
|     {
 | |
|         try
 | |
|         {
 | |
|             var personImageLink = await GetCoverPersonImagePath(person);
 | |
|             if (string.IsNullOrEmpty(personImageLink))
 | |
|             {
 | |
|                 throw new KavitaException($"Could not grab person image for {person.Name}");
 | |
|             }
 | |
| 
 | |
|             // Create the destination file path
 | |
|             var filename = ImageService.GetPersonFormat(person.Id) + encodeFormat.GetExtension();
 | |
|             var targetFile = Path.Combine(_directoryService.CoverImageDirectory, filename);
 | |
| 
 | |
|             // Ensure if file exists, we delete to overwrite
 | |
| 
 | |
| 
 | |
|             _logger.LogTrace("Fetching publisher image from {Url}", personImageLink.Sanitize());
 | |
|             // Download the publisher file using Flurl
 | |
|             var personStream = await personImageLink
 | |
|                 .AllowHttpStatus("2xx,304")
 | |
|                 .GetStreamAsync();
 | |
| 
 | |
|             using var image = Image.NewFromStream(personStream);
 | |
|             switch (encodeFormat)
 | |
|             {
 | |
|                 case EncodeFormat.PNG:
 | |
|                     image.Pngsave(targetFile);
 | |
|                     break;
 | |
|                 case EncodeFormat.WEBP:
 | |
|                     image.Webpsave(targetFile);
 | |
|                     break;
 | |
|                 case EncodeFormat.AVIF:
 | |
|                     image.Heifsave(targetFile);
 | |
|                     break;
 | |
|                 default:
 | |
|                     throw new ArgumentOutOfRangeException(nameof(encodeFormat), encodeFormat, null);
 | |
|             }
 | |
| 
 | |
|             _logger.LogDebug("Person image for {PersonName} downloaded and saved successfully", person.Name);
 | |
| 
 | |
|             return filename;
 | |
|         } catch (Exception ex)
 | |
|         {
 | |
|             _logger.LogError(ex, "Error downloading image for {PersonName}", person.Name);
 | |
|         }
 | |
| 
 | |
|         return null;
 | |
|     }
 | |
| 
 | |
|     private async Task<string> GetCoverPersonImagePath(Person person)
 | |
|     {
 | |
|         var tempFile = Path.Join(_directoryService.TempDirectory, "people.yml");
 | |
| 
 | |
|         // Check if the file already exists and skip download in Development environment
 | |
|         if (File.Exists(tempFile))
 | |
|         {
 | |
|             if (_env.IsDevelopment())
 | |
|             {
 | |
|                 _logger.LogInformation("Using existing people.yml file in Development environment");
 | |
|             }
 | |
|             else
 | |
|             {
 | |
|                 // Remove file if not in Development and file is older than 7 days
 | |
|                 if (File.GetLastWriteTime(tempFile) < DateTime.Now.AddDays(-7))
 | |
|                 {
 | |
|                     File.Delete(tempFile);
 | |
|                 }
 | |
|             }
 | |
|         }
 | |
| 
 | |
|         // Download the file if it doesn't exist or was deleted due to age
 | |
|         if (!File.Exists(tempFile))
 | |
|         {
 | |
|             var masterPeopleFile = await $"{NewHost}people/people.yml"
 | |
|                 .DownloadFileAsync(_directoryService.TempDirectory);
 | |
| 
 | |
|             if (!File.Exists(tempFile) || string.IsNullOrEmpty(masterPeopleFile))
 | |
|             {
 | |
|                 _logger.LogError("Could not download people.yml from Github");
 | |
|                 return null;
 | |
|             }
 | |
|         }
 | |
| 
 | |
| 
 | |
|         var coverDbRepository = new CoverDbRepository(tempFile);
 | |
| 
 | |
|         var coverAuthor = coverDbRepository.FindBestAuthorMatch(person);
 | |
|         if (coverAuthor == null || string.IsNullOrEmpty(coverAuthor.ImagePath))
 | |
|         {
 | |
|             throw new KavitaException($"Could not grab person image for {person.Name}");
 | |
|         }
 | |
| 
 | |
|         return $"{NewHost}{coverAuthor.ImagePath}";
 | |
|     }
 | |
| 
 | |
|     private static async Task<string> FallbackToKavitaReaderFavicon(string baseUrl)
 | |
|     {
 | |
|         var correctSizeLink = string.Empty;
 | |
|         // TODO: Pull this down and store it in temp/ to save on requests
 | |
|         var allOverrides = await $"{NewHost}favicons/urls.txt"
 | |
|             .GetStringAsync();
 | |
| 
 | |
|         if (!string.IsNullOrEmpty(allOverrides))
 | |
|         {
 | |
|             var cleanedBaseUrl = baseUrl.Replace("https://", string.Empty);
 | |
|             var externalFile = allOverrides
 | |
|                 .Split("\n")
 | |
|                 .FirstOrDefault(url =>
 | |
|                     cleanedBaseUrl.Equals(url.Replace(".png", string.Empty)) ||
 | |
|                     cleanedBaseUrl.Replace("www.", string.Empty).Equals(url.Replace(".png", string.Empty)
 | |
|                     ));
 | |
| 
 | |
|             if (string.IsNullOrEmpty(externalFile))
 | |
|             {
 | |
|                 throw new KavitaException($"Could not grab favicon from {baseUrl.Sanitize()}");
 | |
|             }
 | |
| 
 | |
|             correctSizeLink = $"{NewHost}favicons/" + externalFile;
 | |
|         }
 | |
| 
 | |
|         return correctSizeLink;
 | |
|     }
 | |
| 
 | |
|     private static async Task<string> FallbackToKavitaReaderPublisher(string publisherName)
 | |
|     {
 | |
|         var externalLink = string.Empty;
 | |
|         // TODO: Pull this down and store it in temp/ to save on requests
 | |
|         var allOverrides = await $"{NewHost}publishers/publishers.txt".GetStringAsync();
 | |
| 
 | |
|         if (!string.IsNullOrEmpty(allOverrides))
 | |
|         {
 | |
|             var externalFile = allOverrides
 | |
|                 .Split("\n")
 | |
|                 .Select(publisherLine =>
 | |
|                 {
 | |
|                     var tokens = publisherLine.Split("|");
 | |
|                     if (tokens.Length != 2) return null;
 | |
|                     var aliases = tokens[0];
 | |
|                     // Multiple publisher aliases are separated by #
 | |
|                     if (aliases.Split("#").Any(name => name.ToLowerInvariant().Trim().Equals(publisherName.ToLowerInvariant().Trim())))
 | |
|                     {
 | |
|                         return tokens[1];
 | |
|                     }
 | |
|                     return null;
 | |
|                 })
 | |
|                 .FirstOrDefault(url => !string.IsNullOrEmpty(url));
 | |
| 
 | |
|             if (string.IsNullOrEmpty(externalFile))
 | |
|             {
 | |
|                 throw new KavitaException($"Could not grab publisher image for {publisherName}");
 | |
|             }
 | |
| 
 | |
|             externalLink = $"{NewHost}publishers/" + externalFile;
 | |
|         }
 | |
| 
 | |
|         return externalLink;
 | |
|     }
 | |
| }
 |