using System; using System.Collections.Concurrent; using System.Collections.Generic; using System.Collections.Immutable; using System.Diagnostics; using System.IO; using System.Linq; using System.Threading.Tasks; using API.Entities; using API.Entities.Enums; using API.Interfaces; using API.Parser; using Hangfire; using Microsoft.Extensions.Logging; namespace API.Services { public class ScannerService : IScannerService { private readonly IUnitOfWork _unitOfWork; private readonly ILogger _logger; private readonly IArchiveService _archiveService; private ConcurrentDictionary> _scannedSeries; private bool _forceUpdate; public ScannerService(IUnitOfWork unitOfWork, ILogger logger, IArchiveService archiveService) { _unitOfWork = unitOfWork; _logger = logger; _archiveService = archiveService; } [DisableConcurrentExecution(timeoutInSeconds: 120)] public void ScanLibraries() { var libraries = Task.Run(() => _unitOfWork.LibraryRepository.GetLibrariesAsync()).Result.ToList(); foreach (var lib in libraries) { ScanLibrary(lib.Id, false); } } private bool ShouldSkipFolderScan(FolderPath folder, ref int skippedFolders) { // NOTE: This solution isn't the best, but it has potential. We need to handle a few other cases so it works great. return false; // if (/*_environment.IsProduction() && */!_forceUpdate && Directory.GetLastWriteTime(folder.Path) < folder.LastScanned) // { // _logger.LogDebug($"{folder.Path} hasn't been updated since last scan. Skipping."); // skippedFolders += 1; // return true; // } // // return false; } private void Cleanup() { _scannedSeries = null; _forceUpdate = false; } [DisableConcurrentExecution(timeoutInSeconds: 120)] public void ScanLibrary(int libraryId, bool forceUpdate) { _forceUpdate = forceUpdate; var sw = Stopwatch.StartNew(); Library library; try { library = Task.Run(() => _unitOfWork.LibraryRepository.GetLibraryForIdAsync(libraryId)).Result; } catch (Exception ex) { // This usually only fails if user is not authenticated. _logger.LogError($"There was an issue fetching Library {libraryId}.", ex); return; } _scannedSeries = new ConcurrentDictionary>(); _logger.LogInformation($"Beginning scan on {library.Name}. Forcing metadata update: {forceUpdate}"); var totalFiles = 0; var skippedFolders = 0; foreach (var folderPath in library.Folders) { if (ShouldSkipFolderScan(folderPath, ref skippedFolders)) continue; try { totalFiles += DirectoryService.TraverseTreeParallelForEach(folderPath.Path, (f) => { try { ProcessFile(f, folderPath.Path); } catch (FileNotFoundException exception) { _logger.LogError(exception, $"The file {f} could not be found"); } }); } catch (ArgumentException ex) { _logger.LogError(ex, $"The directory '{folderPath.Path}' does not exist"); } folderPath.LastScanned = DateTime.Now; } var scanElapsedTime = sw.ElapsedMilliseconds; _logger.LogInformation("Folders Scanned {0} files in {1} milliseconds", totalFiles, scanElapsedTime); sw.Restart(); if (skippedFolders == library.Folders.Count) { _logger.LogInformation("All Folders were skipped due to no modifications to the directories."); _unitOfWork.LibraryRepository.Update(library); _logger.LogInformation("Processed {0} files in {1} milliseconds for {2}", totalFiles, sw.ElapsedMilliseconds, library.Name); Cleanup(); return; } // Remove any series where there were no parsed infos var filtered = _scannedSeries.Where(kvp => kvp.Value.Count != 0); var series = filtered.ToImmutableDictionary(v => v.Key, v => v.Value); UpdateLibrary(libraryId, series, library); _unitOfWork.LibraryRepository.Update(library); if (Task.Run(() => _unitOfWork.Complete()).Result) { _logger.LogInformation($"Scan completed on {library.Name}. Parsed {series.Keys.Count()} series in {sw.ElapsedMilliseconds} ms."); } else { _logger.LogError("There was a critical error that resulted in a failed scan. Please check logs and rescan."); } _logger.LogInformation("Processed {0} files in {1} milliseconds for {2}", totalFiles, sw.ElapsedMilliseconds + scanElapsedTime, library.Name); Cleanup(); } private void UpdateLibrary(int libraryId, ImmutableDictionary> parsedSeries, Library library) { var allSeries = Task.Run(() => _unitOfWork.SeriesRepository.GetSeriesForLibraryIdAsync(libraryId)).Result.ToList(); _logger.LogInformation($"Updating Library {library.Name}"); // Perform DB activities UpsertSeries(library, parsedSeries, allSeries); // Remove series that are no longer on disk RemoveSeriesNotOnDisk(allSeries, parsedSeries, library); foreach (var folder in library.Folders) folder.LastScanned = DateTime.Now; } private void UpsertSeries(Library library, ImmutableDictionary> parsedSeries, IList allSeries) { // NOTE: This is a great point to break the parsing into threads and join back. Each thread can take X series. foreach (var seriesKey in parsedSeries.Keys) { var mangaSeries = ExistingOrDefault(library, allSeries, seriesKey) ?? new Series { Name = seriesKey, OriginalName = seriesKey, NormalizedName = Parser.Parser.Normalize(seriesKey), SortName = seriesKey, Summary = "" }; mangaSeries.NormalizedName = Parser.Parser.Normalize(seriesKey); try { UpdateSeries(ref mangaSeries, parsedSeries[seriesKey].ToArray()); if (!library.Series.Any(s => s.NormalizedName == mangaSeries.NormalizedName)) { _logger.LogInformation($"Added series {mangaSeries.Name}"); library.Series.Add(mangaSeries); } } catch (Exception ex) { _logger.LogError(ex, $"There was an error during scanning of library. {seriesKey} will be skipped."); } } } private void RemoveSeriesNotOnDisk(IEnumerable allSeries, ImmutableDictionary> series, Library library) { _logger.LogInformation("Removing any series that are no longer on disk."); var count = 0; var foundSeries = series.Select(s => Parser.Parser.Normalize(s.Key)).ToList(); var missingSeries = allSeries.Where(existingSeries => !foundSeries.Contains(existingSeries.NormalizedName) || !series.ContainsKey(existingSeries.Name) || !series.ContainsKey(existingSeries.OriginalName)); foreach (var existingSeries in missingSeries) { // Delete series, there is no file to backup any longer. library.Series?.Remove(existingSeries); count++; } _logger.LogInformation($"Removed {count} series that are no longer on disk"); } /// /// Attempts to either add a new instance of a show mapping to the scannedSeries bag or adds to an existing. /// /// private void TrackSeries(ParserInfo info) { if (info.Series == string.Empty) return; _scannedSeries.AddOrUpdate(info.Series, new List() {info}, (_, oldValue) => { oldValue ??= new List(); if (!oldValue.Contains(info)) { oldValue.Add(info); } return oldValue; }); } /// /// Processes files found during a library scan. /// Populates a collection of for DB updates later. /// /// Path of a file /// private void ProcessFile(string path, string rootPath) { var info = Parser.Parser.Parse(path, rootPath); if (info == null) { _logger.LogWarning($"Could not parse from {path}"); return; } TrackSeries(info); } private void UpdateSeries(ref Series series, ParserInfo[] infos) { _logger.LogInformation($"Updating entries for {series.Name}. {infos.Length} related files."); UpdateVolumes(series, infos); series.Pages = series.Volumes.Sum(v => v.Pages); if (ShouldFindCoverImage(series.CoverImage)) { var firstCover = series.Volumes.OrderBy(x => x.Number).FirstOrDefault(x => x.Number != 0); if (firstCover == null && series.Volumes.Any()) { firstCover = series.Volumes.FirstOrDefault(x => x.Number == 0); } series.CoverImage = firstCover?.CoverImage; } if (string.IsNullOrEmpty(series.Summary) || _forceUpdate) { series.Summary = ""; } _logger.LogDebug($"Created {series.Volumes.Count} volumes on {series.Name}"); } private MangaFile CreateMangaFile(ParserInfo info) { return new MangaFile() { FilePath = info.FullFilePath, Format = info.Format, NumberOfPages = info.Format == MangaFormat.Archive ? _archiveService.GetNumberOfPagesFromArchive(info.FullFilePath): 1 }; } private bool ShouldFindCoverImage(byte[] coverImage) { return _forceUpdate || coverImage == null || !coverImage.Any(); } private void UpdateChapters(Volume volume, IEnumerable infos) // ICollection { volume.Chapters ??= new List(); foreach (var info in infos) { try { var chapter = volume.Chapters.SingleOrDefault(c => c.Range == info.Chapters) ?? new Chapter() { Number = Parser.Parser.MinimumNumberFromRange(info.Chapters) + "", Range = info.Chapters, }; AddOrUpdateFileForChapter(chapter, info); chapter.Number = Parser.Parser.MinimumNumberFromRange(info.Chapters) + ""; chapter.Range = info.Chapters; if (volume.Chapters.All(c => c.Range != info.Chapters)) { volume.Chapters.Add(chapter); } } catch (Exception ex) { _logger.LogWarning(ex, $"There was an exception parsing {info.Series} - Volume {volume.Number}'s chapters. Skipping Chapter."); } } foreach (var chapter in volume.Chapters) { chapter.Pages = chapter.Files.Sum(f => f.NumberOfPages); if (ShouldFindCoverImage(chapter.CoverImage)) { chapter.Files ??= new List(); var firstFile = chapter.Files.OrderBy(x => x.Chapter).FirstOrDefault(); if (firstFile != null) chapter.CoverImage = _archiveService.GetCoverImage(firstFile.FilePath, true); } } } private void AddOrUpdateFileForChapter(Chapter chapter, ParserInfo info) { chapter.Files ??= new List(); var existingFile = chapter.Files.SingleOrDefault(f => f.FilePath == info.FullFilePath); if (existingFile != null) { existingFile.Format = info.Format; existingFile.NumberOfPages = _archiveService.GetNumberOfPagesFromArchive(info.FullFilePath); } else { if (info.Format == MangaFormat.Archive) { chapter.Files.Add(CreateMangaFile(info)); } else { _logger.LogDebug($"Ignoring {info.Filename}. Non-archives are not supported yet."); } } } public static Volume ExistingOrDefault(IList existingVolumes, ICollection volumes, string volumeName) { return volumes.SingleOrDefault(v => v.Name == volumeName) ?? existingVolumes.SingleOrDefault(v => v.Name == volumeName); } public static Series ExistingOrDefault(Library library, IEnumerable allSeries, string seriesName) { var name = Parser.Parser.Normalize(seriesName); library.Series ??= new List(); return library.Series.SingleOrDefault(s => Parser.Parser.Normalize(s.Name) == name) ?? allSeries.SingleOrDefault(s => Parser.Parser.Normalize(s.Name) == name); } private void UpdateVolumes(Series series, ParserInfo[] infos) { series.Volumes ??= new List(); _logger.LogDebug($"Updating Volumes for {series.Name}. {infos.Length} related files."); IList existingVolumes = _unitOfWork.SeriesRepository.GetVolumes(series.Id).ToList(); foreach (var info in infos) { try { var volume = ExistingOrDefault(existingVolumes, series.Volumes, info.Volumes) ?? new Volume { Name = info.Volumes, Number = (int) Parser.Parser.MinimumNumberFromRange(info.Volumes), IsSpecial = false, Chapters = new List() }; if (series.Volumes.Any(v => v.Name == volume.Name)) continue; series.Volumes.Add(volume); } catch (Exception ex) { _logger.LogError(ex, $"There was an exception when creating volume {info.Volumes}. Skipping volume."); } } foreach (var volume in series.Volumes) { try { var justVolumeInfos = infos.Where(pi => pi.Volumes == volume.Name).ToArray(); UpdateChapters(volume, justVolumeInfos); volume.Pages = volume.Chapters.Sum(c => c.Pages); _logger.LogDebug($"Created {volume.Chapters.Count} chapters on {series.Name} - Volume {volume.Name}"); } catch (Exception ex) { _logger.LogError(ex, $"There was an exception when creating volume {volume.Name}. Skipping volume."); } } foreach (var volume in series.Volumes) { if (ShouldFindCoverImage(volume.CoverImage)) { // TODO: Create a custom sorter for Chapters so it's consistent across the application var firstChapter = volume.Chapters.OrderBy(x => Double.Parse(x.Number)).FirstOrDefault(); var firstFile = firstChapter?.Files.OrderBy(x => x.Chapter).FirstOrDefault(); if (firstFile != null) volume.CoverImage = _archiveService.GetCoverImage(firstFile.FilePath, true); } } } } }