2021-09-27 12:42:46 +00:00
|
|
|
using System;
|
|
|
|
using System.Collections.Generic;
|
|
|
|
using System.IO;
|
|
|
|
using System.Linq;
|
|
|
|
using System.Threading;
|
|
|
|
using System.Threading.Tasks;
|
|
|
|
using Microsoft.Extensions.Logging;
|
|
|
|
using Wabbajack.Common;
|
|
|
|
using Wabbajack.FileExtractor.ExtractedFiles;
|
2023-01-21 19:36:12 +00:00
|
|
|
using Wabbajack.Hashing.PHash;
|
2021-09-27 12:42:46 +00:00
|
|
|
using Wabbajack.Hashing.xxHash64;
|
|
|
|
using Wabbajack.Paths;
|
|
|
|
using Wabbajack.Paths.IO;
|
2021-10-12 12:20:34 +00:00
|
|
|
using Wabbajack.RateLimiter;
|
2022-06-22 01:38:42 +00:00
|
|
|
using Wabbajack.VFS.Interfaces;
|
2021-09-27 12:42:46 +00:00
|
|
|
|
2021-10-23 16:51:17 +00:00
|
|
|
namespace Wabbajack.VFS;
|
|
|
|
|
|
|
|
public class Context
|
2021-09-27 12:42:46 +00:00
|
|
|
{
|
2021-10-23 16:51:17 +00:00
|
|
|
public const ulong FileVersion = 0x03;
|
|
|
|
public const string Magic = "WABBAJACK VFS FILE";
|
|
|
|
private readonly TemporaryFileManager _manager;
|
2021-09-27 12:42:46 +00:00
|
|
|
|
2021-10-23 16:51:17 +00:00
|
|
|
private readonly ParallelOptions _parallelOptions;
|
2021-09-27 12:42:46 +00:00
|
|
|
|
2021-10-23 16:51:17 +00:00
|
|
|
public readonly FileExtractor.FileExtractor Extractor;
|
|
|
|
public readonly FileHashCache HashCache;
|
|
|
|
public readonly IResource<Context> Limiter;
|
2021-10-23 22:27:59 +00:00
|
|
|
public readonly IResource<FileHashCache> HashLimiter;
|
2021-10-23 16:51:17 +00:00
|
|
|
public readonly ILogger<Context> Logger;
|
2022-06-22 01:38:42 +00:00
|
|
|
public readonly IVfsCache VfsCache;
|
2021-09-27 12:42:46 +00:00
|
|
|
|
2021-10-23 16:51:17 +00:00
|
|
|
public Context(ILogger<Context> logger, ParallelOptions parallelOptions, TemporaryFileManager manager,
|
2022-06-22 01:38:42 +00:00
|
|
|
IVfsCache vfsCache,
|
2023-01-21 19:36:12 +00:00
|
|
|
FileHashCache hashCache, IResource<Context> limiter, IResource<FileHashCache> hashLimiter,
|
|
|
|
FileExtractor.FileExtractor extractor, IImageLoader imageLoader)
|
2021-10-23 16:51:17 +00:00
|
|
|
{
|
|
|
|
Limiter = limiter;
|
2021-10-23 22:27:59 +00:00
|
|
|
HashLimiter = hashLimiter;
|
2021-10-23 16:51:17 +00:00
|
|
|
Logger = logger;
|
|
|
|
_manager = manager;
|
|
|
|
Extractor = extractor;
|
|
|
|
VfsCache = vfsCache;
|
|
|
|
HashCache = hashCache;
|
|
|
|
_parallelOptions = parallelOptions;
|
2023-01-21 19:36:12 +00:00
|
|
|
ImageLoader = imageLoader;
|
2021-10-23 16:51:17 +00:00
|
|
|
}
|
2021-09-27 12:42:46 +00:00
|
|
|
|
2022-06-29 13:18:04 +00:00
|
|
|
public Context WithTemporaryFileManager(TemporaryFileManager manager)
|
|
|
|
{
|
|
|
|
return new Context(Logger, _parallelOptions, manager, VfsCache, HashCache, Limiter, HashLimiter,
|
2023-01-21 19:36:12 +00:00
|
|
|
Extractor.WithTemporaryFileManager(manager), ImageLoader);
|
2022-06-29 13:18:04 +00:00
|
|
|
}
|
|
|
|
|
2021-10-23 22:27:59 +00:00
|
|
|
|
2021-10-23 16:51:17 +00:00
|
|
|
public IndexRoot Index { get; private set; } = IndexRoot.Empty;
|
2023-01-21 19:36:12 +00:00
|
|
|
public IImageLoader ImageLoader { get; }
|
2021-09-27 12:42:46 +00:00
|
|
|
|
2021-10-23 16:51:17 +00:00
|
|
|
public async Task<IndexRoot> AddRoot(AbsolutePath root, CancellationToken token)
|
|
|
|
{
|
2022-08-22 15:34:19 +00:00
|
|
|
return await AddRoots(new[] {root}, token);
|
2021-10-23 16:51:17 +00:00
|
|
|
}
|
2021-09-27 12:42:46 +00:00
|
|
|
|
2022-08-22 15:34:19 +00:00
|
|
|
public async Task<IndexRoot> AddRoots(IEnumerable<AbsolutePath> roots, CancellationToken token, Func<long, long, Task>? updateFunction = null)
|
2021-10-23 16:51:17 +00:00
|
|
|
{
|
|
|
|
var native = Index.AllFiles.Where(file => file.IsNative).ToDictionary(file => file.FullPath.Base);
|
2021-09-27 12:42:46 +00:00
|
|
|
|
2021-10-23 16:51:17 +00:00
|
|
|
var filtered = Index.AllFiles.Where(file => ((AbsolutePath) file.Name).FileExists()).ToList();
|
2021-09-27 12:42:46 +00:00
|
|
|
|
2021-10-23 16:51:17 +00:00
|
|
|
var filesToIndex = roots.SelectMany(root => root.EnumerateFiles()).ToList();
|
2021-09-27 12:42:46 +00:00
|
|
|
|
2022-08-19 23:59:29 +00:00
|
|
|
var idx = 0;
|
2021-10-23 16:51:17 +00:00
|
|
|
var allFiles = await filesToIndex
|
|
|
|
.PMapAll(async f =>
|
|
|
|
{
|
2022-08-19 23:59:29 +00:00
|
|
|
using var job = await Limiter.Begin($"Indexing {f.FileName}", 0, token);
|
2021-10-23 16:51:17 +00:00
|
|
|
if (native.TryGetValue(f, out var found))
|
|
|
|
if (found.LastModified == f.LastModifiedUtc().AsUnixTime() && found.Size == f.Size())
|
|
|
|
return found;
|
2022-08-19 23:59:29 +00:00
|
|
|
Interlocked.Increment(ref idx);
|
|
|
|
updateFunction?.Invoke(idx, filesToIndex.Count);
|
|
|
|
|
2021-10-23 16:51:17 +00:00
|
|
|
return await VirtualFile.Analyze(this, null, new NativeFileStreamFactory(f), f, token);
|
|
|
|
}).ToList();
|
2021-09-27 12:42:46 +00:00
|
|
|
|
2021-10-23 16:51:17 +00:00
|
|
|
var newIndex = await IndexRoot.Empty.Integrate(filtered.Concat(allFiles).ToList());
|
2021-09-27 12:42:46 +00:00
|
|
|
|
2021-10-23 16:51:17 +00:00
|
|
|
lock (this)
|
|
|
|
{
|
|
|
|
Index = newIndex;
|
2021-09-27 12:42:46 +00:00
|
|
|
}
|
|
|
|
|
2022-08-22 15:34:19 +00:00
|
|
|
await VfsCache.Clean();
|
2022-08-19 23:59:29 +00:00
|
|
|
|
2021-10-23 16:51:17 +00:00
|
|
|
return newIndex;
|
|
|
|
}
|
|
|
|
|
|
|
|
/// <summary>
|
|
|
|
/// Extracts a file
|
|
|
|
/// </summary>
|
|
|
|
/// <param name="queue">Work queue to use when required by some formats</param>
|
|
|
|
/// <param name="files">Predefined list of files to extract, all others will be skipped</param>
|
|
|
|
/// <param name="callback">Func called for each file extracted</param>
|
|
|
|
/// <param name="tempFolder">Optional: folder to use for temporary storage</param>
|
2022-08-22 23:15:19 +00:00
|
|
|
/// <param name="runInParallel">Optional: run `callback`s in parallel</param>
|
2021-10-23 16:51:17 +00:00
|
|
|
/// <returns></returns>
|
|
|
|
/// <exception cref="Exception"></exception>
|
|
|
|
public async Task Extract(HashSet<VirtualFile> files, Func<VirtualFile, IExtractedFile, ValueTask> callback,
|
2022-08-22 23:15:19 +00:00
|
|
|
CancellationToken token, AbsolutePath? tempFolder = null, bool runInParallel = true)
|
2021-10-23 16:51:17 +00:00
|
|
|
{
|
|
|
|
var top = new VirtualFile();
|
|
|
|
var filesByParent = files.SelectMany(f => f.FilesInFullPath)
|
|
|
|
.Distinct()
|
|
|
|
.GroupBy(f => f.Parent ?? top)
|
|
|
|
.ToDictionary(f => f.Key);
|
|
|
|
|
|
|
|
async Task HandleFile(VirtualFile file, IExtractedFile sfn)
|
2021-09-27 12:42:46 +00:00
|
|
|
{
|
2021-10-23 16:51:17 +00:00
|
|
|
if (filesByParent.ContainsKey(file))
|
|
|
|
sfn.CanMove = false;
|
2021-09-27 12:42:46 +00:00
|
|
|
|
2021-10-23 16:51:17 +00:00
|
|
|
if (files.Contains(file)) await callback(file, sfn);
|
|
|
|
if (filesByParent.TryGetValue(file, out var children))
|
2021-09-27 12:42:46 +00:00
|
|
|
{
|
2021-10-23 16:51:17 +00:00
|
|
|
var fileNames = children.ToDictionary(c => c.RelativeName);
|
|
|
|
try
|
|
|
|
{
|
|
|
|
await Extractor.GatheringExtract(sfn,
|
|
|
|
r => fileNames.ContainsKey(r),
|
|
|
|
async (rel, csf) =>
|
|
|
|
{
|
|
|
|
await HandleFile(fileNames[rel], csf);
|
|
|
|
return 0;
|
|
|
|
},
|
|
|
|
token,
|
|
|
|
fileNames.Keys.ToHashSet());
|
|
|
|
}
|
2022-10-07 22:57:12 +00:00
|
|
|
catch (Exception)
|
2021-09-27 12:42:46 +00:00
|
|
|
{
|
2021-10-23 16:51:17 +00:00
|
|
|
await using var stream = await sfn.GetStream();
|
|
|
|
var hash = await stream.HashingCopy(Stream.Null, token);
|
|
|
|
if (hash != file.Hash)
|
|
|
|
throw new Exception(
|
|
|
|
$"File {file.FullPath} is corrupt, please delete it and retry the installation");
|
|
|
|
throw;
|
2021-09-27 12:42:46 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2022-08-22 23:15:19 +00:00
|
|
|
if (runInParallel)
|
|
|
|
{
|
|
|
|
await filesByParent[top].PDoAll(
|
|
|
|
async file => await HandleFile(file, new ExtractedNativeFile(file.AbsoluteName) {CanMove = false}));
|
|
|
|
}
|
|
|
|
else
|
|
|
|
{
|
|
|
|
foreach (var file in filesByParent[top])
|
|
|
|
{
|
|
|
|
await HandleFile(file, new ExtractedNativeFile(file.AbsoluteName) {CanMove = false});
|
|
|
|
}
|
|
|
|
}
|
2021-10-23 16:51:17 +00:00
|
|
|
}
|
2021-09-27 12:42:46 +00:00
|
|
|
|
2021-10-23 16:51:17 +00:00
|
|
|
#region KnownFiles
|
2021-09-27 12:42:46 +00:00
|
|
|
|
2021-10-23 16:51:17 +00:00
|
|
|
private List<HashRelativePath> _knownFiles = new();
|
|
|
|
private readonly Dictionary<Hash, AbsolutePath> _knownArchives = new();
|
2021-09-27 12:42:46 +00:00
|
|
|
|
|
|
|
|
2021-10-23 16:51:17 +00:00
|
|
|
public void AddKnown(IEnumerable<HashRelativePath> known, Dictionary<Hash, AbsolutePath> archives)
|
|
|
|
{
|
|
|
|
_knownFiles.AddRange(known);
|
|
|
|
foreach (var (key, value) in archives)
|
|
|
|
_knownArchives.TryAdd(key, value);
|
|
|
|
}
|
2021-09-27 12:42:46 +00:00
|
|
|
|
2021-11-03 05:03:41 +00:00
|
|
|
public async ValueTask BackfillMissing()
|
2021-10-23 16:51:17 +00:00
|
|
|
{
|
|
|
|
var newFiles = _knownArchives.ToDictionary(kv => kv.Key,
|
|
|
|
kv => new VirtualFile
|
|
|
|
{
|
|
|
|
Name = kv.Value,
|
|
|
|
Size = kv.Value.Size(),
|
|
|
|
Hash = kv.Key
|
|
|
|
});
|
2021-09-27 12:42:46 +00:00
|
|
|
|
2021-10-23 16:51:17 +00:00
|
|
|
foreach (var f in newFiles.Values)
|
|
|
|
f.FillFullPath(0);
|
2021-09-27 12:42:46 +00:00
|
|
|
|
2021-10-23 16:51:17 +00:00
|
|
|
var parentchild = new Dictionary<(VirtualFile, RelativePath), VirtualFile>();
|
|
|
|
|
|
|
|
void BackFillOne(HashRelativePath file)
|
|
|
|
{
|
|
|
|
var parent = newFiles[file.Hash];
|
|
|
|
foreach (var path in file.Parts)
|
2021-09-27 12:42:46 +00:00
|
|
|
{
|
2021-10-23 16:51:17 +00:00
|
|
|
if (parentchild.TryGetValue((parent, path), out var foundParent))
|
2021-09-27 12:42:46 +00:00
|
|
|
{
|
2021-10-23 16:51:17 +00:00
|
|
|
parent = foundParent;
|
|
|
|
continue;
|
2021-09-27 12:42:46 +00:00
|
|
|
}
|
|
|
|
|
2021-10-23 16:51:17 +00:00
|
|
|
var nf = new VirtualFile {Name = path, Parent = parent};
|
|
|
|
nf.FillFullPath();
|
|
|
|
parent.Children = parent.Children.Add(nf);
|
|
|
|
parentchild.Add((parent, path), nf);
|
|
|
|
parent = nf;
|
|
|
|
}
|
|
|
|
}
|
2021-09-27 12:42:46 +00:00
|
|
|
|
2021-10-23 16:51:17 +00:00
|
|
|
_knownFiles.Where(f => f.Parts.Length > 0).Do(BackFillOne);
|
2021-09-27 12:42:46 +00:00
|
|
|
|
2021-10-23 16:51:17 +00:00
|
|
|
var newIndex = await Index.Integrate(newFiles.Values.ToList());
|
2021-09-27 12:42:46 +00:00
|
|
|
|
2021-10-23 16:51:17 +00:00
|
|
|
lock (this)
|
|
|
|
{
|
|
|
|
Index = newIndex;
|
2021-09-27 12:42:46 +00:00
|
|
|
}
|
|
|
|
|
2021-10-23 16:51:17 +00:00
|
|
|
_knownFiles = new List<HashRelativePath>();
|
2021-09-27 12:42:46 +00:00
|
|
|
}
|
2021-10-23 16:51:17 +00:00
|
|
|
|
|
|
|
#endregion
|
2021-09-27 12:42:46 +00:00
|
|
|
}
|