2021-09-27 12:42:46 +00:00
|
|
|
using System;
|
|
|
|
using System.Collections.Generic;
|
2022-06-08 13:12:44 +00:00
|
|
|
using System.IO;
|
2021-09-27 12:42:46 +00:00
|
|
|
using System.Linq;
|
|
|
|
using System.Net.Http;
|
2022-06-08 03:48:13 +00:00
|
|
|
using System.Text.Encodings.Web;
|
2021-09-27 12:42:46 +00:00
|
|
|
using System.Text.RegularExpressions;
|
|
|
|
using System.Threading;
|
|
|
|
using System.Threading.Tasks;
|
2022-06-08 03:48:13 +00:00
|
|
|
using System.Web;
|
|
|
|
using HtmlAgilityPack;
|
2021-09-27 12:42:46 +00:00
|
|
|
using Microsoft.Extensions.Logging;
|
2022-08-21 20:23:11 +00:00
|
|
|
using Wabbajack.Common;
|
2021-09-27 12:42:46 +00:00
|
|
|
using Wabbajack.Downloaders.Interfaces;
|
|
|
|
using Wabbajack.DTOs;
|
|
|
|
using Wabbajack.DTOs.DownloadStates;
|
|
|
|
using Wabbajack.DTOs.Validation;
|
|
|
|
using Wabbajack.Hashing.xxHash64;
|
|
|
|
using Wabbajack.Networking.Http;
|
|
|
|
using Wabbajack.Networking.Http.Interfaces;
|
|
|
|
using Wabbajack.Paths;
|
|
|
|
using Wabbajack.RateLimiter;
|
|
|
|
|
2021-10-23 16:51:17 +00:00
|
|
|
namespace Wabbajack.Downloaders.GoogleDrive;
|
|
|
|
|
2022-06-08 03:48:13 +00:00
|
|
|
/// <summary>
/// Downloader for archives hosted on <c>drive.google.com</c>. It converts between Google Drive
/// URLs and <see cref="DTOs.DownloadStates.GoogleDrive"/> states, and builds the HTTP requests
/// used to download a file or to check that it is still reachable.
/// </summary>
public class GoogleDriveDownloader : ADownloader<DTOs.DownloadStates.GoogleDrive>, IUrlDownloader, IProxyable
{
    // Captures the file id either after "id=" or after "/file/d/" in a Drive URL.
    private static readonly Regex GDriveRegex = new("((?<=id=)[a-zA-Z0-9_-]*)|(?<=\\/file\\/d\\/)[a-zA-Z0-9_-]*",
        RegexOptions.Compiled);

    private readonly HttpClient _client;
    private readonly IHttpDownloader _downloader;
    private readonly ILogger<GoogleDriveDownloader> _logger;

    /// <summary>Creates the downloader from its injected collaborators.</summary>
    /// <param name="logger">Logger used to report URLs that could not be parsed.</param>
    /// <param name="client">HTTP client used for probe requests and streamed downloads.</param>
    /// <param name="downloader">Downloader that writes a request's response to disk.</param>
    public GoogleDriveDownloader(ILogger<GoogleDriveDownloader> logger, HttpClient client,
        IHttpDownloader downloader)
    {
        _logger = logger;
        _client = client;
        _downloader = downloader;
    }

    /// <summary>No preparation is required for this downloader.</summary>
    /// <returns>Always <c>true</c>.</returns>
    public override Task<bool> Prepare() => Task.FromResult(true);

    /// <summary>Checks whether the state's file id is listed in the allow list's Google ids.</summary>
    /// <param name="allowList">Allow list whose <c>GoogleIDs</c> collection is consulted.</param>
    /// <param name="state">State to check; it is cast to a Google Drive state.</param>
    /// <returns><c>true</c> when the id is present in <c>GoogleIDs</c>.</returns>
    public override bool IsAllowed(ServerAllowList allowList, IDownloadState state)
    {
        var driveState = (DTOs.DownloadStates.GoogleDrive) state;
        return allowList.GoogleIDs.Contains(driveState.Id);
    }

    /// <summary>Extracts a Google Drive state from a <c>drive.google.com</c> URL.</summary>
    /// <param name="uri">URL to inspect.</param>
    /// <returns>
    /// A state carrying the file id, or <c>null</c> when the host is not <c>drive.google.com</c>
    /// or no non-empty id could be extracted (the latter case is logged as a warning).
    /// </returns>
    public IDownloadState? Parse(Uri uri)
    {
        if (uri.Host != "drive.google.com") return null;

        var match = GDriveRegex.Match(uri.ToString());

        // The pattern uses '*', so a URL such as "...?id=" matches with an empty id.
        // An empty id cannot address a file, so it is treated as a parse failure.
        if (match.Success && match.Length > 0)
            return new DTOs.DownloadStates.GoogleDrive {Id = match.Value};

        _logger.LogWarning("Tried to parse drive.google.com Url but couldn't get an id from: {Uri}", uri);
        return null;
    }

    /// <summary>Builds the direct-download URL for a state.</summary>
    /// <param name="state">State to convert.</param>
    /// <returns>
    /// The direct-download URL. When <paramref name="state"/> is not a Google Drive state the id
    /// portion of the URL is left empty.
    /// </returns>
    public Uri UnParse(IDownloadState state)
    {
        var id = (state as DTOs.DownloadStates.GoogleDrive)?.Id;
        return new Uri(DirectDownloadUrl(id));
    }

    /// <summary>Resolves a state from meta ini data by parsing its <c>directURL</c> entry.</summary>
    /// <param name="iniData">Key/value pairs read from the ini data.</param>
    /// <returns>
    /// The parsed state, or <c>null</c> when <c>directURL</c> is missing, is not an absolute URL,
    /// or is not a usable Google Drive URL.
    /// </returns>
    public override IDownloadState? Resolve(IReadOnlyDictionary<string, string> iniData)
    {
        if (iniData.TryGetValue("directURL", out var rawUrl) &&
            Uri.TryCreate(rawUrl.CleanIniString(), UriKind.Absolute, out var uri))
            return Parse(uri);

        return null;
    }

    /// <summary>This downloader reports <see cref="Priority.Normal"/>.</summary>
    public override Priority Priority => Priority.Normal;

    /// <summary>Requests the archive's file and hands the response stream to <paramref name="fn"/>.</summary>
    /// <typeparam name="T">Result type produced by <paramref name="fn"/>.</typeparam>
    /// <param name="archive">Archive whose state must be a Google Drive state.</param>
    /// <param name="fn">Callback that consumes the response stream.</param>
    /// <param name="token">Cancellation token passed to the HTTP calls.</param>
    /// <returns>The value returned by <paramref name="fn"/>.</returns>
    /// <exception cref="ArgumentException">The archive's state is not a Google Drive state.</exception>
    public async Task<T> DownloadStream<T>(Archive archive, Func<Stream, Task<T>> fn, CancellationToken token)
    {
        if (archive.State is not DTOs.DownloadStates.GoogleDrive state)
            throw new ArgumentException("Archive state is not a Google Drive download state.", nameof(archive));

        // ToMessage never returns null when download is true.
        using var msg = await ToMessage(state, true, token);
        using var result = await _client.SendAsync(msg!, token);
        HttpException.ThrowOnFailure(result);
        await using var stream = await result.Content.ReadAsStreamAsync(token);
        return await fn(stream);
    }

    /// <summary>Downloads the file to <paramref name="destination"/> via the injected HTTP downloader.</summary>
    /// <param name="archive">Archive being downloaded (not read by this method).</param>
    /// <param name="state">Google Drive state identifying the file.</param>
    /// <param name="destination">Path the file is written to.</param>
    /// <param name="job">Job passed through to the HTTP downloader.</param>
    /// <param name="token">Cancellation token.</param>
    /// <returns>The hash returned by the HTTP downloader.</returns>
    public override async Task<Hash> Download(Archive archive, DTOs.DownloadStates.GoogleDrive state,
        AbsolutePath destination, IJob job, CancellationToken token)
    {
        // ToMessage never returns null when download is true.
        var msg = await ToMessage(state, true, token);
        return await _downloader.Download(msg!, destination, job, token);
    }

    /// <summary>Checks that the file's Drive page still answers with a success status code.</summary>
    /// <param name="archive">Archive being verified (not read by this method).</param>
    /// <param name="state">Google Drive state identifying the file.</param>
    /// <param name="job">Job associated with the verification (not read by this method).</param>
    /// <param name="token">Cancellation token.</param>
    /// <returns><c>true</c> when the probe request succeeded.</returns>
    public override async Task<bool> Verify(Archive archive, DTOs.DownloadStates.GoogleDrive state,
        IJob job, CancellationToken token)
    {
        // Only the presence of the message matters; dispose it since it is never sent.
        using var result = await ToMessage(state, false, token);
        return result != null;
    }

    /// <summary>Produces the meta ini line that records the file's direct-download URL.</summary>
    /// <param name="a">Archive the line is written for (not read by this method).</param>
    /// <param name="state">Google Drive state identifying the file.</param>
    /// <returns>A single <c>directURL=...</c> line.</returns>
    public override IEnumerable<string> MetaIni(Archive a, DTOs.DownloadStates.GoogleDrive state)
    {
        return new[] {$"directURL={DirectDownloadUrl(state.Id)}"};
    }

    /// <summary>
    /// Builds the request for a file: a download request when <paramref name="download"/> is
    /// <c>true</c>, otherwise a request for the file's page that is only returned when a probe
    /// of that page succeeds.
    /// </summary>
    /// <returns>The request, or <c>null</c> when the verification probe failed.</returns>
    private async Task<HttpRequestMessage?> ToMessage(DTOs.DownloadStates.GoogleDrive state, bool download,
        CancellationToken token)
    {
        return download
            ? await CreateDownloadRequest(state, token)
            : await CreateVerifyRequest(state, token);
    }

    /// <summary>
    /// Probes the direct-download URL and returns the request that should be used for the real
    /// download, adding a <c>confirm</c> parameter when the probe indicates one is needed.
    /// </summary>
    /// <exception cref="InvalidOperationException">The probe returned the quota-exceeded page.</exception>
    private async Task<HttpRequestMessage> CreateDownloadRequest(DTOs.DownloadStates.GoogleDrive state,
        CancellationToken token)
    {
        var initialUrl = DirectDownloadUrl(state.Id);

        // Headers are enough to decide what to do. Without ResponseHeadersRead a file that is
        // served directly would be downloaded in full here and then again by the caller.
        using var probe = CreateChromeGet(initialUrl);
        using var response = await _client.SendAsync(probe, HttpCompletionOption.ResponseHeadersRead, token);

        var cookies = response.GetSetCookies();
        var warning = cookies.FirstOrDefault(c => c.Key.StartsWith("download_warning_", StringComparison.Ordinal));

        if (warning == default && response.Content.Headers.ContentType?.MediaType == "text/html")
        {
            var html = await response.Content.ReadAsStringAsync(token);
            if (html.Contains("<title>Google Drive - Quota exceeded</title>"))
                throw new InvalidOperationException("Google Drive - Quota Exceeded");

            var doc = new HtmlDocument();
            doc.LoadHtml(html);

            // An HTML answer containing a POST form with id "downloadForm" is handled like a
            // warning cookie, using the fixed confirmation value "t".
            var hasDownloadForm = doc.DocumentNode.DescendantsAndSelf()
                .Any(d => d.Name == "form" && d.Id == "downloadForm" &&
                          d.GetAttributeValue("method", "") == "post");

            if (hasDownloadForm)
                warning = ("download_warning_", "t");
        }

        // No confirmation needed: reuse the direct URL, with the same user agent as the probe.
        if (warning == default)
            return CreateChromeGet(initialUrl);

        return CreateChromeGet(
            $"https://drive.google.com/uc?export=download&confirm={warning.Value}&id={state.Id}");
    }

    /// <summary>
    /// Requests the file's <c>/edit</c> page and, when the response has a success status code,
    /// returns a fresh request for the same URL.
    /// </summary>
    /// <returns>A new request for the page, or <c>null</c> when the probe was not successful.</returns>
    private async Task<HttpRequestMessage?> CreateVerifyRequest(DTOs.DownloadStates.GoogleDrive state,
        CancellationToken token)
    {
        var url = $"https://drive.google.com/file/d/{state.Id}/edit";

        // Only the status code is inspected, so the body does not need to be buffered.
        using var probe = CreateChromeGet(url);
        using var response = await _client.SendAsync(probe, HttpCompletionOption.ResponseHeadersRead, token);

        return response.IsSuccessStatusCode ? CreateChromeGet(url) : null;
    }

    /// <summary>Formats the direct-download URL for a file id (a null id yields an empty id segment).</summary>
    private static string DirectDownloadUrl(string? id)
    {
        return $"https://drive.google.com/uc?id={id}&export=download";
    }

    /// <summary>Creates a GET request for <paramref name="url"/> with the Chrome user agent applied.</summary>
    private static HttpRequestMessage CreateChromeGet(string url)
    {
        var msg = new HttpRequestMessage(HttpMethod.Get, url);
        msg.UseChromeUserAgent();
        return msg;
    }
}
|