2023-07-30 21:27:02 -04:00
|
|
|
using System;
|
|
|
|
|
using System.Collections.Generic;
|
|
|
|
|
using System.Linq;
|
|
|
|
|
using SabreTools.Core;
|
|
|
|
|
using SabreTools.DatItems;
|
|
|
|
|
using SabreTools.DatItems.Formats;
|
|
|
|
|
|
|
|
|
|
namespace SabreTools.DatFiles.Formats
|
|
|
|
|
{
|
|
|
|
|
/// <summary>
|
|
|
|
|
/// Represents parsing and writing of an Archive.org file list
|
|
|
|
|
/// </summary>
|
|
|
|
|
internal partial class ArchiveDotOrg : DatFile
|
|
|
|
|
{
|
|
|
|
|
/// <inheritdoc/>
/// <remarks>This format reports <see cref="ItemType.Rom"/> as its only supported item type.</remarks>
protected override ItemType[] GetSupportedTypes() => [ItemType.Rom];
|
|
|
|
|
|
|
|
|
|
/// <inheritdoc/>
/// <remarks>
/// Every item must have a non-empty name. A <see cref="Rom"/> must additionally have a
/// non-negative size and at least one of CRC, MD5 or SHA-1; when all three hashes are
/// absent, the SHA-1 key is the one reported as missing.
/// </remarks>
protected override List<string>? GetMissingRequiredFields(DatItem datItem)
{
    var missing = new List<string>();

    // The name is required regardless of the item type
    if (string.IsNullOrEmpty(datItem.GetName()))
        missing.Add(Models.Metadata.Rom.NameKey);

    // Only Rom items have further requirements
    if (datItem is not Rom rom)
        return missing;

    // Size has to be present and must not be negative
    long? size = rom.GetFieldValue<long?>(Models.Metadata.Rom.SizeKey);
    if (size is null or < 0)
        missing.Add(Models.Metadata.Rom.SizeKey);

    // A single populated hash is enough to satisfy the requirement
    bool hasAnyHash = !string.IsNullOrEmpty(rom.GetFieldValue<string?>(Models.Metadata.Rom.CRCKey))
        || !string.IsNullOrEmpty(rom.GetFieldValue<string?>(Models.Metadata.Rom.MD5Key))
        || !string.IsNullOrEmpty(rom.GetFieldValue<string?>(Models.Metadata.Rom.SHA1Key));
    if (!hasAnyHash)
        missing.Add(Models.Metadata.Rom.SHA1Key);

    return missing;
}
|
|
|
|
|
|
|
|
|
|
/// <inheritdoc/>
/// <remarks>
/// Converts the current items with <c>CreateFiles</c> and passes the result to the
/// Archive.org serializer. Returns false when the serializer reports failure, or when an
/// exception occurs and <paramref name="throwOnError"/> is false.
/// </remarks>
public override bool WriteToFile(string outfile, bool ignoreblanks = false, bool throwOnError = false)
{
    try
    {
        logger.User($"Writing to '{outfile}'...");

        // Build the model first, then hand it to the serializer
        var model = CreateFiles(ignoreblanks);
        var serializer = new Serialization.Files.ArchiveDotOrg();
        bool written = serializer.Serialize(model, outfile);
        if (!written)
        {
            logger.Warning($"File '{outfile}' could not be written! See the log for more details.");
            return false;
        }
    }
    // With throwOnError set, the filter does not match and the exception reaches the caller
    catch (Exception ex) when (!throwOnError)
    {
        logger.Error(ex);
        return false;
    }

    logger.User($"'{outfile}' written!{Environment.NewLine}");
    return true;
}
|
|
|
|
|
|
|
|
|
|
#region Converters
|
|
|
|
|
|
|
|
|
|
/// <summary>
/// Build an Archive.org Files model from the items currently held internally
/// </summary>
/// <param name="ignoreblanks">True if blank roms should be skipped on output, false otherwise</param>
/// <returns>The populated Files model, or null when there are no items to convert</returns>
private Models.ArchiveDotOrg.Files? CreateFiles(bool ignoreblanks)
{
    // Without any items there is nothing to convert
    if (this.Items == null || !this.Items.Any())
        return null;

    // Holds one File per Rom that is not ignored
    var converted = new List<Models.ArchiveDotOrg.File>();

    // Visit every bucket by way of the sorted keys
    foreach (string bucketKey in Items.SortedKeys)
    {
        var bucket = Items.FilteredItems(bucketKey);
        if (bucket == null || !bucket.Any())
            continue;

        for (int i = 0; i < bucket.Count; i++)
        {
            // Fetch the item and run it through the "null" item handling
            var current = bucket[i];
            current = ProcessNullifiedItem(current);

            // Honor the ignore rules, including the blank-rom setting
            if (ShouldIgnore(current, ignoreblanks))
                continue;

            // Only Rom items are converted; anything else is skipped
            if (current is Rom rom)
                converted.Add(CreateFile(rom));
        }
    }

    return new Models.ArchiveDotOrg.Files { File = [.. converted] };
}
|
|
|
|
|
|
|
|
|
|
/// <summary>
/// Create a File from the current Rom DatItem
/// </summary>
/// <param name="item">Rom whose field values are copied onto the new File</param>
/// <returns>
/// A File populated from <paramref name="item"/>. The last-modified time is only set when
/// the Rom's date value parses as an integer.
/// </returns>
private static Models.ArchiveDotOrg.File CreateFile(Rom item)
{
    // Numeric values end up in a machine-readable file, so they are parsed and
    // formatted with the invariant culture rather than the thread's current culture
    var invariant = System.Globalization.CultureInfo.InvariantCulture;

    var file = new Models.ArchiveDotOrg.File
    {
        Name = item.GetName(),
        Source = item.GetFieldValue<string?>(Models.Metadata.Rom.SourceKey),
        BitTorrentMagnetHash = item.GetFieldValue<string?>(Models.Metadata.Rom.BitTorrentMagnetHashKey),
        Size = item.GetFieldValue<long?>(Models.Metadata.Rom.SizeKey)?.ToString(invariant),
        MD5 = item.GetFieldValue<string?>(Models.Metadata.Rom.MD5Key),
        CRC32 = item.GetFieldValue<string?>(Models.Metadata.Rom.CRCKey),
        SHA1 = item.GetFieldValue<string?>(Models.Metadata.Rom.SHA1Key),
        FileCount = item.GetFieldValue<string?>(Models.Metadata.Rom.FileCountKey),
        Format = item.GetFieldValue<string?>(Models.Metadata.Rom.FormatKey),
        Original = item.GetFieldValue<string?>(Models.Metadata.Rom.OriginalKey),
        Summation = item.GetFieldValue<string?>(Models.Metadata.Rom.SummationKey),
        MatrixNumber = item.GetFieldValue<string?>(Models.Metadata.Rom.MatrixNumberKey),
        CollectionCatalogNumber = item.GetFieldValue<string?>(Models.Metadata.Rom.CollectionCatalogNumberKey),

        // ASR-Related
        ASRDetectedLang = item.GetFieldValue<string?>(Models.Metadata.Rom.ASRDetectedLangKey),
        ASRDetectedLangConf = item.GetFieldValue<string?>(Models.Metadata.Rom.ASRDetectedLangConfKey),
        ASRTranscribedLang = item.GetFieldValue<string?>(Models.Metadata.Rom.ASRTranscribedLangKey),
        WhisperASRModuleVersion = item.GetFieldValue<string?>(Models.Metadata.Rom.WhisperASRModuleVersionKey),
        WhisperModelHash = item.GetFieldValue<string?>(Models.Metadata.Rom.WhisperModelHashKey),
        WhisperModelName = item.GetFieldValue<string?>(Models.Metadata.Rom.WhisperModelNameKey),
        WhisperVersion = item.GetFieldValue<string?>(Models.Metadata.Rom.WhisperVersionKey),

        // OCR-Related
        ClothCoverDetectionModuleVersion = item.GetFieldValue<string?>(Models.Metadata.Rom.ClothCoverDetectionModuleVersionKey),
        hOCRCharToWordhOCRVersion = item.GetFieldValue<string?>(Models.Metadata.Rom.hOCRCharToWordhOCRVersionKey),
        hOCRCharToWordModuleVersion = item.GetFieldValue<string?>(Models.Metadata.Rom.hOCRCharToWordModuleVersionKey),
        hOCRFtsTexthOCRVersion = item.GetFieldValue<string?>(Models.Metadata.Rom.hOCRFtsTexthOCRVersionKey),
        hOCRFtsTextModuleVersion = item.GetFieldValue<string?>(Models.Metadata.Rom.hOCRFtsTextModuleVersionKey),
        hOCRPageIndexhOCRVersion = item.GetFieldValue<string?>(Models.Metadata.Rom.hOCRPageIndexhOCRVersionKey),
        hOCRPageIndexModuleVersion = item.GetFieldValue<string?>(Models.Metadata.Rom.hOCRPageIndexModuleVersionKey),
        TesseractOCR = item.GetFieldValue<string?>(Models.Metadata.Rom.TesseractOCRKey),
        TesseractOCRConverted = item.GetFieldValue<string?>(Models.Metadata.Rom.TesseractOCRConvertedKey),
        TesseractOCRDetectedLang = item.GetFieldValue<string?>(Models.Metadata.Rom.TesseractOCRDetectedLangKey),
        TesseractOCRDetectedLangConf = item.GetFieldValue<string?>(Models.Metadata.Rom.TesseractOCRDetectedLangConfKey),
        TesseractOCRDetectedScript = item.GetFieldValue<string?>(Models.Metadata.Rom.TesseractOCRDetectedScriptKey),
        TesseractOCRDetectedScriptConf = item.GetFieldValue<string?>(Models.Metadata.Rom.TesseractOCRDetectedScriptConfKey),
        TesseractOCRParameters = item.GetFieldValue<string?>(Models.Metadata.Rom.TesseractOCRParametersKey),
        TesseractOCRModuleVersion = item.GetFieldValue<string?>(Models.Metadata.Rom.TesseractOCRModuleVersionKey),
        PDFModuleVersion = item.GetFieldValue<string?>(Models.Metadata.Rom.PDFModuleVersionKey),
        WordConfidenceInterval0To10 = item.GetFieldValue<string?>(Models.Metadata.Rom.WordConfidenceInterval0To10Key),
        WordConfidenceInterval11To20 = item.GetFieldValue<string?>(Models.Metadata.Rom.WordConfidenceInterval11To20Key),
        WordConfidenceInterval21To30 = item.GetFieldValue<string?>(Models.Metadata.Rom.WordConfidenceInterval21To30Key),
        WordConfidenceInterval31To40 = item.GetFieldValue<string?>(Models.Metadata.Rom.WordConfidenceInterval31To40Key),
        WordConfidenceInterval41To50 = item.GetFieldValue<string?>(Models.Metadata.Rom.WordConfidenceInterval41To50Key),
        WordConfidenceInterval51To60 = item.GetFieldValue<string?>(Models.Metadata.Rom.WordConfidenceInterval51To60Key),
        WordConfidenceInterval61To70 = item.GetFieldValue<string?>(Models.Metadata.Rom.WordConfidenceInterval61To70Key),
        WordConfidenceInterval71To80 = item.GetFieldValue<string?>(Models.Metadata.Rom.WordConfidenceInterval71To80Key),
        WordConfidenceInterval81To90 = item.GetFieldValue<string?>(Models.Metadata.Rom.WordConfidenceInterval81To90Key),
        WordConfidenceInterval91To100 = item.GetFieldValue<string?>(Models.Metadata.Rom.WordConfidenceInterval91To100Key),

        // Media-Related
        Album = item.GetFieldValue<string?>(Models.Metadata.Rom.AlbumKey),
        Artist = item.GetFieldValue<string?>(Models.Metadata.Rom.ArtistKey),
        Bitrate = item.GetFieldValue<string?>(Models.Metadata.Rom.BitrateKey),
        Creator = item.GetFieldValue<string?>(Models.Metadata.Rom.CreatorKey),
        Height = item.GetFieldValue<string?>(Models.Metadata.Rom.HeightKey),
        Length = item.GetFieldValue<string?>(Models.Metadata.Rom.LengthKey),
        PreviewImage = item.GetFieldValue<string?>(Models.Metadata.Rom.PreviewImageKey),
        Rotation = item.GetFieldValue<string?>(Models.Metadata.Rom.RotationKey),
        Title = item.GetFieldValue<string?>(Models.Metadata.Rom.TitleKey),
        Track = item.GetFieldValue<string?>(Models.Metadata.Rom.TrackKey),
        Width = item.GetFieldValue<string?>(Models.Metadata.Rom.WidthKey),
    };

    // The date is only written when it parses as an integer; the value emitted is the
    // parsed number re-serialized, not the raw text. TryParse returns false for null,
    // so no empty-string fallback is needed.
    string? date = item.GetFieldValue<string?>(Models.Metadata.Rom.DateKey);
    if (long.TryParse(date, System.Globalization.NumberStyles.Integer, invariant, out long lastModifiedTime))
        file.LastModifiedTime = lastModifiedTime.ToString(invariant);

    return file;
}
|
|
|
|
|
|
|
|
|
|
#endregion
|
|
|
|
|
}
|
|
|
|
|
}
|