Files
SabreTools/SabreTools.DatFiles/DatFileTool.cs

1704 lines
73 KiB
C#
Raw Normal View History

2024-11-12 21:12:06 -05:00
using System;
2020-12-10 14:47:38 -08:00
using System.Collections.Generic;
using System.IO;
using System.Linq;
2024-03-05 03:04:47 -05:00
#if NET40_OR_GREATER || NETCOREAPP
2020-12-10 14:47:38 -08:00
using System.Threading.Tasks;
2024-03-05 03:04:47 -05:00
#endif
using SabreTools.Core.Tools;
2025-01-08 17:11:52 -05:00
using SabreTools.DatFiles.Formats;
2020-12-10 14:47:38 -08:00
using SabreTools.DatItems;
using SabreTools.DatItems.Formats;
2020-12-10 14:47:38 -08:00
using SabreTools.IO;
2024-10-24 00:36:44 -04:00
using SabreTools.IO.Logging;
using SabreTools.Matching.Compare;
2020-12-10 10:39:39 -08:00
namespace SabreTools.DatFiles
2020-12-10 10:39:39 -08:00
{
/// <summary>
/// Helper methods for updating and converting DatFiles
/// </summary>
public static class DatFileTool
2020-12-10 10:39:39 -08:00
{
#region Logging
/// <summary>
/// Logging object
/// </summary>
2025-01-08 16:59:44 -05:00
private static readonly Logger _staticLogger = new();
2020-12-10 10:39:39 -08:00
#endregion
2020-12-10 14:47:38 -08:00
2025-01-08 17:11:52 -05:00
#region Creation
/// <summary>
/// Build the concrete DatFile implementation that corresponds to a requested format
/// </summary>
/// <param name="datFormat">Format of the DAT to be created, default is <see cref="DatFormat.Logiqx"/></param>
/// <param name="baseDat">DatFile passed to the constructor of the created type, default is null</param>
/// <returns>New DatFile of the format-specific type; any format without its own case yields a new-style Logiqx</returns>
public static DatFile CreateDatFile(DatFormat datFormat = DatFormat.Logiqx, DatFile? baseDat = null)
{
    switch (datFormat)
    {
        case DatFormat.ArchiveDotOrg:
            return new ArchiveDotOrg(baseDat);
        case DatFormat.AttractMode:
            return new AttractMode(baseDat);
        case DatFormat.ClrMamePro:
            return new ClrMamePro(baseDat);
        case DatFormat.CSV:
            return new CommaSeparatedValue(baseDat);
        case DatFormat.DOSCenter:
            return new DosCenter(baseDat);
        case DatFormat.EverdriveSMDB:
            return new EverdriveSMDB(baseDat);
        case DatFormat.Listrom:
            return new Listrom(baseDat);
        case DatFormat.Listxml:
            return new Listxml(baseDat);
        case DatFormat.Logiqx:
            return new Logiqx(baseDat, false);
        case DatFormat.LogiqxDeprecated:
            return new Logiqx(baseDat, true);
        case DatFormat.MissFile:
            return new Missfile(baseDat);
        case DatFormat.OfflineList:
            return new OfflineList(baseDat);
        case DatFormat.OpenMSX:
            return new OpenMSX(baseDat);
        case DatFormat.RedumpMD2:
            return new Md2File(baseDat);
        case DatFormat.RedumpMD4:
            return new Md4File(baseDat);
        case DatFormat.RedumpMD5:
            return new Md5File(baseDat);
        case DatFormat.RedumpSFV:
            return new SfvFile(baseDat);
        case DatFormat.RedumpSHA1:
            return new Sha1File(baseDat);
        case DatFormat.RedumpSHA256:
            return new Sha256File(baseDat);
        case DatFormat.RedumpSHA384:
            return new Sha384File(baseDat);
        case DatFormat.RedumpSHA512:
            return new Sha512File(baseDat);
        case DatFormat.RedumpSpamSum:
            return new SpamSumFile(baseDat);
        case DatFormat.RomCenter:
            return new RomCenter(baseDat);
        case DatFormat.SabreJSON:
            return new SabreJSON(baseDat);
        case DatFormat.SabreXML:
            return new SabreXML(baseDat);
        case DatFormat.SoftwareList:
            return new Formats.SoftwareList(baseDat);
        case DatFormat.SSV:
            return new SemicolonSeparatedValue(baseDat);
        case DatFormat.TSV:
            return new TabSeparatedValue(baseDat);

        // New-style Logiqx is the fallback for every other value
        default:
            return new Logiqx(baseDat, false);
    }
}
/// <summary>
/// Build a DatFile whose format and header both come from an existing DatHeader
/// </summary>
/// <param name="datHeader">Header that supplies the format (read from <see cref="DatHeader.DatFormatKey"/>) and is then set on the result</param>
/// <returns>New DatFile created for the header's format, with <paramref name="datHeader"/> set as its header</returns>
public static DatFile CreateDatFile(DatHeader datHeader)
{
    // The format stored in the header selects the concrete type
    DatFile created = CreateDatFile(datHeader.GetFieldValue<DatFormat>(DatHeader.DatFormatKey));
    created.SetHeader(datHeader);
    return created;
}
#endregion
#region Sorting and Merging
/// <summary>
/// Merge an arbitrary set of DatItems, folding each duplicate into the first matching item already kept
/// </summary>
/// <remarks>
/// Items that are not a Disk, File, Media, or Rom are skipped and do not appear in the output.
/// Rom and Disk items whose status is <see cref="ItemStatus.Nodump"/> are added without being
/// compared against the items kept so far. Kept items are updated in place when a duplicate
/// is folded into them.
/// </remarks>
/// <param name="items">List of DatItem objects representing the items to be merged</param>
/// <returns>A List of DatItem objects representing the merged items; empty when the input is null or empty</returns>
public static List<DatItem> Merge(List<DatItem>? items)
{
    // Check for null or blank inputs first
    if (items == null || items.Count == 0)
        return [];

    List<DatItem> output = [];
    int nodumpCount = 0;

    foreach (DatItem datItem in items)
    {
        // Anything other than a Disk, File, Media, or Rom is dropped from the result
        if (datItem is not Disk && datItem is not DatItems.Formats.File && datItem is not Media && datItem is not Rom)
            continue;

        // Nodump Roms and Disks are kept without any duplicate check
        bool isNodump =
            (datItem is Rom rom && rom.GetStringFieldValue(Models.Metadata.Rom.StatusKey).AsEnumValue<ItemStatus>() == ItemStatus.Nodump)
            || (datItem is Disk disk && disk.GetStringFieldValue(Models.Metadata.Disk.StatusKey).AsEnumValue<ItemStatus>() == ItemStatus.Nodump);
        if (isNodump)
        {
            output.Add(datItem);
            nodumpCount++;
            continue;
        }

        // If only nodumps have been kept so far, there is nothing worth comparing against
        if (output.Count == nodumpCount)
        {
            output.Add(datItem);
            continue;
        }

        // Find the first kept item this one duplicates, remembering the status so that
        // it does not have to be computed a second time for the match
        int pos = -1;
        DupeType dupetype = default;
        for (int i = 0; i < output.Count; i++)
        {
            DupeType status = datItem.GetDuplicateStatus(output[i]);
            if (status != 0x00)
            {
                pos = i;
                dupetype = status;
                break;
            }
        }

        // No duplicate means the item is kept on its own
        if (pos < 0)
        {
            output.Add(datItem);
            continue;
        }

        // The kept item is a reference into the output list, so every change below is
        // visible through the list without removing and re-inserting the element
        DatItem savedItem = output[pos];

        // Disks, File, Media, and Roms have more information to fill
        if (datItem is Disk diskItem && savedItem is Disk savedDisk)
            savedDisk.FillMissingInformation(diskItem);
        else if (datItem is DatItems.Formats.File fileItem && savedItem is DatItems.Formats.File savedFile)
            savedFile.FillMissingInformation(fileItem);
        else if (datItem is Media mediaItem && savedItem is Media savedMedia)
            savedMedia.FillMissingInformation(mediaItem);
        else if (datItem is Rom romItem && savedItem is Rom savedRom)
            savedRom.FillMissingInformation(romItem);

        // Set the duplicate type on the saved item
        savedItem.SetFieldValue<DupeType>(DatItem.DupeTypeKey, dupetype);

        // Get the sources associated with the items
        var savedSource = savedItem.GetFieldValue<Source?>(DatItem.SourceKey);
        var itemSource = datItem.GetFieldValue<Source?>(DatItem.SourceKey);

        // Get the machines associated with the items
        var savedMachine = savedItem.GetFieldValue<Machine>(DatItem.MachineKey);
        var itemMachine = datItem.GetFieldValue<Machine>(DatItem.MachineKey);

        // The lifted comparison is only true when both sources are present.
        // NOTE(review): the saved source is copied onto datItem, which is not added to the
        // output; confirm whether savedItem was meant to receive the lower-index source instead.
        if (itemSource?.Index < savedSource?.Index)
        {
            datItem.SetFieldValue<Source?>(DatItem.SourceKey, savedSource.Clone() as Source);
            savedItem.CopyMachineInformation(datItem);
            savedItem.SetName(datItem.GetName());
        }

        // If the saved machine is a child of the current machine, use the current machine instead
        if (savedMachine?.GetStringFieldValue(Models.Metadata.Machine.CloneOfKey) == itemMachine?.GetStringFieldValue(Models.Metadata.Machine.NameKey)
            || savedMachine?.GetStringFieldValue(Models.Metadata.Machine.RomOfKey) == itemMachine?.GetStringFieldValue(Models.Metadata.Machine.NameKey))
        {
            savedItem.CopyMachineInformation(datItem);
            savedItem.SetName(datItem.GetName());
        }
    }

    return output;
}
/// <summary>
/// Sort a list of DatItem objects by machine name, item type, directory name, and file name (in order)
/// </summary>
/// <remarks>
/// Items that are equal on all four criteria are ordered by source index unless
/// <paramref name="norename"/> is set. The list is sorted in place.
/// </remarks>
/// <param name="items">List of DatItem objects representing the items to be sorted</param>
/// <param name="norename">True if files are not renamed, false otherwise</param>
/// <returns>Always true</returns>
public static bool Sort(ref List<DatItem> items, bool norename)
{
    // One comparer serves the whole sort instead of allocating one per comparison
    var nc = new NaturalComparer();
    items.Sort((x, y) => CompareDatItems(x, y, norename, nc));
    return true;
}

/// <summary>
/// Sort a list of item ID to DatItem mappings by machine name, item type, directory name, and file name (in order)
/// </summary>
/// <remarks>
/// Only the DatItem of each mapping takes part in the comparison; the ID is ignored.
/// The list is sorted in place.
/// </remarks>
/// <param name="mappings">List of item ID to DatItem mappings representing the items to be sorted</param>
/// <param name="norename">True if files are not renamed, false otherwise</param>
/// <returns>Always true</returns>
public static bool SortDB(ref List<KeyValuePair<long, DatItem>> mappings, bool norename)
{
    // TODO: Fix this since DB uses an external map for machines
    var nc = new NaturalComparer();
    mappings.Sort((x, y) => CompareDatItems(x.Value, y.Value, norename, nc));
    return true;
}

/// <summary>
/// Shared comparison used by <see cref="Sort"/> and <see cref="SortDB"/>
/// </summary>
/// <param name="x">First item to compare</param>
/// <param name="y">Second item to compare</param>
/// <param name="norename">True to tie-break on machine name, false to tie-break on source index</param>
/// <param name="nc">Comparer used for every string comparison</param>
/// <returns>Negative, zero, or positive ordering value; zero if any step of the comparison throws</returns>
private static int CompareDatItems(DatItem x, DatItem y, bool norename, NaturalComparer nc)
{
    try
    {
        // If machine names don't match
        string? xMachineName = x.GetFieldValue<Machine>(DatItem.MachineKey)?.GetStringFieldValue(Models.Metadata.Machine.NameKey);
        string? yMachineName = y.GetFieldValue<Machine>(DatItem.MachineKey)?.GetStringFieldValue(Models.Metadata.Machine.NameKey);
        if (xMachineName != yMachineName)
            return nc.Compare(xMachineName, yMachineName);

        // If types don't match
        string? xType = x.GetStringFieldValue(Models.Metadata.DatItem.TypeKey);
        string? yType = y.GetStringFieldValue(Models.Metadata.DatItem.TypeKey);
        if (xType != yType)
            return xType.AsEnumValue<ItemType>() - yType.AsEnumValue<ItemType>();

        // Both the directory and the file name come from the same sanitized item name
        string xSafeName = TextHelper.RemovePathUnsafeCharacters(x.GetName() ?? string.Empty);
        string ySafeName = TextHelper.RemovePathUnsafeCharacters(y.GetName() ?? string.Empty);

        // If directory names don't match
        string? xDirectoryName = Path.GetDirectoryName(xSafeName);
        string? yDirectoryName = Path.GetDirectoryName(ySafeName);
        if (xDirectoryName != yDirectoryName)
            return nc.Compare(xDirectoryName, yDirectoryName);

        // If item names don't match
        string? xName = Path.GetFileName(xSafeName);
        string? yName = Path.GetFileName(ySafeName);
        if (xName != yName)
            return nc.Compare(xName, yName);

        // Otherwise, compare on machine or source, depending on the flag;
        // a missing source on either side makes the difference null, which counts as equal
        int? xSourceIndex = x.GetFieldValue<Source?>(DatItem.SourceKey)?.Index;
        int? ySourceIndex = y.GetFieldValue<Source?>(DatItem.SourceKey)?.Index;
        return norename
            ? nc.Compare(xMachineName, yMachineName)
            : (xSourceIndex - ySourceIndex) ?? 0;
    }
    catch
    {
        // Deliberately best-effort: items that cannot be compared are treated as equal
        return 0;
    }
}
#endregion
#region SuperDAT
/// <summary>
/// Apply SuperDAT naming logic to a merged DatFile
/// </summary>
/// <remarks>
/// Every item that has both a source and a machine gets its machine renamed via
/// <see cref="BuildSuperDatMachineName"/>; each bucket is then removed and rebuilt from the
/// renamed items. Items without a source or machine are not added back.
/// </remarks>
/// <param name="datFile">Current DatFile object to run operations on</param>
/// <param name="inputs">List of inputs to use for renaming, indexed by each item's source index</param>
public static void ApplySuperDAT(DatFile datFile, List<ParentablePath> inputs)
{
#if NET452_OR_GREATER || NETCOREAPP
    Parallel.ForEach(datFile.Items.SortedKeys, Core.Globals.ParallelOptions, key =>
#elif NET40_OR_GREATER
    Parallel.ForEach(datFile.Items.SortedKeys, key =>
#else
    foreach (var key in datFile.Items.SortedKeys)
#endif
    {
        List<DatItem>? items = datFile.GetItemsForBucket(key);
        if (items != null)
        {
            List<DatItem> newItems = [];
            foreach (DatItem item in items)
            {
                var source = item.GetFieldValue<Source?>(DatItem.SourceKey);
                if (source == null)
                    continue;

                ParentablePath input = inputs[source.Index];

                var machine = item.GetFieldValue<Machine>(DatItem.MachineKey);
                if (machine == null)
                    continue;

                // NOTE(review): the machine is renamed in place; if several items share one
                // Machine instance the prefix would be applied once per item - confirm
                machine.SetFieldValue<string?>(Models.Metadata.Machine.NameKey,
                    BuildSuperDatMachineName(input, machine.GetStringFieldValue(Models.Metadata.Machine.NameKey)));

                newItems.Add(item);
            }

            // Rebuild the bucket from the renamed items
            datFile.RemoveBucket(key);
            newItems.ForEach(renamed => datFile.AddItem(renamed, statsOnly: false));
        }
#if NET40_OR_GREATER || NETCOREAPP
    });
#else
    }
#endif
}

/// <summary>
/// Apply SuperDAT naming logic to a merged DatFile
/// </summary>
/// <remarks>
/// Every item whose source and machine can both be looked up through ItemsDB gets its
/// machine renamed via <see cref="BuildSuperDatMachineName"/>.
/// </remarks>
/// <param name="datFile">Current DatFile object to run operations on</param>
/// <param name="inputs">List of inputs to use for renaming, indexed by each item's source index</param>
public static void ApplySuperDATDB(DatFile datFile, List<ParentablePath> inputs)
{
    // Work from a copy of the keys
    List<string> keys = [.. datFile.ItemsDB.SortedKeys];
#if NET452_OR_GREATER || NETCOREAPP
    Parallel.ForEach(keys, Core.Globals.ParallelOptions, key =>
#elif NET40_OR_GREATER
    Parallel.ForEach(keys, key =>
#else
    foreach (var key in keys)
#endif
    {
        var items = datFile.GetItemsForBucketDB(key);
        if (items != null)
        {
            foreach (var item in items)
            {
                var source = datFile.ItemsDB.GetSourceForItem(item.Key);
                if (source.Value == null)
                    continue;

                var machine = datFile.ItemsDB.GetMachineForItem(item.Key);
                if (machine.Value == null)
                    continue;

                // NOTE(review): if one machine is returned for several items, its name is
                // prefixed once per item - confirm against the ItemsDB machine mapping
                machine.Value.SetFieldValue<string?>(Models.Metadata.Machine.NameKey,
                    BuildSuperDatMachineName(inputs[source.Value.Index], machine.Value.GetStringFieldValue(Models.Metadata.Machine.NameKey)));
            }
        }
#if NET40_OR_GREATER || NETCOREAPP
    });
#else
    }
#endif
}

/// <summary>
/// Build the SuperDAT machine name for an item that originated from the given input
/// </summary>
/// <param name="input">Input path pair; the parent path is stripped from the front of the current path</param>
/// <param name="machineName">Existing machine name, placed last in the result</param>
/// <returns>
/// Directory of the stripped path, the stripped path's file name without extension, and the
/// existing machine name, joined by the platform directory separator
/// </returns>
private static string BuildSuperDatMachineName(ParentablePath input, string? machineName)
{
    string filename = input.CurrentPath;
    string rootpath = input.ParentPath ?? string.Empty;

    // Compare the final character directly: an ordinal check that behaves the same on
    // every target framework, unlike the culture-sensitive string overload of EndsWith
    if (rootpath.Length > 0)
    {
        char last = rootpath[rootpath.Length - 1];
        if (last != Path.DirectorySeparatorChar && last != Path.AltDirectorySeparatorChar)
            rootpath += Path.DirectorySeparatorChar.ToString();
    }

    // NOTE(review): assumes the current path begins with the parent path; Remove throws
    // ArgumentOutOfRangeException when the parent path (plus separator) is longer
    filename = filename.Remove(0, rootpath.Length);

    return Path.GetDirectoryName(filename)
        + Path.DirectorySeparatorChar
        + Path.GetFileNameWithoutExtension(filename)
        + Path.DirectorySeparatorChar
        + machineName;
}
#endregion
#region Replacement
2020-12-10 14:47:38 -08:00
/// <summary>
/// Replace item values from the base set represented by the current DAT
/// </summary>
/// <remarks>
/// Both DATs are re-bucketed (by CRC for item fields, by machine for machine fields) and the
/// base DAT is deduplicated. Each bucket of <paramref name="intDat"/> is then rebuilt from
/// clones of its items with the requested fields replaced.
/// </remarks>
/// <param name="datFile">Current DatFile object to use for updating</param>
/// <param name="intDat">DatFile to replace the values in</param>
/// <param name="machineFieldNames">List of machine field names representing what should be updated</param>
/// <param name="itemFieldNames">List of item field names representing what should be updated</param>
/// <param name="onlySame">True if descriptions should only be replaced if the game name is the same, false otherwise</param>
public static void BaseReplace(
    DatFile datFile,
    DatFile intDat,
    List<string> machineFieldNames,
    Dictionary<string, List<string>> itemFieldNames,
    bool onlySame)
{
    InternalStopwatch watch = new($"Replacing items in '{intDat.Header.GetStringFieldValue(DatHeader.FileNameKey)}' from the base DAT");

    // If we are matching based on DatItem fields of any sort
    if (itemFieldNames.Count > 0)
    {
        // For comparison's sake, we want to use CRC as the base bucketing
        datFile.BucketBy(ItemKey.CRC);
        datFile.Deduplicate(DedupeType.Full);
        intDat.BucketBy(ItemKey.CRC);

        // Then we do a hashwise comparison against the base DAT
#if NET452_OR_GREATER || NETCOREAPP
        Parallel.ForEach(intDat.Items.SortedKeys, Core.Globals.ParallelOptions, key =>
#elif NET40_OR_GREATER
        Parallel.ForEach(intDat.Items.SortedKeys, key =>
#else
        foreach (var key in intDat.Items.SortedKeys)
#endif
        {
            List<DatItem>? datItems = intDat.GetItemsForBucket(key);
            if (datItems != null)
            {
                List<DatItem> newDatItems = [];
                foreach (DatItem datItem in datItems)
                {
                    List<DatItem> dupes = datFile.GetDuplicates(datItem, sorted: true);
                    if (datItem.Clone() is not DatItem newDatItem)
                        continue;

                    // Replace fields from the first duplicate, if we have one
                    if (dupes.Count > 0)
                        Replacer.ReplaceFields(newDatItem, dupes[0], itemFieldNames);

                    newDatItems.Add(newDatItem);
                }

                // Now add the new list to the key
                intDat.RemoveBucket(key);
                newDatItems.ForEach(replaced => intDat.AddItem(replaced, statsOnly: false));
            }
#if NET40_OR_GREATER || NETCOREAPP
        });
#else
        }
#endif
    }

    // If we are matching based on Machine fields of any sort
    if (machineFieldNames.Count > 0)
    {
        // For comparison's sake, we want to use Machine Name as the base bucketing
        datFile.BucketBy(ItemKey.Machine);
        datFile.Deduplicate(DedupeType.Full);
        intDat.BucketBy(ItemKey.Machine);

        // Then we do a namewise comparison against the base DAT
#if NET452_OR_GREATER || NETCOREAPP
        Parallel.ForEach(intDat.Items.SortedKeys, Core.Globals.ParallelOptions, key =>
#elif NET40_OR_GREATER
        Parallel.ForEach(intDat.Items.SortedKeys, key =>
#else
        foreach (var key in intDat.Items.SortedKeys)
#endif
        {
            List<DatItem>? datItems = intDat.GetItemsForBucket(key);
            if (datItems != null)
            {
                // The base machine is the same for every item in this bucket, so look it
                // up once; a missing or empty base bucket leaves it null
                List<DatItem>? baseItems = datFile.GetItemsForBucket(key);
                var baseMachine = baseItems != null && baseItems.Count > 0
                    ? baseItems[0].GetFieldValue<Machine>(DatItem.MachineKey)
                    : null;

                List<DatItem> newDatItems = [];
                foreach (DatItem datItem in datItems)
                {
                    if (datItem.Clone() is not DatItem newDatItem)
                        continue;

                    // Only replace when both machines are actually present
                    var newMachine = newDatItem.GetFieldValue<Machine>(DatItem.MachineKey);
                    if (baseMachine != null && newMachine != null)
                        Replacer.ReplaceFields(newMachine, baseMachine, machineFieldNames, onlySame);

                    newDatItems.Add(newDatItem);
                }

                // Now add the new list to the key
                intDat.RemoveBucket(key);
                newDatItems.ForEach(replaced => intDat.AddItem(replaced, statsOnly: false));
            }
#if NET40_OR_GREATER || NETCOREAPP
        });
#else
        }
#endif
    }

    watch.Stop();
}
2024-03-20 00:36:47 -04:00
/// <summary>
/// Replace item values from the base set represented by the current DAT
/// </summary>
/// <remarks>
/// Both DATs are re-bucketed (by CRC for item fields, by machine for machine fields) and the
/// base DAT is deduplicated. Fields are replaced directly on the items and machines that
/// the ItemsDB lookups of <paramref name="intDat"/> return.
/// </remarks>
/// <param name="datFile">Current DatFile object to use for updating</param>
/// <param name="intDat">DatFile to replace the values in</param>
/// <param name="machineFieldNames">List of machine field names representing what should be updated</param>
/// <param name="itemFieldNames">List of item field names representing what should be updated</param>
/// <param name="onlySame">True if descriptions should only be replaced if the game name is the same, false otherwise</param>
public static void BaseReplaceDB(
    DatFile datFile,
    DatFile intDat,
    List<string> machineFieldNames,
    Dictionary<string, List<string>> itemFieldNames,
    bool onlySame)
{
    InternalStopwatch watch = new($"Replacing items in '{intDat.Header.GetStringFieldValue(DatHeader.FileNameKey)}' from the base DAT");

    // If we are matching based on DatItem fields of any sort
    if (itemFieldNames.Count > 0)
    {
        // For comparison's sake, we want to use CRC as the base bucketing
        datFile.BucketBy(ItemKey.CRC);
        datFile.Deduplicate(DedupeType.Full);
        intDat.BucketBy(ItemKey.CRC);

        // Then we do a hashwise comparison against the base DAT
#if NET452_OR_GREATER || NETCOREAPP
        Parallel.ForEach(intDat.ItemsDB.SortedKeys, Core.Globals.ParallelOptions, key =>
#elif NET40_OR_GREATER
        Parallel.ForEach(intDat.ItemsDB.SortedKeys, key =>
#else
        foreach (var key in intDat.ItemsDB.SortedKeys)
#endif
        {
            var datItems = intDat.GetItemsForBucketDB(key);
            if (datItems != null)
            {
                foreach (var datItem in datItems)
                {
                    // Fields are replaced on the item itself, so no clone is needed
                    var dupes = datFile.GetDuplicatesDB(datItem, sorted: true);

                    // Replace fields from the first duplicate, if we have one
                    if (dupes.Count > 0)
                        Replacer.ReplaceFields(datItem.Value, dupes.First().Value, itemFieldNames);
                }
            }
#if NET40_OR_GREATER || NETCOREAPP
        });
#else
        }
#endif
    }

    // If we are matching based on Machine fields of any sort
    if (machineFieldNames.Count > 0)
    {
        // For comparison's sake, we want to use Machine Name as the base bucketing
        datFile.BucketBy(ItemKey.Machine);
        datFile.Deduplicate(DedupeType.Full);
        intDat.BucketBy(ItemKey.Machine);

        // Then we do a namewise comparison against the base DAT
#if NET452_OR_GREATER || NETCOREAPP
        Parallel.ForEach(intDat.ItemsDB.SortedKeys, Core.Globals.ParallelOptions, key =>
#elif NET40_OR_GREATER
        Parallel.ForEach(intDat.ItemsDB.SortedKeys, key =>
#else
        foreach (var key in intDat.ItemsDB.SortedKeys)
#endif
        {
            var datItems = intDat.GetItemsForBucketDB(key);

            // The base bucket does not change per item, so fetch it once; when the base DAT
            // has nothing under this key there is no machine to copy from, and calling
            // First() on it would throw
            var baseItems = datFile.GetItemsForBucketDB(key);
            if (datItems != null && baseItems != null && baseItems.Any())
            {
                var datMachine = datFile.ItemsDB.GetMachineForItem(baseItems.First().Key);
                if (datMachine.Value != null)
                {
                    foreach (var datItem in datItems)
                    {
                        var intMachine = intDat.ItemsDB.GetMachineForItem(datItem.Key);
                        if (intMachine.Value != null)
                            Replacer.ReplaceFields(intMachine.Value, datMachine.Value, machineFieldNames, onlySame);
                    }
                }
            }
#if NET40_OR_GREATER || NETCOREAPP
        });
#else
        }
#endif
    }

    watch.Stop();
}
#endregion
#region Diffing
2020-12-10 14:47:38 -08:00
/// <summary>
/// Output diffs against a base set represented by the current DAT
/// </summary>
/// <remarks>
/// When diffing by games, a bucket is removed from <paramref name="intDat"/> only if the base
/// DAT has a bucket under the same key with the same number of items and containing every
/// one of them. When diffing by hashes, each bucket is rebuilt from only the items for which
/// the base DAT reports no duplicates.
/// </remarks>
/// <param name="datFile">Current DatFile object to use for updating</param>
/// <param name="intDat">DatFile to replace the values in</param>
/// <param name="useGames">True to diff using games, false to use hashes</param>
public static void DiffAgainst(DatFile datFile, DatFile intDat, bool useGames)
{
    InternalStopwatch watch = new($"Comparing '{intDat.Header.GetStringFieldValue(DatHeader.FileNameKey)}' to base DAT");

    // For comparison's sake, we want to use a matching bucketing on the DAT being diffed.
    // NOTE(review): the base DAT is not bucketed in this method; the lookups below
    // presumably rely on the caller having bucketed it the same way - confirm
    if (useGames)
    {
        intDat.BucketBy(ItemKey.Machine);
    }
    else
    {
        intDat.BucketBy(ItemKey.CRC);
        intDat.Deduplicate(DedupeType.Full);
    }

    // Then we compare against the base DAT
#if NET452_OR_GREATER || NETCOREAPP
    Parallel.ForEach(intDat.Items.SortedKeys, Core.Globals.ParallelOptions, key =>
#elif NET40_OR_GREATER
    Parallel.ForEach(intDat.Items.SortedKeys, key =>
#else
    foreach (var key in intDat.Items.SortedKeys)
#endif
    {
        // Game Against uses game names
        if (useGames)
        {
            // A missing or empty bucket is kept as-is
            List<DatItem>? intList = intDat.GetItemsForBucket(key);
            if (intList != null && intList.Count > 0)
            {
                // The bucket is also kept if the base DAT lacks the key or holds a
                // different number of items; equal counts imply the base is non-empty
                List<DatItem>? list = datFile.GetItemsForBucket(key);
                if (list != null && list.Count == intList.Count)
                {
                    // Otherwise, every item has to be present in the base bucket
                    bool exactMatch = true;
                    foreach (DatItem item in intList)
                    {
                        // TODO: Make this granular to name as well
                        if (!list.Contains(item))
                        {
                            exactMatch = false;
                            break;
                        }
                    }

                    // If we have an exact match, remove the game
                    if (exactMatch)
                        intDat.RemoveBucket(key);
                }
            }
        }

        // Standard Against uses hashes
        else
        {
            List<DatItem>? datItems = intDat.GetItemsForBucket(key);
            if (datItems != null)
            {
                // Keep only the items the base DAT has no duplicate of
                List<DatItem> keepDatItems = [];
                foreach (DatItem datItem in datItems)
                {
                    if (!datFile.HasDuplicates(datItem, true))
                        keepDatItems.Add(datItem);
                }

                // Now add the new list to the key
                intDat.RemoveBucket(key);
                keepDatItems.ForEach(kept => intDat.AddItem(kept, statsOnly: false));
            }
        }
#if NET40_OR_GREATER || NETCOREAPP
    });
#else
    }
#endif

    watch.Stop();
}
/// <summary>
/// Output cascading diffs
/// </summary>
/// <remarks>
/// One output DatFile is created per header, in header order. The position of each header is
/// passed as the source index to FillWithSourceIndex and FillWithSourceIndexDB.
/// </remarks>
/// <param name="datFile">Current DatFile object to use for updating; it is re-bucketed by CRC</param>
/// <param name="datHeaders">Headers from which the output DatFiles are created</param>
/// <returns>List of DatFiles representing the individually indexed items</returns>
public static List<DatFile> DiffCascade(DatFile datFile, List<DatHeader> datHeaders)
{
    // Ensure the current DatFile is sorted optimally
    datFile.BucketBy(ItemKey.CRC);

    InternalStopwatch watch = new("Initializing and filling all output DATs");

    // Each slot is written by exactly one iteration, keyed by its header position
    DatFile[] filled = new DatFile[datHeaders.Count];
#if NET452_OR_GREATER || NETCOREAPP
    Parallel.For(0, datHeaders.Count, Core.Globals.ParallelOptions, index =>
#elif NET40_OR_GREATER
    Parallel.For(0, datHeaders.Count, index =>
#else
    for (int index = 0; index < datHeaders.Count; index++)
#endif
    {
        DatFile diffData = CreateDatFile(datHeaders[index]);
        diffData.ResetDictionary();
        FillWithSourceIndex(datFile, diffData, index);
        FillWithSourceIndexDB(datFile, diffData, index);
        filled[index] = diffData;
#if NET40_OR_GREATER || NETCOREAPP
    });
#else
    }
#endif

    List<DatFile> outDats = [.. filled];
    watch.Stop();
    return outDats;
}
/// <summary>
/// Output duplicate item diff
/// </summary>
/// <param name="datFile">Current DatFile object to use for updating</param>
/// <param name="inputs">List of input paths to write out from; each is wrapped in a ParentablePath</param>
/// <returns>Result of the ParentablePath-based overload for the wrapped inputs</returns>
public static DatFile DiffDuplicates(DatFile datFile, List<string> inputs)
{
    // Wrap every raw path, preserving order, then defer to the ParentablePath overload
    List<ParentablePath> wrapped = new(inputs.Count);
    foreach (string input in inputs)
    {
        wrapped.Add(new ParentablePath(input));
    }

    // A DB-backed alternative exists as DiffDuplicatesDB(datFile, paths) but is not used here
    return DiffDuplicates(datFile, wrapped);
}
/// <summary>
/// Output duplicate item diff
/// </summary>
/// <param name="datFile">Current DatFile object to use for updating</param>
/// <param name="inputs">List of inputs to write out from; indexed by each item's source index</param>
/// <returns>
/// New DatFile holding a clone of every item flagged as an external duplicate. When the
/// item has a source, the clone's machine name gets the source file name appended.
/// </returns>
/// <remarks>
/// Missing file name, name, and description values on <paramref name="datFile"/> are
/// set to "All DATs" as a side effect.
/// </remarks>
public static DatFile DiffDuplicates(DatFile datFile, List<ParentablePath> inputs)
{
    InternalStopwatch watch = new("Initializing duplicate DAT");

    // Header fields that receive a default value and then the output suffix
    string[] headerKeys =
    [
        DatHeader.FileNameKey,
        Models.Metadata.Header.NameKey,
        Models.Metadata.Header.DescriptionKey,
    ];

    // Fill in any information not in the base DAT
    foreach (string headerKey in headerKeys)
    {
        if (string.IsNullOrEmpty(datFile.Header.GetStringFieldValue(headerKey)))
            datFile.Header.SetFieldValue<string?>(headerKey, "All DATs");
    }

    // Create the output DAT from the base header and mark it as the duplicates set
    string post = " (Duplicates)";
    DatFile dupeData = CreateDatFile(datFile.Header);
    foreach (string headerKey in headerKeys)
    {
        dupeData.Header.SetFieldValue<string?>(headerKey, dupeData.Header.GetStringFieldValue(headerKey) + post);
    }

    dupeData.ResetDictionary();

    watch.Stop();

    // Now, loop through the dictionary and populate the correct DATs
    watch.Start("Populating duplicate DAT");

#if NET452_OR_GREATER || NETCOREAPP
    Parallel.ForEach(datFile.Items.SortedKeys, Core.Globals.ParallelOptions, key => AddExternalDuplicates(key));
#elif NET40_OR_GREATER
    Parallel.ForEach(datFile.Items.SortedKeys, key => AddExternalDuplicates(key));
#else
    foreach (var key in datFile.Items.SortedKeys)
    {
        AddExternalDuplicates(key);
    }
#endif

    watch.Stop();

    return dupeData;

    // Copies every external duplicate found in a single bucket into the output DAT
    void AddExternalDuplicates(string key)
    {
        List<DatItem> items = Merge(datFile.GetItemsForBucket(key));

        // If the rom list is empty or null, just skip it
        if (items == null || items.Count == 0)
            return;

        // Loop through and add the items correctly
        foreach (DatItem item in items)
        {
            var dupeType = item.GetFieldValue<DupeType>(DatItem.DupeTypeKey);

            // Enum.HasFlag is not available on the oldest targets
#if NET20 || NET35
            bool isExternal = (dupeType & DupeType.External) != 0;
#else
            bool isExternal = dupeType.HasFlag(DupeType.External);
#endif
            if (!isExternal)
                continue;

            if (item.Clone() is not DatItem newrom)
                continue;

            // Tag the machine name with the file the item came from
            var source = item.GetFieldValue<Source?>(DatItem.SourceKey);
            if (source != null)
            {
                var machine = newrom.GetFieldValue<Machine>(DatItem.MachineKey)!;
                string? machineName = machine.GetStringFieldValue(Models.Metadata.Machine.NameKey);
                string? sourceName = Path.GetFileNameWithoutExtension(inputs[source.Index].CurrentPath);
                machine.SetFieldValue<string?>(Models.Metadata.Machine.NameKey, machineName + $" ({sourceName})");
            }

            dupeData.AddItem(newrom, statsOnly: false);
        }
    }
}
2024-03-20 00:36:47 -04:00
/// <summary>
/// Output duplicate item diff
/// </summary>
/// <param name="datFile">Current DatFile object to use for updating</param>
/// <param name="inputs">List of inputs to write out from; indexed by each item's source index</param>
/// <returns>
/// New DatFile holding every item flagged as an external duplicate, each attached to a
/// machine whose name has the source file name appended
/// </returns>
/// <remarks>
/// Missing file name, name, and description values on <paramref name="datFile"/> are
/// set to "All DATs" as a side effect.
/// </remarks>
public static DatFile DiffDuplicatesDB(DatFile datFile, List<ParentablePath> inputs)
{
    var watch = new InternalStopwatch("Initializing duplicate DAT");

    // Header fields that receive a default value and then the output suffix
    string[] headerKeys =
    [
        DatHeader.FileNameKey,
        Models.Metadata.Header.NameKey,
        Models.Metadata.Header.DescriptionKey,
    ];

    // Fill in any information not in the base DAT
    foreach (string headerKey in headerKeys)
    {
        if (string.IsNullOrEmpty(datFile.Header.GetStringFieldValue(headerKey)))
            datFile.Header.SetFieldValue<string?>(headerKey, "All DATs");
    }

    // Create the output DAT from the base header and mark it as the duplicates set
    string post = " (Duplicates)";
    DatFile dupeData = CreateDatFile(datFile.Header);
    foreach (string headerKey in headerKeys)
    {
        dupeData.Header.SetFieldValue<string?>(headerKey, dupeData.Header.GetStringFieldValue(headerKey) + post);
    }

    dupeData.ResetDictionary();

    watch.Stop();

    // Now, loop through the dictionary and populate the correct DATs
    watch.Start("Populating duplicate DAT");

    // Get all current items, machines, and mappings
    var datItems = datFile.ItemsDB.GetItems();
    var machines = datFile.GetMachinesDB();
    var sources = datFile.ItemsDB.GetSources();
    var itemMachineMappings = datFile.ItemsDB.GetItemMachineMappings();
    var itemSourceMappings = datFile.ItemsDB.GetItemSourceMappings();

    // Create mapping from old source index to new source index
    var sourceRemapping = new Dictionary<long, long>();

    // Loop through and add all sources
    foreach (var source in sources)
    {
        long newSourceIndex = dupeData.AddSourceDB(source.Value);
        sourceRemapping[source.Key] = newSourceIndex;
    }

    // Loop through and add all machines. The returned indices are not kept because
    // items are attached to source-specific machines that are resolved by name below.
    foreach (var machine in machines)
    {
        _ = dupeData.AddMachineDB(machine.Value);
    }

    // Serializes the find-or-create of renamed machines so that parallel iterations
    // cannot both miss the lookup and add the same machine twice
    object machineLock = new();

    // Loop through and add the items
#if NET452_OR_GREATER || NETCOREAPP
    Parallel.ForEach(datItems, Core.Globals.ParallelOptions, item =>
#elif NET40_OR_GREATER
    Parallel.ForEach(datItems, item =>
#else
    foreach (var item in datItems)
#endif
    {
        // Get the machine and source index for this item
        long machineIndex = itemMachineMappings[item.Key];
        long sourceIndex = itemSourceMappings[item.Key];

        var dupeType = item.Value.GetFieldValue<DupeType>(DatItem.DupeTypeKey);

        // Enum.HasFlag is not available on the oldest targets
#if NET20 || NET35
        bool isExternal = (dupeType & DupeType.External) != 0;
#else
        bool isExternal = dupeType.HasFlag(DupeType.External);
#endif

        // Only external duplicates are written out
        if (isExternal)
        {
            // Get the current source and machine
            var currentSource = sources[sourceIndex];
            string? currentMachineName = machines[machineIndex].GetStringFieldValue(Models.Metadata.Machine.NameKey);
            var currentMachine = datFile.ItemsDB.GetMachine(currentMachineName);
            if (currentMachine.Value != null)
            {
                // Get the source-specific machine
                string? renamedMachineName = $"{currentMachineName} ({Path.GetFileNameWithoutExtension(inputs[currentSource!.Index].CurrentPath)})";

                long renamedMachineIndex;
                lock (machineLock)
                {
                    // Look in the OUTPUT DAT: the index handed to AddItemDB must belong to
                    // dupeData, and previously created renamed machines only exist there
                    var renamedMachine = dupeData.ItemsDB.GetMachine(renamedMachineName);
                    if (renamedMachine.Value != null)
                    {
                        renamedMachineIndex = renamedMachine.Key;
                    }
                    else
                    {
                        var newMachine = currentMachine.Value.Clone() as Machine;
                        newMachine!.SetFieldValue<string?>(Models.Metadata.Machine.NameKey, renamedMachineName);
                        renamedMachineIndex = dupeData.AddMachineDB(newMachine!);
                    }
                }

                dupeData.AddItemDB(item.Value, renamedMachineIndex, sourceRemapping[sourceIndex], statsOnly: false);
            }
        }
#if NET40_OR_GREATER || NETCOREAPP
    });
#else
    }
#endif

    watch.Stop();

    return dupeData;
}
2020-12-10 14:47:38 -08:00
/// <summary>
/// Output non-cascading diffs
/// </summary>
/// <param name="datFile">Current DatFile object to use for updating</param>
/// <param name="inputs">List of input path strings to write out from</param>
/// <returns>Result of the <see cref="ParentablePath"/>-based overload for the wrapped inputs</returns>
public static List<DatFile> DiffIndividuals(DatFile datFile, List<string> inputs)
{
    // Wrap each raw path so the path-based overload can be reused
    var wrappedInputs = new List<ParentablePath>(inputs.Count);
    foreach (string input in inputs)
    {
        wrappedInputs.Add(new ParentablePath(input));
    }

    return DiffIndividuals(datFile, wrappedInputs);

    // DB-backed alternative, currently disabled:
    //return DiffIndividualsDB(datFile, wrappedInputs);
}
/// <summary>
/// Output non-cascading diffs
/// </summary>
/// <param name="datFile">Current DatFile object to use for updating</param>
/// <param name="inputs">List of inputs to write out from; one output DAT is created per entry</param>
/// <returns>
/// One DatFile per input, holding the items from that source that are flagged as
/// internal duplicates or carry no duplicate flag at all
/// </returns>
/// <remarks>
/// Missing file name, name, and description values on <paramref name="datFile"/> are
/// set to "All DATs" as a side effect.
/// </remarks>
public static List<DatFile> DiffIndividuals(DatFile datFile, List<ParentablePath> inputs)
{
    InternalStopwatch watch = new("Initializing all individual DATs");

    // Header fields that receive a default value and then the per-input suffix
    string[] headerKeys =
    [
        DatHeader.FileNameKey,
        Models.Metadata.Header.NameKey,
        Models.Metadata.Header.DescriptionKey,
    ];

    // Fill in any information not in the base DAT
    foreach (string headerKey in headerKeys)
    {
        if (string.IsNullOrEmpty(datFile.Header.GetStringFieldValue(headerKey)))
            datFile.Header.SetFieldValue<string?>(headerKey, "All DATs");
    }

    // Loop through each of the inputs and create a new output DAT for it
    DatFile[] outDatsArray = new DatFile[inputs.Count];
#if NET452_OR_GREATER || NETCOREAPP
    Parallel.For(0, inputs.Count, Core.Globals.ParallelOptions, j => InitializeOutput(j));
#elif NET40_OR_GREATER
    Parallel.For(0, inputs.Count, j => InitializeOutput(j));
#else
    for (int j = 0; j < inputs.Count; j++)
    {
        InitializeOutput(j);
    }
#endif

    // Create a list of DatFile objects representing individual output files
    var outDats = new List<DatFile>(outDatsArray);

    watch.Stop();

    // Now, loop through the dictionary and populate the correct DATs
    watch.Start("Populating all individual DATs");

#if NET452_OR_GREATER || NETCOREAPP
    Parallel.ForEach(datFile.Items.SortedKeys, Core.Globals.ParallelOptions, key => DistributeBucket(key));
#elif NET40_OR_GREATER
    Parallel.ForEach(datFile.Items.SortedKeys, key => DistributeBucket(key));
#else
    foreach (var key in datFile.Items.SortedKeys)
    {
        DistributeBucket(key);
    }
#endif

    watch.Stop();

    // Hand back a copy of the list
    return new List<DatFile>(outDats);

    // Builds the empty output DAT for the input at the given position
    void InitializeOutput(int j)
    {
        string innerpost = $" ({j} - {inputs[j].GetNormalizedFileName(true)} Only)";
        DatFile diffData = CreateDatFile(datFile.Header);
        foreach (string headerKey in headerKeys)
        {
            diffData.Header.SetFieldValue<string?>(headerKey, diffData.Header.GetStringFieldValue(headerKey) + innerpost);
        }

        diffData.ResetDictionary();
        outDatsArray[j] = diffData;
    }

    // Routes the qualifying items of one bucket to the output DAT of their source
    void DistributeBucket(string key)
    {
        List<DatItem> items = Merge(datFile.GetItemsForBucket(key));

        // If the rom list is empty or null, just skip it
        if (items == null || items.Count == 0)
            return;

        foreach (DatItem item in items)
        {
            // Items without a source cannot be assigned to an output
            var source = item.GetFieldValue<Source?>(DatItem.SourceKey);
            if (source == null)
                continue;

            var dupeType = item.GetFieldValue<DupeType>(DatItem.DupeTypeKey);

            // Enum.HasFlag is not available on the oldest targets
#if NET20 || NET35
            bool isInternal = (dupeType & DupeType.Internal) != 0;
#else
            bool isInternal = dupeType.HasFlag(DupeType.Internal);
#endif
            if (isInternal || dupeType == 0x00)
                outDats[source.Index].AddItem(item, statsOnly: false);
        }
    }
}
2024-03-20 00:36:47 -04:00
/// <summary>
/// Output non-cascading diffs
/// </summary>
/// <param name="datFile">Current DatFile object to use for updating</param>
/// <param name="inputs">List of inputs to write out from; one output DAT is created per entry</param>
/// <returns>
/// One DatFile per input, holding the items from that source that are flagged as
/// internal duplicates or carry no duplicate flag at all
/// </returns>
/// <remarks>
/// Missing file name, name, and description values on <paramref name="datFile"/> are
/// set to "All DATs" as a side effect.
/// </remarks>
public static List<DatFile> DiffIndividualsDB(DatFile datFile, List<ParentablePath> inputs)
{
    var watch = new InternalStopwatch("Initializing all individual DATs");

    // Header fields that receive a default value and then the per-input suffix
    string[] headerKeys =
    [
        DatHeader.FileNameKey,
        Models.Metadata.Header.NameKey,
        Models.Metadata.Header.DescriptionKey,
    ];

    // Fill in any information not in the base DAT
    foreach (string headerKey in headerKeys)
    {
        if (string.IsNullOrEmpty(datFile.Header.GetStringFieldValue(headerKey)))
            datFile.Header.SetFieldValue<string?>(headerKey, "All DATs");
    }

    // Loop through each of the inputs and create a new output DAT for it
    var outDatsArray = new DatFile[inputs.Count];
#if NET452_OR_GREATER || NETCOREAPP
    Parallel.For(0, inputs.Count, Core.Globals.ParallelOptions, j => InitializeOutput(j));
#elif NET40_OR_GREATER
    Parallel.For(0, inputs.Count, j => InitializeOutput(j));
#else
    for (int j = 0; j < inputs.Count; j++)
    {
        InitializeOutput(j);
    }
#endif

    // Create a list of DatFile objects representing individual output files
    var outDats = new List<DatFile>(outDatsArray);

    watch.Stop();

    // Now, loop through the dictionary and populate the correct DATs
    watch.Start("Populating all individual DATs");

    // Get all current items, machines, and mappings
    var datItems = datFile.ItemsDB.GetItems();
    var machines = datFile.GetMachinesDB();
    var sources = datFile.ItemsDB.GetSources();
    var itemMachineMappings = datFile.ItemsDB.GetItemMachineMappings();
    var itemSourceMappings = datFile.ItemsDB.GetItemSourceMappings();

    // Create mappings from old index to new index
    var machineRemapping = new Dictionary<long, long>();
    var sourceRemapping = new Dictionary<long, long>();

    // Add every source to every output. Only the index reported by the first output
    // is recorded and later reused for all outputs.
    // NOTE(review): this presumably relies on each output assigning the same index
    // for the same insertion order -- confirm against AddSourceDB.
    foreach (var source in sources)
    {
        sourceRemapping[source.Key] = outDats[0].AddSourceDB(source.Value);
        for (int other = 1; other < outDats.Count; other++)
        {
            _ = outDats[other].AddSourceDB(source.Value);
        }
    }

    // Add every machine to every output, recording the first output's index as above
    foreach (var machine in machines)
    {
        machineRemapping[machine.Key] = outDats[0].AddMachineDB(machine.Value);
        for (int other = 1; other < outDats.Count; other++)
        {
            _ = outDats[other].AddMachineDB(machine.Value);
        }
    }

    // Loop through and add the items
#if NET452_OR_GREATER || NETCOREAPP
    Parallel.ForEach(datItems, Core.Globals.ParallelOptions, item =>
#elif NET40_OR_GREATER
    Parallel.ForEach(datItems, item =>
#else
    foreach (var item in datItems)
#endif
    {
        // Get the machine and source index for this item
        long machineIndex = itemMachineMappings[item.Key];
        long sourceIndex = itemSourceMappings[item.Key];

        // Items whose source cannot be resolved are not written anywhere
        var source = datFile.ItemsDB.GetSource(sourceIndex);
        if (source != null)
        {
            var dupeType = item.Value.GetFieldValue<DupeType>(DatItem.DupeTypeKey);

            // Enum.HasFlag is not available on the oldest targets
#if NET20 || NET35
            bool isInternal = (dupeType & DupeType.Internal) != 0;
#else
            bool isInternal = dupeType.HasFlag(DupeType.Internal);
#endif
            if (isInternal || dupeType == 0x00)
                outDats[source.Index].AddItemDB(item.Value, machineRemapping[machineIndex], sourceRemapping[sourceIndex], statsOnly: false);
        }
#if NET40_OR_GREATER || NETCOREAPP
    });
#else
    }
#endif

    watch.Stop();

    // Hand back a copy of the list
    return new List<DatFile>(outDats);

    // Builds the empty output DAT for the input at the given position
    void InitializeOutput(int j)
    {
        string innerpost = $" ({j} - {inputs[j].GetNormalizedFileName(true)} Only)";
        DatFile diffData = CreateDatFile(datFile.Header);
        foreach (string headerKey in headerKeys)
        {
            diffData.Header.SetFieldValue<string?>(headerKey, diffData.Header.GetStringFieldValue(headerKey) + innerpost);
        }

        diffData.ResetDictionary();
        outDatsArray[j] = diffData;
    }
}
2020-12-10 14:47:38 -08:00
/// <summary>
/// Output non-duplicate item diff
/// </summary>
/// <param name="datFile">Current DatFile object to use for updating</param>
/// <param name="inputs">List of input path strings to write out from</param>
/// <returns>Result of the <see cref="ParentablePath"/>-based overload for the wrapped inputs</returns>
public static DatFile DiffNoDuplicates(DatFile datFile, List<string> inputs)
{
    // Wrap each raw path so the path-based overload can be reused
    var wrappedInputs = new List<ParentablePath>(inputs.Count);
    foreach (string input in inputs)
    {
        wrappedInputs.Add(new ParentablePath(input));
    }

    return DiffNoDuplicates(datFile, wrappedInputs);

    // DB-backed alternative, currently disabled:
    //return DiffNoDuplicatesDB(datFile, wrappedInputs);
}
/// <summary>
/// Output non-duplicate item diff
/// </summary>
/// <param name="datFile">Current DatFile object to use for updating</param>
/// <param name="inputs">List of inputs to write out from; indexed by each item's source index</param>
/// <returns>
/// New DatFile holding a clone of every item that is flagged as an internal duplicate or
/// carries no duplicate flag, with the source file name appended to its machine name
/// </returns>
/// <remarks>
/// Missing file name, name, and description values on <paramref name="datFile"/> are
/// set to "All DATs" as a side effect.
/// </remarks>
public static DatFile DiffNoDuplicates(DatFile datFile, List<ParentablePath> inputs)
{
    InternalStopwatch watch = new("Initializing no duplicate DAT");

    // Header fields that receive a default value and then the output suffix
    string[] headerKeys =
    [
        DatHeader.FileNameKey,
        Models.Metadata.Header.NameKey,
        Models.Metadata.Header.DescriptionKey,
    ];

    // Fill in any information not in the base DAT
    foreach (string headerKey in headerKeys)
    {
        if (string.IsNullOrEmpty(datFile.Header.GetStringFieldValue(headerKey)))
            datFile.Header.SetFieldValue<string?>(headerKey, "All DATs");
    }

    // Create the output DAT from the base header and mark it as the no-duplicates set
    string post = " (No Duplicates)";
    DatFile outerDiffData = CreateDatFile(datFile.Header);
    foreach (string headerKey in headerKeys)
    {
        outerDiffData.Header.SetFieldValue<string?>(headerKey, outerDiffData.Header.GetStringFieldValue(headerKey) + post);
    }

    outerDiffData.ResetDictionary();

    watch.Stop();

    // Now, loop through the dictionary and populate the correct DATs
    watch.Start("Populating no duplicate DAT");

#if NET452_OR_GREATER || NETCOREAPP
    Parallel.ForEach(datFile.Items.SortedKeys, Core.Globals.ParallelOptions, key => AddNonDuplicates(key));
#elif NET40_OR_GREATER
    Parallel.ForEach(datFile.Items.SortedKeys, key => AddNonDuplicates(key));
#else
    foreach (var key in datFile.Items.SortedKeys)
    {
        AddNonDuplicates(key);
    }
#endif

    watch.Stop();

    return outerDiffData;

    // Copies the qualifying items of a single bucket into the output DAT
    void AddNonDuplicates(string key)
    {
        List<DatItem> items = Merge(datFile.GetItemsForBucket(key));

        // If the rom list is empty or null, just skip it
        if (items == null || items.Count == 0)
            return;

        foreach (DatItem item in items)
        {
            var dupeType = item.GetFieldValue<DupeType>(DatItem.DupeTypeKey);

            // Enum.HasFlag is not available on the oldest targets
#if NET20 || NET35
            bool isInternal = (dupeType & DupeType.Internal) != 0;
#else
            bool isInternal = dupeType.HasFlag(DupeType.Internal);
#endif
            if (!isInternal && dupeType != 0x00)
                continue;

            if (item.Clone() is not DatItem newrom)
                continue;

            // The source is needed to pick the file name used for the machine suffix
            var source = newrom.GetFieldValue<Source?>(DatItem.SourceKey);
            if (source == null)
                continue;

            var machine = newrom.GetFieldValue<Machine>(DatItem.MachineKey)!;
            string? machineName = machine.GetStringFieldValue(Models.Metadata.Machine.NameKey);
            string? sourceName = Path.GetFileNameWithoutExtension(inputs[source.Index].CurrentPath);
            machine.SetFieldValue<string?>(Models.Metadata.Machine.NameKey, machineName + $" ({sourceName})");

            outerDiffData.AddItem(newrom, statsOnly: false);
        }
    }
}
2024-03-20 00:36:47 -04:00
/// <summary>
/// Output non-duplicate item diff
/// </summary>
/// <param name="datFile">Current DatFile object to use for updating</param>
/// <param name="inputs">List of inputs to write out from; indexed by each item's source index</param>
/// <returns>
/// New DatFile holding every item that is flagged as an internal duplicate or carries no
/// duplicate flag, each attached to a machine whose name has the source file name appended
/// </returns>
/// <remarks>
/// Missing file name, name, and description values on <paramref name="datFile"/> are
/// set to "All DATs" as a side effect.
/// </remarks>
public static DatFile DiffNoDuplicatesDB(DatFile datFile, List<ParentablePath> inputs)
{
    var watch = new InternalStopwatch("Initializing no duplicate DAT");

    // Header fields that receive a default value and then the output suffix
    string[] headerKeys =
    [
        DatHeader.FileNameKey,
        Models.Metadata.Header.NameKey,
        Models.Metadata.Header.DescriptionKey,
    ];

    // Fill in any information not in the base DAT
    foreach (string headerKey in headerKeys)
    {
        if (string.IsNullOrEmpty(datFile.Header.GetStringFieldValue(headerKey)))
            datFile.Header.SetFieldValue<string?>(headerKey, "All DATs");
    }

    // Create the output DAT from the base header and mark it as the no-duplicates set
    string post = " (No Duplicates)";
    DatFile outerDiffData = CreateDatFile(datFile.Header);
    foreach (string headerKey in headerKeys)
    {
        outerDiffData.Header.SetFieldValue<string?>(headerKey, outerDiffData.Header.GetStringFieldValue(headerKey) + post);
    }

    outerDiffData.ResetDictionary();

    watch.Stop();

    // Now, loop through the dictionary and populate the correct DATs
    watch.Start("Populating no duplicate DAT");

    // Get all current items, machines, and mappings
    var datItems = datFile.ItemsDB.GetItems();
    var machines = datFile.GetMachinesDB();
    var sources = datFile.ItemsDB.GetSources();
    var itemMachineMappings = datFile.ItemsDB.GetItemMachineMappings();
    var itemSourceMappings = datFile.ItemsDB.GetItemSourceMappings();

    // Create mapping from old source index to new source index
    var sourceRemapping = new Dictionary<long, long>();

    // Loop through and add all sources
    foreach (var source in sources)
    {
        long newSourceIndex = outerDiffData.AddSourceDB(source.Value);
        sourceRemapping[source.Key] = newSourceIndex;
    }

    // Loop through and add all machines. The returned indices are not kept because
    // items are attached to source-specific machines that are resolved by name below.
    foreach (var machine in machines)
    {
        _ = outerDiffData.AddMachineDB(machine.Value);
    }

    // Serializes the find-or-create of renamed machines so that parallel iterations
    // cannot both miss the lookup and add the same machine twice
    object machineLock = new();

    // Loop through and add the items
#if NET452_OR_GREATER || NETCOREAPP
    Parallel.ForEach(datItems, Core.Globals.ParallelOptions, item =>
#elif NET40_OR_GREATER
    Parallel.ForEach(datItems, item =>
#else
    foreach (var item in datItems)
#endif
    {
        // Get the machine and source index for this item
        long machineIndex = itemMachineMappings[item.Key];
        long sourceIndex = itemSourceMappings[item.Key];

        var dupeType = item.Value.GetFieldValue<DupeType>(DatItem.DupeTypeKey);

        // Enum.HasFlag is not available on the oldest targets
#if NET20 || NET35
        bool isInternal = (dupeType & DupeType.Internal) != 0;
#else
        bool isInternal = dupeType.HasFlag(DupeType.Internal);
#endif

        // Only internal duplicates and unflagged items are written out
        if (isInternal || dupeType == 0x00)
        {
            // Get the current source and machine
            var currentSource = sources[sourceIndex];
            string? currentMachineName = machines[machineIndex].GetStringFieldValue(Models.Metadata.Machine.NameKey);
            var currentMachine = datFile.ItemsDB.GetMachine(currentMachineName);
            if (currentMachine.Value != null)
            {
                // Get the source-specific machine
                string? renamedMachineName = $"{currentMachineName} ({Path.GetFileNameWithoutExtension(inputs[currentSource!.Index].CurrentPath)})";

                long renamedMachineIndex;
                lock (machineLock)
                {
                    // Look in the OUTPUT DAT: the index handed to AddItemDB must belong to
                    // outerDiffData, and previously created renamed machines only exist there
                    var renamedMachine = outerDiffData.ItemsDB.GetMachine(renamedMachineName);
                    if (renamedMachine.Value != null)
                    {
                        renamedMachineIndex = renamedMachine.Key;
                    }
                    else
                    {
                        var newMachine = currentMachine.Value.Clone() as Machine;
                        newMachine!.SetFieldValue<string?>(Models.Metadata.Machine.NameKey, renamedMachineName);
                        renamedMachineIndex = outerDiffData.AddMachineDB(newMachine);
                    }
                }

                outerDiffData.AddItemDB(item.Value, renamedMachineIndex, sourceRemapping[sourceIndex], statsOnly: false);
            }
        }
#if NET40_OR_GREATER || NETCOREAPP
    });
#else
    }
#endif

    watch.Stop();

    return outerDiffData;
}
#endregion
#region Population
2020-12-10 14:47:38 -08:00
/// <summary>
/// Populate from multiple paths while returning the individual headers
/// </summary>
/// <param name="datFile">Current DatFile object to use for updating</param>
/// <param name="inputs">Path strings of the DATs to parse</param>
/// <returns>List of DatHeader objects representing headers</returns>
public static List<DatHeader> PopulateUserData(DatFile datFile, List<string> inputs)
{
    // Wrap each raw path so the path-based overload can be reused
    var wrappedInputs = new List<ParentablePath>(inputs.Count);
    foreach (string input in inputs)
    {
        wrappedInputs.Add(new ParentablePath(input));
    }

    return PopulateUserData(datFile, wrappedInputs);
}
/// <summary>
/// Populate from multiple paths while returning the individual headers
/// </summary>
/// <param name="datFile">Current DatFile object to use for updating</param>
/// <param name="inputs">Paths to DATs to parse</param>
/// <returns>List of DatHeader objects representing headers, in input order</returns>
public static List<DatHeader> PopulateUserData(DatFile datFile, List<ParentablePath> inputs)
{
    DatFile[] datFiles = new DatFile[inputs.Count];
    InternalStopwatch watch = new("Processing individual DATs");

    // Parse all of the DATs into their own DatFiles in the array
#if NET452_OR_GREATER || NETCOREAPP
    Parallel.For(0, inputs.Count, Core.Globals.ParallelOptions, i => ParseInput(i));
#elif NET40_OR_GREATER
    Parallel.For(0, inputs.Count, i => ParseInput(i));
#else
    for (int i = 0; i < inputs.Count; i++)
    {
        ParseInput(i);
    }
#endif

    watch.Stop();

    // Fold every parsed DAT into the shared one, in input order
    watch.Start("Populating internal DAT");
    foreach (DatFile parsed in datFiles)
    {
        AddFromExisting(datFile, parsed, true);
        //AddFromExistingDB(datFile, parsed, true);
    }

    watch.Stop();

    // Collect the header of each parsed DAT
    var headers = new List<DatHeader>(datFiles.Length);
    foreach (DatFile parsed in datFiles)
    {
        headers.Add(parsed.Header);
    }

    return headers;

    // Parses the input at the given position into its own slot of the array
    void ParseInput(int index)
    {
        var input = inputs[index];
        _staticLogger.User($"Adding DAT: {input.CurrentPath}");

        // Store the new DAT before parsing, then parse into the stored instance
        datFiles[index] = CreateDatFile(datFile.Header.CloneFiltering());
        Parser.ParseInto(datFiles[index], input, index, keep: true);
    }
}
2024-02-28 22:54:56 -05:00
2020-12-10 14:47:38 -08:00
/// <summary>
/// Add items from another DatFile to the existing DatFile
/// </summary>
/// <param name="addTo">DatFile to add to</param>
/// <param name="addFrom">DatFile to add from</param>
/// <param name="delete">If items should be deleted from the source DatFile</param>
private static void AddFromExisting(DatFile addTo, DatFile addFrom, bool delete = false)
{
    // Walk every bucket of the source DAT
    foreach (string bucketKey in addFrom.Items.SortedKeys)
    {
        // Add everything from the bucket to the target DAT
        foreach (var bucketItem in addFrom.GetItemsForBucket(bucketKey))
        {
            addTo.AddItem(bucketItem, statsOnly: false);
        }

        // Now remove the bucket from the source DAT
        if (delete)
        {
            addFrom.RemoveBucket(bucketKey);
        }
    }

    // Now remove the file dictionary from the source DAT
    if (delete)
    {
        addFrom.ResetDictionary();
    }
}
2021-02-02 14:09:49 -08:00
2024-03-20 00:36:47 -04:00
/// <summary>
/// Add items from another DatFile to the existing DatFile
/// </summary>
/// <param name="addTo">DatFile to add to</param>
/// <param name="addFrom">DatFile to add from</param>
/// <param name="delete">If items should be deleted from the source DatFile</param>
private static void AddFromExistingDB(DatFile addTo, DatFile addFrom, bool delete = false)
{
    // Snapshot the source DAT: items, machines, sources, and the item mappings
    var sourceItems = addFrom.ItemsDB.GetItems();
    var sourceMachines = addFrom.GetMachinesDB();
    var sourceSources = addFrom.ItemsDB.GetSources();
    var machineByItem = addFrom.ItemsDB.GetItemMachineMappings();
    var sourceByItem = addFrom.ItemsDB.GetItemSourceMappings();

    // Old index -> index assigned by the target DAT
    var newMachineIndices = new Dictionary<long, long>();
    var newSourceIndices = new Dictionary<long, long>();

    // Register all sources with the target
    foreach (var entry in sourceSources)
    {
        newSourceIndices[entry.Key] = addTo.AddSourceDB(entry.Value);
    }

    // Register all machines with the target
    foreach (var entry in sourceMachines)
    {
        newMachineIndices[entry.Key] = addTo.AddMachineDB(entry.Value);
    }

    // Loop through and add the items
#if NET452_OR_GREATER || NETCOREAPP
    Parallel.ForEach(sourceItems, Core.Globals.ParallelOptions, item =>
#elif NET40_OR_GREATER
    Parallel.ForEach(sourceItems, item =>
#else
    foreach (var item in sourceItems)
#endif
    {
        // Translate the item's machine and source to the target's indices
        long oldMachineIndex = machineByItem[item.Key];
        long oldSourceIndex = sourceByItem[item.Key];
        addTo.AddItemDB(item.Value, newMachineIndices[oldMachineIndex], newSourceIndices[oldSourceIndex], statsOnly: false);

        // Now remove the item from the source DAT
        if (delete)
        {
            addFrom.ItemsDB.RemoveItem(item.Key);
        }
#if NET40_OR_GREATER || NETCOREAPP
    });
#else
    }
#endif

    // Now remove the file dictionary from the source DAT
    if (delete)
    {
        addFrom.ResetDictionary();
    }
}
2021-02-02 14:09:49 -08:00
/// <summary>
/// Copy every item tagged with a given source index ID into another DatFile
/// </summary>
/// <param name="datFile">Current DatFile object to read items from</param>
/// <param name="indexDat">DatFile that receives the matching items</param>
/// <param name="index">Source index ID an item must carry to be copied</param>
private static void FillWithSourceIndex(DatFile datFile, DatFile indexDat, int index)
{
    // Walk every bucket of the input and forward the matching items
#if NET452_OR_GREATER || NETCOREAPP
    Parallel.ForEach(datFile.Items.SortedKeys, Core.Globals.ParallelOptions, bucketKey =>
#elif NET40_OR_GREATER
    Parallel.ForEach(datFile.Items.SortedKeys, bucketKey =>
#else
    foreach (var bucketKey in datFile.Items.SortedKeys)
#endif
    {
        List<DatItem> merged = Merge(datFile.GetItemsForBucket(bucketKey));

        // Only buckets that actually contain items need to be inspected
        if (merged != null && merged.Count > 0)
        {
            foreach (DatItem candidate in merged)
            {
                // Items without a source, or from a different source, are ignored
                var itemSource = candidate.GetFieldValue<Source?>(DatItem.SourceKey);
                if (itemSource == null || itemSource.Index != index)
                    continue;

                indexDat.AddItem(candidate, statsOnly: false);
            }
        }
#if NET40_OR_GREATER || NETCOREAPP
    });
#else
    }
#endif
}
/// <summary>
/// Copy every DB-backed item tagged with a given source index ID into another DatFile
/// </summary>
/// <param name="datFile">Current DatFile object to read items from</param>
/// <param name="indexDat">DatFile that receives the matching items</param>
/// <param name="index">Source index ID an item must carry to be copied</param>
/// <remarks>
/// All sources and machines of <paramref name="datFile"/> are added to
/// <paramref name="indexDat"/> regardless of whether any copied item uses them.
/// </remarks>
private static void FillWithSourceIndexDB(DatFile datFile, DatFile indexDat, int index)
{
    // Pull the items, machines, sources, and item link tables from the input
    var allItems = datFile.ItemsDB.GetItems();
    var allMachines = datFile.GetMachinesDB();
    var allSources = datFile.ItemsDB.GetSources();
    var machineByItem = datFile.ItemsDB.GetItemMachineMappings();
    var sourceByItem = datFile.ItemsDB.GetItemSourceMappings();

    // Old index => index assigned by the output DatFile
    var machineRemapping = new Dictionary<long, long>();
    var sourceRemapping = new Dictionary<long, long>();

    // Register every source with the output and remember its new index
    foreach (var sourceEntry in allSources)
    {
        sourceRemapping[sourceEntry.Key] = indexDat.AddSourceDB(sourceEntry.Value);
    }

    // Register every machine with the output and remember its new index
    foreach (var machineEntry in allMachines)
    {
        machineRemapping[machineEntry.Key] = indexDat.AddMachineDB(machineEntry.Value);
    }

    // Forward the items whose source carries the requested index
#if NET452_OR_GREATER || NETCOREAPP
    Parallel.ForEach(allItems, Core.Globals.ParallelOptions, entry =>
#elif NET40_OR_GREATER
    Parallel.ForEach(allItems, entry =>
#else
    foreach (var entry in allItems)
#endif
    {
        // Resolve the links of this item in the input DatFile
        long oldMachineIndex = machineByItem[entry.Key];
        long oldSourceIndex = sourceByItem[entry.Key];

        // Look up the source itself to compare its index ID
        var itemSource = datFile.ItemsDB.GetSource(oldSourceIndex);
        if (itemSource != null && itemSource.Index == index)
        {
            indexDat.AddItemDB(entry.Value, machineRemapping[oldMachineIndex], sourceRemapping[oldSourceIndex], statsOnly: false);
        }
#if NET40_OR_GREATER || NETCOREAPP
    });
#else
    }
#endif
}
#endregion
2020-12-10 10:39:39 -08:00
}
}