|
|
|
@ -6,6 +6,7 @@ using Serilog;
|
|
|
|
|
using Serilog.Events;
|
|
|
|
|
using MurmurHash.Net;
|
|
|
|
|
using Standart.Hash.xxHash;
|
|
|
|
|
using StackExchange.Redis;
|
|
|
|
|
|
|
|
|
|
namespace Chksum.Utils;
|
|
|
|
|
public class ChksumUtils {
|
|
|
|
@ -52,7 +53,7 @@ public class ChksumUtils {
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
public void initializeDB() {
|
|
|
|
|
private void initializeDB() {
|
|
|
|
|
if (File.Exists("chksum.db")) {
|
|
|
|
|
logger.Information("A database already exits");
|
|
|
|
|
return;
|
|
|
|
@ -73,6 +74,14 @@ public class ChksumUtils {
|
|
|
|
|
);
|
|
|
|
|
";
|
|
|
|
|
command.ExecuteNonQuery();
|
|
|
|
|
|
|
|
|
|
var walCommand = connection.CreateCommand();
|
|
|
|
|
walCommand.CommandText =
|
|
|
|
|
@"
|
|
|
|
|
PRAGMA journal_mode = 'wal'
|
|
|
|
|
";
|
|
|
|
|
walCommand.ExecuteNonQuery();
|
|
|
|
|
|
|
|
|
|
logger.Information("Database was successfully created");
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
@ -89,9 +98,19 @@ public class ChksumUtils {
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
/// <summary>
/// Redraws a one-line textual progress indicator ("Progress: P% [current/total]")
/// at the start of the current console line.
/// </summary>
/// <param name="current">Number of items processed so far.</param>
/// <param name="total">Total number of items to process.</param>
private void UpdateProgressBar(int current, int total) {
    // Guard the division: with total == 0 the quotient is NaN/Infinity and the
    // cast to int is not well defined. Nothing to do is reported as complete.
    int progress = total > 0 ? (int)((double)current / total * 100) : 100;
    string progressText = $"Progress: {progress}% [{current}/{total}]";

    if (Console.IsOutputRedirected) {
        // No terminal is attached, so the window width is meaningless (and may
        // not be readable at all); emit the text without padding.
        Console.Write("\r" + progressText);
        return;
    }

    // Pad to one column less than the window width: filling the whole row makes
    // many terminals wrap to the next line, after which "\r" no longer returns
    // to the start of the progress line. Math.Max keeps PadRight from receiving
    // a negative width when the reported window width is 0.
    int padWidth = Math.Max(0, Console.WindowWidth - 1);
    Console.Write("\r" + progressText.PadRight(padWidth));
}
|
|
|
|
|
|
|
|
|
|
private Dictionary<string, string> CalculateChecksums(string[] filenames) {
|
|
|
|
|
ConcurrentDictionary<string, string> checksums = new ConcurrentDictionary<string, string>();
|
|
|
|
|
|
|
|
|
|
int totalFiles = filenames.Length;
|
|
|
|
|
int processedFiles = 0;
|
|
|
|
|
|
|
|
|
|
Parallel.ForEach(filenames, (filename, state) => {
|
|
|
|
|
using (var md5 = MD5.Create()) {
|
|
|
|
|
using (var stream = File.OpenRead(filename)) {
|
|
|
|
@ -102,31 +121,36 @@ public class ChksumUtils {
|
|
|
|
|
checksums.TryAdd(filename, checksum);
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
Interlocked.Increment(ref processedFiles);
|
|
|
|
|
UpdateProgressBar(processedFiles, totalFiles);
|
|
|
|
|
}
|
|
|
|
|
});
|
|
|
|
|
|
|
|
|
|
logger.Debug("All files were checksummed");
|
|
|
|
|
return new Dictionary<string, string>(checksums);
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
/// <summary>
/// Hashes every file in <paramref name="filenames"/> in parallel by passing an
/// open read stream to <c>CalculateMurmurHash32</c>, reporting progress on the
/// console after each file.
/// </summary>
/// <param name="filenames">Paths of the files to hash.</param>
/// <param name="userDefinedBufferSize">
/// Buffer size forwarded to <c>CalculateMurmurHash32</c>. Defaults to 4096, the
/// value that was hard-coded before the buffer size became configurable.
/// </param>
/// <returns>A dictionary mapping each file path to its 32-bit hash.</returns>
private Dictionary<string, uint> CalculateChecksumsWithMurmur(string[] filenames, int userDefinedBufferSize = 4096) {
    ConcurrentDictionary<string, uint> checksums = new ConcurrentDictionary<string, uint>();

    int totalFiles = filenames.Length;
    int processedFiles = 0;

    Parallel.ForEach(filenames, (filename, state) => {
        using (var stream = File.OpenRead(filename)) {
            var hash = CalculateMurmurHash32(stream, userDefinedBufferSize);
            // ConcurrentDictionary.TryAdd is already thread-safe; no extra lock is needed.
            // A path that appears twice keeps the first hash that was stored.
            checksums.TryAdd(filename, hash);
        }

        // Use the value returned by Interlocked.Increment. Re-reading the shared
        // counter afterwards races with other workers and can report stale or
        // repeated counts.
        int processedSoFar = Interlocked.Increment(ref processedFiles);
        UpdateProgressBar(processedSoFar, totalFiles);
    });

    logger.Debug("All files were checksummed");
    return new Dictionary<string, uint>(checksums);
}
|
|
|
|
|
|
|
|
|
|
private uint CalculateMurmurHash32(Stream stream) {
|
|
|
|
|
const int bufferSize = 4096;
|
|
|
|
|
private uint CalculateMurmurHash32(Stream stream, int userDefinedBufferSize) {
|
|
|
|
|
int bufferSize = userDefinedBufferSize;
|
|
|
|
|
const uint seed = 123456U;
|
|
|
|
|
|
|
|
|
|
var buffer = new byte[bufferSize];
|
|
|
|
@ -141,21 +165,26 @@ public class ChksumUtils {
|
|
|
|
|
return hash;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
/// <summary>
/// Hashes every file in <paramref name="filenames"/> in parallel by passing an
/// open read stream to <c>CalculateXxHash3</c>, reporting progress on the
/// console after each file.
/// </summary>
/// <param name="filenames">Paths of the files to hash.</param>
/// <param name="userDefinedBufferSize">
/// Buffer size forwarded to <c>CalculateXxHash3</c>. Defaults to 4096, the
/// value that was hard-coded before the buffer size became configurable.
/// </param>
/// <returns>A dictionary mapping each file path to its 64-bit hash.</returns>
private Dictionary<string, ulong> CalculateChecksumsWithXxHash3(string[] filenames, int userDefinedBufferSize = 4096) {
    ConcurrentDictionary<string, ulong> checksums = new ConcurrentDictionary<string, ulong>();

    int totalFiles = filenames.Length;
    int processedFiles = 0;

    Parallel.ForEach(filenames, (filename, state) => {
        using (var stream = File.OpenRead(filename)) {
            var hash = CalculateXxHash3(stream, userDefinedBufferSize);
            // A path that appears twice keeps the first hash that was stored.
            checksums.TryAdd(filename, hash);
        }

        // Use the value returned by Interlocked.Increment. Re-reading the shared
        // counter afterwards races with other workers and can report stale or
        // repeated counts.
        int processedSoFar = Interlocked.Increment(ref processedFiles);
        UpdateProgressBar(processedSoFar, totalFiles);
    });

    return new Dictionary<string, ulong>(checksums);
}
|
|
|
|
|
|
|
|
|
|
private ulong CalculateXxHash3(Stream stream) {
|
|
|
|
|
const int bufferSize = 4096;
|
|
|
|
|
private ulong CalculateXxHash3(Stream stream, int userDefinedBufferSize) {
|
|
|
|
|
int bufferSize = userDefinedBufferSize;
|
|
|
|
|
const ulong seed = 123456U;
|
|
|
|
|
|
|
|
|
|
var buffer = new byte[bufferSize];
|
|
|
|
@ -170,63 +199,95 @@ public class ChksumUtils {
|
|
|
|
|
return hash;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
/// <summary>
/// Checksums all indexed files with the selected algorithm and stores the
/// result in the Redis hash "fileHashes" (field = file path, value = hash
/// rendered as text) on the Redis server at "localhost".
/// </summary>
/// <param name="hashalgo">Hash algorithm to use: "MD5", "Murmur" or "XxHash" (case-sensitive).</param>
/// <param name="bufferSize">Buffer size forwarded to the Murmur and XxHash implementations; not passed to the MD5 path.</param>
/// <exception cref="ArgumentException">
/// Thrown when <paramref name="hashalgo"/> is not one of the supported values.
/// </exception>
public void doTheThing(string hashalgo, int bufferSize = 4096) {
    // Nothing to hash means nothing to store, so do not open a Redis connection at all.
    if (getTotalFileCount() < 1) {
        logger.Information("There were no files to checksum");
        return;
    }

    // Connect before hashing so an unreachable Redis fails fast, and dispose the
    // multiplexer when done; it was previously never released.
    using (ConnectionMultiplexer redis = ConnectionMultiplexer.Connect("localhost")) {
        IDatabase db = redis.GetDatabase();

        // Every algorithm's result is normalised to text because that is the
        // form in which it is written to Redis.
        Dictionary<string, string> fileHashes;

        switch (hashalgo) {
            case "MD5":
                fileHashes = CalculateChecksums(indexFiles());
                break;
            case "Murmur":
                fileHashes = CalculateChecksumsWithMurmur(indexFiles(), bufferSize)
                    .ToDictionary(kv => kv.Key, kv => kv.Value.ToString());
                break;
            case "XxHash":
                fileHashes = CalculateChecksumsWithXxHash3(indexFiles(), bufferSize)
                    .ToDictionary(kv => kv.Key, kv => kv.Value.ToString());
                break;
            default:
                logger.Error("No valid hash algorithm was selected");
                throw new ArgumentException($"{hashalgo} is not a valid option. Valid options are MD5, Murmur and XxHash", nameof(hashalgo));
        }

        logger.Information("All files were checksummed");

        HashEntry[] hashEntries = fileHashes.Select(kv => new HashEntry(kv.Key, kv.Value)).ToArray();
        string hashKey = "fileHashes";
        db.HashSet(hashKey, hashEntries);
        logger.Information("Dictionary inserted into Redis.");
    }
}
|
|
|
|
|
|
|
|
|
|
public void saveToSqlite() {
|
|
|
|
|
|
|
|
|
|
initializeDB();
|
|
|
|
|
|
|
|
|
|
ConnectionMultiplexer redis = ConnectionMultiplexer.Connect("localhost");
|
|
|
|
|
IDatabase db = redis.GetDatabase();
|
|
|
|
|
|
|
|
|
|
HashEntry[] fileHashes = db.HashGetAll("fileHashes");
|
|
|
|
|
logger.Information("Retrived all values from redis");
|
|
|
|
|
|
|
|
|
|
public void doTheThing(string hashalgo, int bufferSize) {
|
|
|
|
|
using (var connection = new SqliteConnection("Data Source=" + DatabaseRoot + "chksum.db;Mode=ReadWrite")) {
|
|
|
|
|
if (getTotalFileCount() < 1) {
|
|
|
|
|
logger.Information("There were no files to checksum");
|
|
|
|
|
return;
|
|
|
|
|
}
|
|
|
|
|
connection.Open();
|
|
|
|
|
|
|
|
|
|
Dictionary<string, object> fileHashes;
|
|
|
|
|
Dictionary<string, ulong> fileHashesXxHash3;
|
|
|
|
|
Dictionary<string, uint> fileHashesMurmur;
|
|
|
|
|
Dictionary<string, string> fileHashesMD5;
|
|
|
|
|
|
|
|
|
|
switch (hashalgo) {
|
|
|
|
|
case "MD5":
|
|
|
|
|
fileHashesMD5 = CalculateChecksums(indexFiles());
|
|
|
|
|
fileHashes = fileHashesMD5.ToDictionary(kv => kv.Key, kv => (object)kv.Value);
|
|
|
|
|
break;
|
|
|
|
|
case "Murmur":
|
|
|
|
|
fileHashesMurmur = CalculateChecksumsWithMurmur(indexFiles());
|
|
|
|
|
fileHashes = fileHashesMurmur.ToDictionary(kv => kv.Key, kv => (object)kv.Value);
|
|
|
|
|
break;
|
|
|
|
|
case "XxHash":
|
|
|
|
|
fileHashesXxHash3 = CalculateChecksumsWithXxHash3(indexFiles());
|
|
|
|
|
fileHashes = fileHashesXxHash3.ToDictionary(kv => kv.Key, kv => (object)kv.Value);
|
|
|
|
|
break;
|
|
|
|
|
default:
|
|
|
|
|
logger.Error("No valid hash algorithm was selected");
|
|
|
|
|
throw new Exception($"{hashalgo} is not a valid option. Valid options are MD5, Murmur and XxHash");
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
foreach (var file in fileHashes) {
|
|
|
|
|
string absolutePathToFile = file.Key;
|
|
|
|
|
string fileName = Path.GetFileName(absolutePathToFile);
|
|
|
|
|
string pathToFile = Path.GetRelativePath(DatabaseRoot, absolutePathToFile);
|
|
|
|
|
var fileHash = file.Value;
|
|
|
|
|
|
|
|
|
|
if (checkIfFileMovedAndUpdatePathToFile(fileHash, fileName, pathToFile) == false && checkIfFileAlreadyExistsInDatabase(fileHash, fileName) == false) {
|
|
|
|
|
var command = connection.CreateCommand();
|
|
|
|
|
command.CommandText =
|
|
|
|
|
var absolutePathToFile = file.Name.ToString();
|
|
|
|
|
string fileName = Path.GetFileName(absolutePathToFile.ToString());
|
|
|
|
|
string pathToFile = Path.GetRelativePath(DatabaseRoot, absolutePathToFile.ToString());
|
|
|
|
|
var fileHash = file.Value.ToString();
|
|
|
|
|
|
|
|
|
|
if (!checkIfFileMovedAndUpdatePathToFile(fileHash, fileName, pathToFile) && !checkIfFileAlreadyExistsInDatabase(fileHash, fileName)) {
|
|
|
|
|
connection.Open();
|
|
|
|
|
var InsertCommand = connection.CreateCommand();
|
|
|
|
|
InsertCommand.CommandText =
|
|
|
|
|
@"
|
|
|
|
|
INSERT INTO file (filehash, filename, pathtofile)
|
|
|
|
|
VALUES ($filehash, $filename, $pathtofile)
|
|
|
|
|
";
|
|
|
|
|
command.Parameters.AddWithValue("$filehash", fileHash);
|
|
|
|
|
command.Parameters.AddWithValue("$filename", fileName);
|
|
|
|
|
command.Parameters.AddWithValue("$pathtofile", pathToFile);
|
|
|
|
|
command.ExecuteNonQuery();
|
|
|
|
|
InsertCommand.Parameters.AddWithValue("$filehash", fileHash);
|
|
|
|
|
InsertCommand.Parameters.AddWithValue("$filename", fileName);
|
|
|
|
|
InsertCommand.Parameters.AddWithValue("$pathtofile", pathToFile);
|
|
|
|
|
InsertCommand.ExecuteNonQuery();
|
|
|
|
|
logger.Verbose("{fileName} which is located at {pathToFile} relative to the database with the hash {fileHash} was successfully inserted into the database", fileName, pathToFile, fileHash);
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
logger.Information("All files were successfully written to the database");
|
|
|
|
|
}
|
|
|
|
|
logger.Information("All filehashes were successfully inserted into the database");
|
|
|
|
|
|
|
|
|
|
var keys = db.Execute("KEYS", "*");
|
|
|
|
|
if (keys == null) {
|
|
|
|
|
logger.Error("No values found in redis");
|
|
|
|
|
return;
|
|
|
|
|
}
|
|
|
|
|
foreach (var key in (RedisValue[])keys) {
|
|
|
|
|
db.KeyDelete((RedisKey)key.ToString());
|
|
|
|
|
}
|
|
|
|
|
logger.Information("Redis was successfully cleared of any remaining data");
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
private bool checkIfFileAlreadyExistsInDatabase(object fileHash, string pathToFile) {
|
|
|
|
|
private bool checkIfFileAlreadyExistsInDatabase(string fileHash, string pathToFile) {
|
|
|
|
|
string filehash = string.Empty;
|
|
|
|
|
string pathtofile = string.Empty;
|
|
|
|
|
bool doesExist = false;
|
|
|
|
@ -239,7 +300,7 @@ public class ChksumUtils {
|
|
|
|
|
@"
|
|
|
|
|
SELECT filehash, pathtofile FROM file WHERE filehash = $filehash
|
|
|
|
|
";
|
|
|
|
|
command.Parameters.AddWithValue("$filehash", fileHash.ToString());
|
|
|
|
|
command.Parameters.AddWithValue("$filehash", fileHash);
|
|
|
|
|
|
|
|
|
|
using (var reader = command.ExecuteReader()) {
|
|
|
|
|
while (reader.Read()) {
|
|
|
|
@ -247,17 +308,17 @@ public class ChksumUtils {
|
|
|
|
|
pathtofile = reader.GetString(1);
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
logger.Verbose("{pathToFile} with the hash {fileHash} was successfully loaded", pathToFile, fileHash.ToString());
|
|
|
|
|
logger.Verbose("{pathToFile} with the hash {fileHash} was successfully loaded", pathToFile, fileHash);
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
if (fileHash.ToString() == filehash) {
|
|
|
|
|
if (fileHash == filehash) {
|
|
|
|
|
logger.Verbose("File with filehash {filehash} already exists in the database", filehash);
|
|
|
|
|
doesExist = true;
|
|
|
|
|
}
|
|
|
|
|
return doesExist;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
private bool checkIfFileMovedAndUpdatePathToFile(object fileHash, string fileName, string pathToFile) {
|
|
|
|
|
private bool checkIfFileMovedAndUpdatePathToFile(string fileHash, string fileName, string pathToFile) {
|
|
|
|
|
string pathtofile = string.Empty;
|
|
|
|
|
bool wasMoved = false;
|
|
|
|
|
|
|
|
|
@ -269,7 +330,7 @@ public class ChksumUtils {
|
|
|
|
|
@"
|
|
|
|
|
SELECT pathtofile FROM file WHERE filehash = $filehash
|
|
|
|
|
";
|
|
|
|
|
command.Parameters.AddWithValue("$filehash", fileHash.ToString());
|
|
|
|
|
command.Parameters.AddWithValue("$filehash", fileHash);
|
|
|
|
|
|
|
|
|
|
using (var reader = command.ExecuteReader()) {
|
|
|
|
|
while (reader.Read()) {
|
|
|
|
@ -286,20 +347,21 @@ public class ChksumUtils {
|
|
|
|
|
WHERE filehash = $filehash
|
|
|
|
|
";
|
|
|
|
|
command2.Parameters.AddWithValue("$newpathtofile", pathToFile);
|
|
|
|
|
command2.Parameters.AddWithValue("$filehash", fileHash.ToString());
|
|
|
|
|
command2.Parameters.AddWithValue("$filehash", fileHash);
|
|
|
|
|
command2.ExecuteNonQuery();
|
|
|
|
|
|
|
|
|
|
//Console.WriteLine("File moved or is a duplicate:");
|
|
|
|
|
//Console.WriteLine($"\tfrom\t{pathToFile}");
|
|
|
|
|
//Console.WriteLine($"\tto \t{pathtofile}\n");
|
|
|
|
|
logger.Verbose("File moved or is a duplicate:\n\tfrom\t{pathToFile}\n\tto \t{pathtofile}\n", pathToFile, pathtofile);
|
|
|
|
|
wasMoved = true;
|
|
|
|
|
}
|
|
|
|
|
logger.Verbose("{fileName} which is located at {pathToFile} relative to the database with the hash {fileHash} was successfully checked", fileName, pathToFile, fileHash.ToString());
|
|
|
|
|
logger.Verbose("{fileName} which is located at {pathToFile} relative to the database with the hash {fileHash} was successfully checked", fileName, pathToFile, fileHash);
|
|
|
|
|
}
|
|
|
|
|
return wasMoved;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
public void checkIfFileWasDeleted() {
|
|
|
|
|
|
|
|
|
|
saveToSqlite();
|
|
|
|
|
|
|
|
|
|
string pathToFile = string.Empty;
|
|
|
|
|
|
|
|
|
|
using (var connection = new SqliteConnection("Data Source=" + DatabaseRoot + "chksum.db;Mode=ReadWrite")) {
|
|
|
|
@ -328,9 +390,7 @@ public class ChksumUtils {
|
|
|
|
|
deleteCommand.Parameters.AddWithValue("$pathtofile", pathToFile);
|
|
|
|
|
deleteCommand.ExecuteNonQuery();
|
|
|
|
|
|
|
|
|
|
//Console.WriteLine("File deleted:");
|
|
|
|
|
//Console.WriteLine($"\t{pathToFile}\n");
|
|
|
|
|
logger.Information("File deleted: {pathToFile}", pathToFile);
|
|
|
|
|
logger.Information("File deleted:\n\t{pathToFile}", pathToFile);
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
logger.Information("All deleted files were successfully removed from the database");
|
|
|
|
@ -364,6 +424,9 @@ public class ChksumUtils {
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
public void compareDatabases(string filePathToOtherDatabase) {
|
|
|
|
|
|
|
|
|
|
saveToSqlite();
|
|
|
|
|
|
|
|
|
|
if (!File.Exists(filePathToOtherDatabase)) {
|
|
|
|
|
logger.Error("No database could be found at {filePathToOtherDatabase}", filePathToOtherDatabase);
|
|
|
|
|
throw new Exception("No database could be found at " + filePathToOtherDatabase);
|
|
|
|
@ -400,6 +463,6 @@ public class ChksumUtils {
|
|
|
|
|
|
|
|
|
|
/// <summary>
/// Deletes the file at <c>libraryPath</c> and logs the removal.
/// </summary>
/// <remarks>
/// NOTE(review): <c>libraryPath</c> is declared outside this view; judging by the
/// log message it presumably points at libe_sqlite3.so. Confirm against its declaration.
/// </remarks>
public void cleanup() {
    File.Delete(libraryPath);
    // Log once: the message was previously emitted at both Debug and Information level.
    logger.Information("Successfully deleted libe_sqlite3.so");
}
|
|
|
|
|
}
|