From 4f9160461e2d09c30029a70f9ffdacb6a697156b Mon Sep 17 00:00:00 2001
From: Tangent
Date: Thu, 23 May 2024 20:57:51 -0600
Subject: [PATCH] dealing with uniquitity weirdly

---
Note: the line structure and indentation of this patch were reconstructed.
The context lines of the unique-files.lua hunk belong to a file that is not
part of this patch, so their whitespace is a best guess; use
`git apply --ignore-whitespace` if they do not match. The index hashes are
carried over unchanged from the original commit.

 unique-file-names.lua | 59 +++++++++++++++++++++++++++++++++++++++++++++++++++++++++++
 unique-file-paths.lua | 67 +++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++
 unique-files.lua      |  5 ++--
 3 files changed, 128 insertions(+), 3 deletions(-)
 create mode 100644 unique-file-names.lua
 create mode 100644 unique-file-paths.lua

diff --git a/unique-file-names.lua b/unique-file-names.lua
new file mode 100644
index 0000000..89cf749
--- /dev/null
+++ b/unique-file-names.lua
@@ -0,0 +1,59 @@
+#!/usr/bin/env luajit
+
+-- Partially written by ChatGPT using GPT-3.5, with corrections and modifications by me.
+-- Do whatever the hell you want with it.
+
+-- Usage: unique-file-names.lua <directory> [<directory> ...]
+-- Reports every file name that occurs more than once below the given directories.
+
+local lfs = require "lfs"
+
+--- Recursively collect the full path of every regular file below a directory.
+-- Entries are joined with a backslash, so Windows-style paths are produced.
+-- @param path directory to scan
+-- @return set-like table: full file path -> true
+local function traverse_directory(path)
+  local files = {}
+
+  for entry in lfs.dir(path) do
+    if entry ~= "." and entry ~= ".." then
+      local full_path = path..'\\'..entry
+      local attributes = lfs.attributes(full_path)
+
+      if attributes and attributes.mode == "file" then
+        -- store the file itself; keying on 'path' would only record its parent directory
+        files[full_path] = true
+
+      elseif attributes and attributes.mode == "directory" then
+        for sub_path in pairs(traverse_directory(full_path)) do
+          files[sub_path] = true
+        end
+      end
+    end
+  end
+
+  return files
+end
+
+
+
+local paths = {} -- becomes a hashtable of hashtables of full_path = true
+for _, path in ipairs(arg) do
+  -- powershell handles quotes, so I assume each argument is a full valid path
+  paths[path] = traverse_directory(path)
+end
+
+local file_names = {} -- file name -> number of files found with that name
+for _, full_path_table in pairs(paths) do
+  for path in pairs(full_path_table) do
+    -- the file name is everything after the last backslash
+    local current_name = path:match("([^\\]+)$")
+    file_names[current_name] = (file_names[current_name] or 0) + 1
+  end
+end
+
+for current_name, occurrences in pairs(file_names) do
+  if occurrences ~= 1 then
+    print(current_name .. " occurs " .. occurrences .. " times!")
+  end
+end
diff --git a/unique-file-paths.lua b/unique-file-paths.lua
new file mode 100644
index 0000000..be59ccf
--- /dev/null
+++ b/unique-file-paths.lua
@@ -0,0 +1,67 @@
+#!/usr/bin/env luajit
+
+-- Partially written by ChatGPT using GPT-3.5, with corrections and modifications by me.
+-- Do whatever the hell you want with it.
+
+-- Usage: unique-file-paths.lua <directory> [<directory> ...]
+-- Reports every relative file path that exists below more than one of the given directories.
+
+local lfs = require "lfs"
+
+--- Recursively collect the full path of every regular file below a directory.
+-- Entries are joined with a backslash, so Windows-style paths are produced.
+-- @param path directory to scan
+-- @return set-like table: full file path -> true
+local function traverse_directory(path)
+  local files = {}
+
+  for entry in lfs.dir(path) do
+    if entry ~= "." and entry ~= ".." then
+      local full_path = path..'\\'..entry
+      local attributes = lfs.attributes(full_path)
+
+      if attributes and attributes.mode == "file" then
+        -- store the file itself; keying on 'path' would only record its parent directory
+        files[full_path] = true
+
+      elseif attributes and attributes.mode == "directory" then
+        for sub_path in pairs(traverse_directory(full_path)) do
+          files[sub_path] = true
+        end
+      end
+    end
+  end
+
+  return files
+end
+
+
+
+local paths = {} -- becomes a hashtable of hashtables of full_path = true
+for _, path in ipairs(arg) do
+  -- powershell handles quotes, so I assume each argument is a full valid path
+  paths[path] = traverse_directory(path)
+end
+
+local subpaths = {} -- a hashtable of all unique subpaths
+for path_start, full_path_table in pairs(paths) do
+  for path in pairs(full_path_table) do
+    -- swap the root directory for "." so the same file under different roots shares one key
+    local local_path = "." .. path:sub(#path_start + 1)
+    subpaths[local_path] = true
+  end
+end
+
+for subpath in pairs(subpaths) do
+  local known_paths = {} -- full paths of this subpath, one per root that contains it
+  for path_start, full_path_table in pairs(paths) do
+    local global_path = path_start .. subpath:sub(2)
+    if full_path_table[global_path] then
+      known_paths[#known_paths + 1] = global_path
+    end
+  end
+  -- a subpath found under exactly one root is unique and is not reported
+  if #known_paths ~= 1 then
+    print(subpath .. " exists " .. #known_paths .. " times!\n" .. table.concat(known_paths, "\n"))
+  end
+end
diff --git a/unique-files.lua b/unique-files.lua
index b0b3469..3c5dfde 100644
--- a/unique-files.lua
+++ b/unique-files.lua
@@ -86,9 +86,8 @@ for subpath in pairs(subpaths) do
     for global_path, size in pairs(sizes) do
       table.insert(output_text, global_path .. ": " .. size .. " bytes")
     end
-    print(subpath .. " has different sizes!\n" .. table.concat(output_text,"\n") .. "\n")
+    print(subpath .. " has different sizes!\n" .. table.concat(output_text,"\n")) -- the extra \n at the end is kept intentionally
   elseif paths_checked < 2 then
-    -- print(subpath .. " is unique!\n" .. next(sizes) .. "\n")
-    print(next(sizes) .. " is unique!\n")
+    print("UNIQUE: " .. next(sizes))
   end
 end