using System;
using System.Collections.Generic;
using System.IO;
using System.Linq;
using System.Text.RegularExpressions;
using Dinah.Core;
using Polly;
using Polly.Retry;

namespace FileManager
{
    /// <summary>
    /// Helpers for building valid, unique file paths and for performing
    /// delete/move/enumerate operations that tolerate common file-system failures.
    /// </summary>
    public static class FileUtility
    {
        /// <summary>
        /// Normalize a file extension so that it carries exactly one leading dot.
        /// <br />"txt" => ".txt"
        /// <br />".txt" => ".txt"
        /// <br />null or whitespace => ""
        /// </summary>
        /// <param name="extension">Extension with or without surrounding dots/whitespace. May be null.</param>
        /// <returns>The trimmed extension prefixed with a single '.', or "" for null/whitespace input.</returns>
        public static string GetStandardizedExtension(string extension)
            => string.IsNullOrWhiteSpace(extension)
            ? string.Empty
            : '.' + extension.Trim().Trim('.');

        /// <summary>
        /// Return position with correct number of leading zeros.
        /// <br />- 2 of 9 => "2"
        /// <br />- 2 of 90 => "02"
        /// <br />- 2 of 900 => "002"
        /// </summary>
        /// <param name="position">position in sequence. The 'x' in 'x of y'</param>
        /// <param name="total">total qty in sequence. The 'y' in 'x of y'</param>
        /// <returns><paramref name="position"/> left-padded with '0' to the digit count of <paramref name="total"/>.</returns>
        /// <exception cref="ArgumentException">Thrown when <paramref name="position"/> is greater than <paramref name="total"/>.</exception>
        public static string GetSequenceFormatted(int position, int total)
        {
            ArgumentValidator.EnsureGreaterThan(position, nameof(position), 0);
            ArgumentValidator.EnsureGreaterThan(total, nameof(total), 0);
            if (position > total)
            {
                throw new ArgumentException($"{position} may not be greater than {total}");
            }

            return position.ToString().PadLeft(total.ToString().Length, '0');
        }

        /// <summary>
        /// Ensure valid file name path:
        /// <br />- remove invalid chars
        /// <br />- ensure uniqueness
        /// <br />- enforce max file length
        /// </summary>
        /// <param name="path">Desired path. Must not be null.</param>
        /// <param name="replacements">Supplies the replacement for each invalid character.</param>
        /// <param name="returnFirstExisting">
        /// When true the uniqueness search is skipped and the first candidate is returned
        /// even if a file already exists at that location.
        /// </param>
        /// <returns>The sanitized path, suffixed with " (n)" before the extension when needed for uniqueness.</returns>
        public static LongPath GetValidFilename(LongPath path, ReplacementCharacters replacements, bool returnFirstExisting = false)
        {
            ArgumentValidator.EnsureNotNull(path, nameof(path));

            // remove invalid chars
            path = GetSafePath(path, replacements);

            // ensure uniqueness and check lengths
            var dir = Path.GetDirectoryName(path);
            dir = dir?.Truncate(LongPath.MaxDirectoryLength) ?? string.Empty;

            var extension = Path.GetExtension(path);

            var filename = Path.GetFileNameWithoutExtension(path).Truncate(LongPath.MaxFilenameLength - extension.Length);
            var fileStem = Path.Combine(dir, filename);

            var fullfilename = removeInvalidWhitespace(fileStem.Truncate(LongPath.MaxPathLength - extension.Length) + extension);

            var i = 0;
            // Test the flag first so no file-system probe happens when the caller accepts an existing file.
            while (!returnFirstExisting && File.Exists(fullfilename))
            {
                var increm = $" ({++i})";
                // Normalize every candidate the same way as the first one; otherwise an incremented
                // name is built from the un-normalized stem and can point at a differently spelled directory.
                fullfilename = removeInvalidWhitespace(
                    fileStem.Truncate(LongPath.MaxPathLength - increm.Length - extension.Length) + increm + extension);
            }

            return fullfilename;
        }

        /// <summary>
        /// Use with full path, not file name. Valid path characters which are invalid file name
        /// characters will be retained: '\\', '/'
        /// </summary>
        /// <param name="path">Full path to sanitize. Must not be null.</param>
        /// <param name="replacements">Supplies the replacement for each invalid character.</param>
        /// <returns>The prefix-less path with invalid characters replaced and repeated separators condensed.</returns>
        public static LongPath GetSafePath(LongPath path, ReplacementCharacters replacements)
        {
            ArgumentValidator.EnsureNotNull(path, nameof(path));

            var pathNoPrefix = path.PathWithoutPrefix;

            pathNoPrefix = replaceInvalidChars(pathNoPrefix, replacements);
            pathNoPrefix = removeDoubleSlashes(pathNoPrefix);

            return pathNoPrefix;
        }

        /// <summary>
        /// Characters that are replaced by <see cref="GetSafePath"/>:
        /// <see cref="Path.GetInvalidPathChars"/> plus a fixed set of additional characters.
        /// </summary>
        public static char[] invalidChars { get; } = Path.GetInvalidPathChars().Union(new[] {
            '*', '?', ':',
            // these are weird. If you run Path.GetInvalidPathChars() in Visual Studio's "C# Interactive", then these characters are included.
            // In live code, Path.GetInvalidPathChars() does not include them
            '"', '<', '>'
        }).ToArray();

        /// <summary>Replace each character found in <see cref="invalidChars"/> with its configured replacement.</summary>
        private static string replaceInvalidChars(string path, ReplacementCharacters replacements)
        {
            // Replace every invalid char, except that on a rooted path the first 3 chars
            // (indices 0-2, e.g. "C:\") are kept verbatim so the drive colon survives.
            var builder = new System.Text.StringBuilder();
            for (var i = 0; i < path.Length; i++)
            {
                var c = path[i];

                if (!invalidChars.Contains(c) || (i <= 2 && Path.IsPathRooted(path)))
                {
                    builder.Append(c);
                }
                else
                {
                    // The neighbours are handed to the replacement lookup; 'default' marks "no neighbour".
                    char preceding = i > 0 ? path[i - 1] : default;
                    char succeeding = i < path.Length - 1 ? path[i + 1] : default;
                    builder.Append(replacements.GetReplacement(c, preceding, succeeding));
                }
            }

            return builder.ToString();
        }

        /// <summary>Condense runs of the platform directory separator into a single separator.</summary>
        private static string removeDoubleSlashes(string path)
        {
            if (path.Length < 2)
            {
                return path;
            }

            // exception: don't try to condense the initial dbl bk slashes in a path. eg: \\192.168.0.1
            var remainder = path[1..];

            var dblSeparator = $"{Path.DirectorySeparatorChar}{Path.DirectorySeparatorChar}";

            while (remainder.Contains(dblSeparator))
            {
                remainder = remainder.Replace(dblSeparator, $"{Path.DirectorySeparatorChar}");
            }

            return path[0] + remainder;
        }

        // Matches: any whitespace/dots, a directory separator, then any whitespace.
        private static string removeInvalidWhitespace_pattern { get; } = $@"[\s\.]*\{Path.DirectorySeparatorChar}\s*";
        private static Regex removeInvalidWhitespace_regex { get; } = new(removeInvalidWhitespace_pattern, RegexOptions.Compiled | RegexOptions.IgnorePatternWhitespace);

        /// <summary>no part of the path may begin or end in whitespace</summary>
        private static string removeInvalidWhitespace(string fullfilename)
        {
            // no whitespace at beginning or end
            // replace whitespace around path slashes
            //    regex (with space added for clarity)
            //    \s*  \\  \s*    =>    \
            // no ending dots. beginning dots are valid

            // regex is easier by ending with separator
            fullfilename += Path.DirectorySeparatorChar;
            fullfilename = removeInvalidWhitespace_regex.Replace(fullfilename, Path.DirectorySeparatorChar.ToString());
            // take separator back off
            fullfilename = RemoveLastCharacter(fullfilename);

            fullfilename = removeDoubleSlashes(fullfilename);
            return fullfilename;
        }

        /// <summary>Return <paramref name="str"/> without its final character; null and empty input are returned unchanged.</summary>
        public static string RemoveLastCharacter(this string str) => string.IsNullOrEmpty(str) ? str : str[..^1];

        /// <summary>
        /// Move file.
        /// <br />- Ensure valid file name path: remove invalid chars, ensure uniqueness, enforce max file length
        /// <br />- Perform <see cref="SaferMove(LongPath, LongPath)"/>
        /// <br />- Return valid path
        /// </summary>
        /// <param name="source">File to move.</param>
        /// <param name="destination">Desired destination; it is passed through <see cref="GetValidFilename"/> before the move.</param>
        /// <param name="replacements">Supplies the replacement for each invalid character.</param>
        /// <returns>The destination path that was actually used.</returns>
        public static string SaferMoveToValidPath(LongPath source, LongPath destination, ReplacementCharacters replacements)
        {
            destination = GetValidFilename(destination, replacements);
            SaferMove(source, destination);
            return destination;
        }

        private static int maxRetryAttempts { get; } = 3;
        private static TimeSpan pauseBetweenFailures { get; } = TimeSpan.FromMilliseconds(100);

        // NOTE(review): the exception type argument of Handle was missing from the source as received;
        // Exception is assumed here because the retried bodies catch and rethrow Exception - confirm.
        private static RetryPolicy retryPolicy { get; } =
            Policy
            .Handle<Exception>()
            .WaitAndRetry(maxRetryAttempts, i => pauseBetweenFailures);

        /// <summary>Delete file. No error when source does not exist. Retry up to 3 times before throwing exception.</summary>
        /// <param name="source">File to delete.</param>
        public static void SaferDelete(LongPath source)
            => retryPolicy.Execute(() =>
            {
                try
                {
                    if (!File.Exists(source))
                    {
                        Serilog.Log.Logger.Debug("No file to delete: {@DebugText}", new { source });
                        return;
                    }

                    Serilog.Log.Logger.Debug("Attempt to delete file: {@DebugText}", new { source });
                    File.Delete(source);
                    Serilog.Log.Logger.Information("File successfully deleted: {@DebugText}", new { source });
                }
                catch (Exception e)
                {
                    // Log each failed attempt, then rethrow so the retry policy can react.
                    Serilog.Log.Logger.Error(e, "Failed to delete file: {@DebugText}", new { source });
                    throw;
                }
            });

        /// <summary>Move file. No error when source does not exist. Retry up to 3 times before throwing exception.</summary>
        /// <param name="source">File to move.</param>
        /// <param name="destination">Target path. An existing file at this path is deleted first.</param>
        public static void SaferMove(LongPath source, LongPath destination)
            => retryPolicy.Execute(() =>
            {
                try
                {
                    if (!File.Exists(source))
                    {
                        Serilog.Log.Logger.Debug("No file to move: {@DebugText}", new { source });
                        return;
                    }

                    SaferDelete(destination);

                    var dir = Path.GetDirectoryName(destination);
                    // A destination without a directory component yields null/"" here, and
                    // Directory.CreateDirectory rejects both - there is nothing to create in that case.
                    if (!string.IsNullOrEmpty(dir))
                    {
                        Serilog.Log.Logger.Debug("Attempt to create directory: {@DebugText}", new { dir });
                        Directory.CreateDirectory(dir);
                    }

                    Serilog.Log.Logger.Debug("Attempt to move file: {@DebugText}", new { source, destination });
                    File.Move(source, destination);
                    Serilog.Log.Logger.Information("File successfully moved: {@DebugText}", new { source, destination });
                }
                catch (Exception e)
                {
                    // Log each failed attempt, then rethrow so the retry policy can react.
                    Serilog.Log.Logger.Error(e, "Failed to move file: {@DebugText}", new { source, destination });
                    throw;
                }
            });

        /// <summary>
        /// A safer way to get all the files in a directory and sub directory without crashing on UnauthorizedException or PathTooLongException
        /// </summary>
        /// <param name="path">Starting directory</param>
        /// <param name="searchPattern">Filename pattern match</param>
        /// <param name="searchOption">Search subdirectories or only top level directory for files</param>
        /// <returns>List of files</returns>
        public static IEnumerable<LongPath> SaferEnumerateFiles(LongPath path, string searchPattern = "*", SearchOption searchOption = SearchOption.TopDirectoryOnly)
        {
            var foundFiles = Enumerable.Empty<LongPath>();

            if (searchOption == SearchOption.AllDirectories)
            {
                try
                {
                    IEnumerable<LongPath> subDirs = Directory.EnumerateDirectories(path).Select(p => (LongPath)p);
                    // Add files in subdirectories recursively to the list
                    foreach (string dir in subDirs)
                    {
                        foundFiles = foundFiles.Concat(SaferEnumerateFiles(dir, searchPattern, searchOption));
                    }
                }
                catch (UnauthorizedAccessException) { }
                catch (PathTooLongException) { }
            }

            try
            {
                // Add files from the current directory
                foundFiles = foundFiles.Concat(Directory.EnumerateFiles(path, searchPattern).Select(f => (LongPath)f));
            }
            catch (UnauthorizedAccessException) { }
            // Skip over-long paths here too, matching the sub-directory walk above and the documented contract.
            catch (PathTooLongException) { }

            return foundFiles;
        }
    }
}