321 lines
12 KiB
PowerShell
321 lines
12 KiB
PowerShell
<#
|
|
Script should:
|
|
1) get list of all Project Folders
|
|
2) Determine if there's content in these folders (exlude shortcuts, lnks, single files)
|
|
3) Flag folders with content
|
|
4) Output results to file for each server.
|
|
|
|
Each Output file should be read by the analysis script to determine locations with duplicate data.
|
|
|
|
Output File should show:
|
|
X:\CG | ProjectNumber | FullPath | filecount
|
|
|
|
#>
|
|
|
|
[CmdletBinding()]
|
|
param (
|
|
#refresh all data - causes the DB to be wiped clean and all file folders to be re-analyzed.
|
|
[Parameter(Mandatory = $false)]
|
|
[switch]
|
|
$Refresh
|
|
)
|
|
|
|
#refresh all data - causes the DB to be wiped clean and all file folders to be re-analyzed.
|
|
|
|
$Path_To_Working_copy = "M:\00 - Egnyte PS Data Inventory\Output\MPE Data Inventory - Working.xlsx"
|
|
$PAth_To_Migration_Status = "M:\00 - Egnyte PS Data Inventory\Migration_status\Migration_Health_stat_MPE.xlsx"
|
|
$PathToDB = "M:\IT\Egnyte\DuplicateFiles\WorkingRun\Dedupe.SQLite"
|
|
$OutputFolder = "M:\IT\Egnyte\DuplicateFiles\WorkingRun\Output"
|
|
$BaseDrive = 'X:\'
|
|
$ProjectRegex = '^X:\\[A-Z]{2}\W\d{2}\\\d{2}'
|
|
$OfficeList = Get-ChildItem -Path $BaseDrive -Directory -Depth 0
|
|
|
|
if ($Refresh) {
|
|
# Reset the DB, start fresh
|
|
$DBConnect = New-SqliteConnection -DataSource $PathToDB
|
|
$ClearQuery = 'DELETE FROM FolderData;'
|
|
Invoke-SqliteQuery -DataSource $PathToDB -Query $ClearQuery
|
|
|
|
$DBConnect.close()
|
|
}
|
|
|
|
|
|
|
|
|
|
$OfficeList | ForEach-Object -parallel {
|
|
$PathToDB_Copy_Main = $USING:PathToDB
|
|
$ServerProgress = @{
|
|
ID = 1
|
|
Activity = "Processing: " + $_.FullName
|
|
# PercentComplete = 100
|
|
# CurrentOperation = $_.Project
|
|
}
|
|
Write-Progress @ServerProgress
|
|
#Action that will run in Parallel. Reference the current object via $PSItem and bring in outside variables with $USING:varname
|
|
|
|
$XDrivePath = $_.FullName
|
|
# Write-Host "Processing " $_.FullName -ForegroundColor Green
|
|
$ProjectFolders = get-childitem $_.FullName -Directory -Depth 1 | Where-Object FullName -Match $USING:ProjectRegex
|
|
|
|
# $ProjectFolders now contains all folders down to the 3rd level of project number - for Example, 1234-567-001. We can now generate a project number for the output file.
|
|
# We need to get a file count for each "last" folder - IE, 001 in the example 1234-567-001.
|
|
|
|
$ProjectFolders | ForEach-Object -ThrottleLimit 8 -Parallel {
|
|
$PathToDB_Copy = $USING:PathToDB_Copy_Main
|
|
|
|
$JobID = Get-Random
|
|
$CurentLoopProgress = @{
|
|
ID = $JobID
|
|
Activity = "Analyzing " + $_.FullName
|
|
PercentComplete = 10
|
|
}
|
|
|
|
# Write-Progress @CurentLoopProgress
|
|
|
|
|
|
$projectNumber = ''
|
|
# thank you ChatGPT
|
|
$string = $_.FullName
|
|
$regex = "\\(\d+(-\d+)*)"
|
|
$matches = [regex]::Matches($string, $regex)
|
|
$result = ""
|
|
foreach ($match in $matches) {
|
|
$result += $match.Groups[1].Value
|
|
if ($match.Groups[2].Success) {
|
|
$result += $match.Groups[2].Value
|
|
}
|
|
# if ($match.Groups[3].Success) {
|
|
# $result += $match.Groups[3].Value
|
|
# }
|
|
}
|
|
# / Thank you Chat GPT
|
|
# $result = $result -replace ('-','')
|
|
|
|
|
|
if ($result.Length -lt 5 ) {
|
|
# $CurentLoopProgress = @{
|
|
# ID = $JobID
|
|
# Activity = $_.FullName + " Not a Project"
|
|
# }
|
|
|
|
# Write-Progress @CurentLoopProgress
|
|
}
|
|
elseif ($result.Length -ge 5) {
|
|
$RefreshDays = -15 - (Get-Random -Maximum 5)
|
|
|
|
$Server = $_.FullName.Substring(1, 4) -replace (':|\\', '')
|
|
$Path = $_.FullName.Replace("'", "`'") #SQL Formatted Path
|
|
$Path = $Path.Replace("X:\", "\\mpe.ca\datadrive\")
|
|
$projectnumber = $result.tostring()
|
|
$DBConnect = New-SqliteConnection -DataSource $PathToDB_Copy
|
|
$Query = "Select Project,fld_LastRefresh FROM FolderData where Server = '$Server' AND Path = `"$Path`";"
|
|
$sql_result = Invoke-SqliteQuery -DataSource $PathToDB_Copy -Query $Query
|
|
|
|
|
|
if (($sql_result.project -eq $null) -or ($sql_result.fld_LastRefresh -le (Get-Date).AddDays($RefreshDays).ToShortDateString())) {
|
|
$CurentLoopProgress = @{
|
|
ID = $JobID
|
|
Activity = "Loading Telemetry for " + $_.FullName
|
|
PercentComplete = 75
|
|
}
|
|
|
|
Write-Progress @CurentLoopProgress
|
|
|
|
if ($sql_result.project -ne $null) {
|
|
# found a record, but needs updating - delete old record from DB
|
|
$Query = "Delete from FolderData WHERE Server = '$Server' AND Path = `"$Path`""
|
|
Invoke-SqliteQuery -DataSource $PathToDB_Copy -Query $Query
|
|
|
|
|
|
}
|
|
|
|
$result3 = [Regex]::Matches($_.FullName, "^(.*[\\\/])") # This gets everything up the last slash, thus the "parent"
|
|
$FolderPath_Data = Get-ChildItem -Path $_.FullName -File -Depth 50 -Recurse
|
|
$folder_Parent = $result3.value.replace("'", "`'") #SQL Formatting
|
|
$folder_Parent = $folder_Parent.Replace("X:\", "\\mpe.ca\datadrive\")
|
|
$folder_FileSize = ($FolderPath_Data | Measure -sum Length).sum / 1024 / 1024 / 1024
|
|
$folder_FileCount = ($FolderPath_Data | measure).Count
|
|
$folder_LastWrite = ($FolderPath_Data | measure LastWriteTime -Maximum).Maximum
|
|
$folder_LastAccess = ($FolderPath_Data | measure LastAccessTime -Maximum).Maximum
|
|
|
|
if ($folder_FileSize -le 0 -or $folder_FileCount -eq 0) {
|
|
|
|
#Let's ignore Null Values
|
|
}
|
|
else {
|
|
|
|
$out = [PSCustomObject]@{
|
|
Server = $Server
|
|
Parent = $folder_Parent
|
|
Path = $Path
|
|
FileCount = $folder_FileCount
|
|
FileSize = $folder_FileSize
|
|
FileLastWrite = $folder_LastWrite
|
|
FileLastAccess = $folder_LastAccess
|
|
Status = $null # added to support Migration Status
|
|
fld_MigrationID = $null
|
|
fld_LastRefresh = (Get-Date).ToShortDateString()
|
|
} | Out-DataTable
|
|
|
|
Invoke-SQLiteBulkCopy -DataSource $PathToDB_Copy -Table "FolderData" -DataTable $out -Force
|
|
|
|
}
|
|
}
|
|
$DBConnect.Close()
|
|
}
|
|
Write-Progress @CurentLoopProgress -Completed
|
|
}
|
|
Write-Progress @ServerProgress -Completed
|
|
} -ThrottleLimit 3
|
|
|
|
$ServerProgress = @{
|
|
ID = 1
|
|
Activity = "Database Work"
|
|
PercentComplete = 80
|
|
# CurrentOperation = $_.Project
|
|
}
|
|
Write-Progress @ServerProgress
|
|
|
|
<#
|
|
TODO Grab data from Egnyte Working Copy to re-incorporate into our DB. This will allow us to mark data as "in progress", and thus filter it out from future data inventory updates.
|
|
TODO Need to update Working Copy sheet to contain Project Number and Server for unique keys, and add antoher column for Egnyte Friendly Server Names to match the Migration Server names.
|
|
IE,
|
|
server,path,path2,etc,status,OriginalServer=RD,OriginalProject=ProjectNumber
|
|
|
|
|
|
#>
|
|
|
|
<# Get Migration Status
|
|
CREATE TABLE "MigrationStatus" (
|
|
"MigrationID" TEXT NOT NULL UNIQUE,
|
|
"MigrationName" TEXT,
|
|
"MigrationFolderSource" TEXT,
|
|
"MigrationFolderDestination" TEXT,
|
|
"MigrationStatus" INTEGER,
|
|
PRIMARY KEY("MigrationID")
|
|
);
|
|
|
|
#>
|
|
|
|
$MigrationStatus_import = Import-Excel -Path $PAth_To_Migration_Status -WorksheetName "MPE Migration Tracker" -StartRow 2
|
|
foreach ($status in $MigrationStatus_import) {
|
|
$SQLSourcePath = $status.'Source Path'.replace("'", "`'") #SQL Formatting
|
|
if ($SQLSourcePath -notmatch '\\$') {
|
|
$SQLSourcePath += '\'
|
|
}
|
|
$SQLDestPath = $status.'Destination Path'.replace("'", "`'") #SQL Formatting
|
|
if ($SQLDestPath -notmatch '\/$') {
|
|
$SQLDestPath += '/'
|
|
}
|
|
$SQLMigrationID = $status.'Migration ID'
|
|
$SQLMigrationName = $status.'Migration Name'
|
|
$SQLMigrationStatus = $status.'Current State'
|
|
|
|
$Query = "Select * from MigrationStatus WHERE MigrationID = `'$SQLMigrationID`'"
|
|
$Test = Invoke-SqliteQuery -DataSource $PathToDB -Query $Query
|
|
|
|
if ($test) {
|
|
$Query = "UPDATE MigrationStatus SET MigrationStatus = '$SQLMigrationStatus' WHERE MigrationID = '$SQLMigrationID'"
|
|
Invoke-SqliteQuery -DataSource $PathToDB -Query $Query
|
|
}
|
|
else {
|
|
$Query = "INSERT INTO MigrationStatus VALUES ('$SQLMigrationID','$SQLMigrationName',`'$SQLSourcePath`',`'$SQLDestPath`','$SQLMigrationStatus','')"
|
|
Invoke-SqliteQuery -DataSource $PathToDB -Query $Query
|
|
}
|
|
|
|
|
|
}
|
|
|
|
# Update DB with new Data from MigrationStatus
|
|
$Query = 'update FolderData SET fld_MigrationID = (SELECT MigrationID from MigrationStatus where Parent = MigrationFolderSource);'
|
|
Invoke-SqliteQuery -DataSource $PathToDB -Query $Query
|
|
|
|
## DB Now contains MigrationID in fld_MigrationID Column. We can now reliably track the individual folder status'
|
|
$query = "update FolderData set Status = (Select MigrationStatus from MigrationStatus where fld_MigrationID = MigrationID);"
|
|
Invoke-SqliteQuery -DataSource $PathToDB -Query $Query
|
|
|
|
|
|
|
|
## Kick off GenTables
|
|
|
|
$SQLFile_to_Run = $PSScriptRoot + '\GenTables.sql'
|
|
Invoke-SqliteQuery -DataSource $PathToDB -InputFile $SQLFile_to_Run
|
|
$SQLFile_to_Run = $PSScriptRoot + '\DuplicatePairing.sql'
|
|
Invoke-SqliteQuery -DataSource $PathToDB -InputFile $SQLFile_to_Run
|
|
|
|
$DBConnect = New-SqliteConnection -DataSource $PathToDB
|
|
|
|
foreach ($office in $OfficeList) {
|
|
$OfficeServer = $office.Name
|
|
|
|
$Query = "select * from OfficeDuplicates where Server = '$OfficeServer';"
|
|
$sql_result = Invoke-SqliteQuery -DataSource $PathToDB -Query $Query
|
|
|
|
if ($sql_result) {
|
|
$OutFile = $OutputFolder + "\$OfficeServer Duplicates.xlsx"
|
|
Remove-Item -Path $OutFile -Force
|
|
$sql_result | Export-Excel -Path $OutFile -AutoFilter
|
|
|
|
}
|
|
}
|
|
# Generate MPE All Xlsx
|
|
$Query = "select * from OfficeDuplicates;"
|
|
$sql_result = Invoke-SqliteQuery -DataSource $PathToDB -Query $Query
|
|
|
|
if ($sql_result) {
|
|
$OutFile = $OutputFolder + "\MPE All Duplicates.xlsx"
|
|
Remove-Item -Path $OutFile -Force
|
|
$sql_result | Export-Excel -Path $OutFile -AutoFilter
|
|
|
|
}
|
|
|
|
# Generate Parent Non-Duplicates
|
|
|
|
$Query = "select * from NonDupParent;"
|
|
$sql_result = Invoke-SqliteQuery -DataSource $PathToDB -Query $Query
|
|
|
|
if ($sql_result) {
|
|
$OutFile = $OutputFolder + "\MPE Non-Duplicates - Parent Folders.xlsx"
|
|
Remove-Item -Path $OutFile -Force
|
|
$sql_result | Export-Excel -Path $OutFile -AutoFilter
|
|
|
|
}
|
|
|
|
|
|
# Generate Project Non-Duplicates
|
|
|
|
$Query = "select * from NonDupProject where Path NOT IN (select Path from NonDupParent);"
|
|
$sql_result = Invoke-SqliteQuery -DataSource $PathToDB -Query $Query
|
|
|
|
if ($sql_result) {
|
|
$OutFile = $OutputFolder + "\MPE Non-Duplicates - Project Folders.xlsx"
|
|
Remove-Item -Path $OutFile -Force
|
|
$sql_result | Export-Excel -Path $OutFile -AutoFilter
|
|
|
|
}
|
|
|
|
## Generate Egnyte Data Inventory Sheet
|
|
|
|
$OutFile = $OutputFolder + "\MPE Data Inventory " + (Get-Date -Format FileDate) + ".xlsx"
|
|
try {
|
|
|
|
Remove-Item -Path $OutFile -Force -ErrorAction SilentlyContinue
|
|
}
|
|
catch {
|
|
<#Do this if a terminating exception happens#>
|
|
}
|
|
$SQLFile_to_Run = $PSScriptRoot + '\Generate Egnyte Export.sql'
|
|
Invoke-SqliteQuery -DataSource $PathToDB -InputFile $SQLFile_to_Run
|
|
$EgnyteExport = Invoke-SqliteQuery -DataSource $PathToDB -Query "Select Server,UNCPath,EgnytePath,FileCount,FileSize,Source from DataInventory"
|
|
|
|
if ($EgnyteExport) {
|
|
|
|
$EgnyteExport | Export-Excel -Path $OutFile -AutoFilter
|
|
}
|
|
|
|
|
|
|
|
$DBConnect.Close()
|
|
Write-Progress @ServerProgress -completed
|
|
|