D
dhilip gopalan
Guest
I have my code which does collect the list of directories and saves it to an CSV output (DirectoryOutputfile.csv in my example). Using the directory list CSV file I use a recursive function and perform the task for each directory.
The task involves inputting the each directory and initiating the process and saves the output to another CSV. This happens for each directory and saves the output.
Also I am saving the completed directories into another CSV to know how many are being complete to view on LIVE basis.
My ask: I am not using any threading in my case, so would like to make the process run in parallel to make it fast and have the output saved as mentioned above. I am new to the threading, kindly suggest how can I use parallel processing or multi-threading in my code to speed up as there are around ~750K directories in the list.
I am not sure where would I need to implement this in my code as I have write and read operations using streamwriter and streamreader at multiple places.
Code below:
public static void OutputSigned(string dir, string outputdir, string checkdir)
{
string filenameOutput = "\\checkoutput_" + DateTime.Now.ToString("yyyy_MM_dd_HHmmss") + ".csv";
if (!File.Exists(outputdir + "\\DirectoryOutputfile.csv"))
{
var directories = DirectorySearch.GetDirectories(dir); //Gets the list of directories
directories.Sort();
DirectoriesToCSV(directories, outputdir); //Method to output the directory LIST to CSV file
}
using (StreamWriter writer = new StreamWriter(outputdir + filenameOutput)) //Creates output CSV file and writes the scanned files update
{
writer.AutoFlush = true;
using (FileStream fileStreamDirectory = File.Open(outputdir + "\\DirectoryOutputfile.csv", FileMode.Open, FileAccess.Read, FileShare.ReadWrite)) //Read directories from the DirectoryOutputfile CSV file
using (BufferedStream bufferStreamDirectory = new BufferedStream(fileStreamDirectory))
using (StreamReader streamReaderDirectory = new StreamReader(bufferStreamDirectory))
{
var directoryLineCountinCSV = File.ReadLines(outputdir + "\\DirectoryOutputfile.csv").Count(); //Counts the numver of directory lines in DirectoryOutputfile.csv output file
using (StreamWriter DirectoryLineUpdatedSofarInCSV = new StreamWriter(outputdir + "\\DirectoryLineUpdatedSofar" + filenameOutput.Replace("\\checkoutput", ""))) //Creates CSV file with the list of already scanned directories
{
DirectoryLineUpdatedSofarInCSV.AutoFlush = true;
string Directoryline;
while ((Directoryline = streamReaderDirectory.ReadLine()) != null)
{
if (Directory.Exists(Directoryline))
{
ProcessStartInfo ProcessStartInfo = new ProcessStartInfo
{
FileName = checkdir + "\\testing.exe",
Arguments = "-a -h -i -l " + Directoryline,
RedirectStandardOutput = true,
UseShellExecute = false,
CreateNoWindow = true
};
using (Process checkProcess = Process.Start(ProcessStartInfo))
{
var line = string.Empty;
using (StreamReader streamReader = checkProcess.StandardOutput)
{
while (!streamReader.EndOfStream)
{
var content = streamReader.ReadLine();
#Doing some task here
writer.WriteLine("Updating the data in CSV file");
}
}
checkProcess.WaitForExit(10000); //Waits for the process to exit
}
}
DirectoryLineUpdatedSofarInCSV.WriteLine("{0},Completed", Directoryline);
}
}
}
}
}
public static void DirectoriesToCSV(List<string> DirectoriesList, string outputdir)
{
using (StreamWriter directoryWriter = new StreamWriter(outputdir + "\\DirectoryOutputfile.csv"))
{
foreach (string directoryline in DirectoriesList)
{
directoryWriter.WriteLine(directoryline);
}
}
}
Thanks, Dhilip
Continue reading...
The task involves inputting the each directory and initiating the process and saves the output to another CSV. This happens for each directory and saves the output.
Also I am saving the completed directories into another CSV to know how many are being complete to view on LIVE basis.
My ask: I am not using any threading in my case, so would like to make the process run in parallel to make it fast and have the output saved as mentioned above. I am new to the threading, kindly suggest how can I use parallel processing or multi-threading in my code to speed up as there are around ~750K directories in the list.
I am not sure where would I need to implement this in my code as I have write and read operations using streamwriter and streamreader at multiple places.
Code below:
public static void OutputSigned(string dir, string outputdir, string checkdir)
{
string filenameOutput = "\\checkoutput_" + DateTime.Now.ToString("yyyy_MM_dd_HHmmss") + ".csv";
if (!File.Exists(outputdir + "\\DirectoryOutputfile.csv"))
{
var directories = DirectorySearch.GetDirectories(dir); //Gets the list of directories
directories.Sort();
DirectoriesToCSV(directories, outputdir); //Method to output the directory LIST to CSV file
}
using (StreamWriter writer = new StreamWriter(outputdir + filenameOutput)) //Creates output CSV file and writes the scanned files update
{
writer.AutoFlush = true;
using (FileStream fileStreamDirectory = File.Open(outputdir + "\\DirectoryOutputfile.csv", FileMode.Open, FileAccess.Read, FileShare.ReadWrite)) //Read directories from the DirectoryOutputfile CSV file
using (BufferedStream bufferStreamDirectory = new BufferedStream(fileStreamDirectory))
using (StreamReader streamReaderDirectory = new StreamReader(bufferStreamDirectory))
{
var directoryLineCountinCSV = File.ReadLines(outputdir + "\\DirectoryOutputfile.csv").Count(); //Counts the numver of directory lines in DirectoryOutputfile.csv output file
using (StreamWriter DirectoryLineUpdatedSofarInCSV = new StreamWriter(outputdir + "\\DirectoryLineUpdatedSofar" + filenameOutput.Replace("\\checkoutput", ""))) //Creates CSV file with the list of already scanned directories
{
DirectoryLineUpdatedSofarInCSV.AutoFlush = true;
string Directoryline;
while ((Directoryline = streamReaderDirectory.ReadLine()) != null)
{
if (Directory.Exists(Directoryline))
{
ProcessStartInfo ProcessStartInfo = new ProcessStartInfo
{
FileName = checkdir + "\\testing.exe",
Arguments = "-a -h -i -l " + Directoryline,
RedirectStandardOutput = true,
UseShellExecute = false,
CreateNoWindow = true
};
using (Process checkProcess = Process.Start(ProcessStartInfo))
{
var line = string.Empty;
using (StreamReader streamReader = checkProcess.StandardOutput)
{
while (!streamReader.EndOfStream)
{
var content = streamReader.ReadLine();
#Doing some task here
writer.WriteLine("Updating the data in CSV file");
}
}
checkProcess.WaitForExit(10000); //Waits for the process to exit
}
}
DirectoryLineUpdatedSofarInCSV.WriteLine("{0},Completed", Directoryline);
}
}
}
}
}
public static void DirectoriesToCSV(List<string> DirectoriesList, string outputdir)
{
using (StreamWriter directoryWriter = new StreamWriter(outputdir + "\\DirectoryOutputfile.csv"))
{
foreach (string directoryline in DirectoriesList)
{
directoryWriter.WriteLine(directoryline);
}
}
}
Thanks, Dhilip
Continue reading...