public FileHash CalculateHashes(byte[] buffer, long offset, int length, Config config)
        {
            var weakHash = CalculateWeakHash(buffer);
            var strongHash = CalculateStrongHash(buffer);

            var fileHash = new FileHash() { Length = length, Offset = offset, WeakHash = weakHash, StrongHash = strongHash };

            return fileHash;
        }
Example #2
0
        static void Main(string[] args)
        {
            var fileProcessor = new FileProcessor();
            var filePath = args[0];
            var config = new Config();
            var sortedDict = fileProcessor.GetHashesForFile(filePath, config);
               foreach (var entry in sortedDict)
            {
                Console.WriteLine("{0}:{1}:{2}:{3}", entry.Value.Offset, entry.Key, Convert.ToBase64String(entry.Value.StrongHash) , entry.Value.Length);
            }
            Console.Clear();

            //var comparisonFile = fileProcessor.GetDiffBlocksForFile(sortedDict, args[1], config);

            Console.WriteLine("Returned: {0} hashes", sortedDict.Count());

            //Console.WriteLine(comparisonFile.Count);
            Console.ReadKey();
        }
Example #3
0
 public void UploadCurrentConfig(Config config, Guid sessionId)
 {
 }
Example #4
0
        public Guid CalculateHashesForFile(Config config, Guid sessionId)
        {
            var fileProcessor = new FileProcessor();
            var filePath = @"D:\\Downloads\\en_windows_7_ultimate_rc_x64_dvd_347803.iso";
            var fileId = Guid.NewGuid();
            fileProcessor.GetHashesForFileBockComplete += delegate(Guid currentFileId)
                                                                  {

                                                                      using (var ds = new DataStoreEntities())
                                                                      {
                                                                          var statusEntry =
                                                                              ds.FileStatuses.Where(
                                                                                  x => x.FileId == fileId)
                                                                          _.FirstOrDefault;

                                                                          if(statusEntry != null)
                                                                          {

                                                                          }

                                                                          else
                                                                          {

                                                                          }
                                                                      }
                                                                  };
            using (var ds = new DataStoreEntities())
            {

                var fileSignature = ds.FileSignatures.Where(x => x.FilePath == filePath).FirstOrDefault();

                if (fileSignature != null)
                {
                    return fileSignature.FileId;

                }

                var progressReporter = new ProgressReporter();

                Task.Factory.StartNew(() =>
                                          {

                                              var fileHashes = fileProcessor.GetHashesForFile(filePath, progressReporter,
                                                                                              config);
                                              using (var ms = new MemoryStream())
                                              {
                                                  var binaryFormatter = new BinaryFormatter();
                                                  binaryFormatter.Serialize(ms, fileHashes);

                                                  ds.FileSignatures.AddObject(new FileSignature()
                                                                                  {
                                                                                      FileId = fileId,
                                                                                      FilePath = filePath,
                                                                                      Signature = ms.ToArray()
                                                                                  });
                                              }
                                              ds.SaveChanges();
                                          });

                return fileId;

            }
        }
        public List<FileChunk> GetChunksForFileBlock(int blockNumber, CancellationToken cancellationToken, 
            ConcurrentDictionary<long, FileHash> remoteHashes, FileStream mappedFile, long fileBlockChunkStartOffset, long chunkLength, ProgressReporter progressReporter, Config config)
        {
            var chunkBuffer = FillBuffer(mappedFile, fileBlockChunkStartOffset, config);
            var windowSize = config.BlockLength;

            //our position in the chunk buffer
            long chunkBufferReadOffset = 0;

            //out position in the actual file block.
            var chunkReadOffset = fileBlockChunkStartOffset;

            //lets us track the 'non matched' blocks.
            var nonMatchStartOffset = chunkBufferReadOffset;

            var windowWeakChecksum = new Adler32();

            var outList = new List<FileChunk>();
            while (chunkReadOffset < chunkLength)
            {
                if (cancellationToken.IsCancellationRequested)
                    return null;

                var buffer = new byte[windowSize];

                if (chunkBufferReadOffset + config.BlockLength >= chunkBuffer.Length)
                {
                    FillBuffer(mappedFile, chunkReadOffset, config);
                    chunkBufferReadOffset = 0;
                }
                //correct for 'end of block' so the buffer array is the right length.
                if (chunkReadOffset + config.BlockLength > chunkLength)
                {
                    windowSize = checked((int)(chunkLength - chunkReadOffset));
                    buffer = new byte[windowSize];
                }

                 Array.ConstrainedCopy(chunkBuffer,(int)chunkBufferReadOffset,buffer,0,windowSize);

                if (chunkBufferReadOffset == 0)
                {
                    windowWeakChecksum.Update(buffer);
                }
                else
                {
                    windowWeakChecksum.Update(buffer, buffer.Length - 1, 1);
                }

                var weakCheckSum = windowWeakChecksum.Value;

                FileHash match;
                remoteHashes.TryGetValue(weakCheckSum, out match);
                if (match != null)
                {
                    var strongHash = CalculateStrongHash(buffer);
                    if (strongHash.SequenceEqual(match.StrongHash))
                    {
                        if (chunkBufferReadOffset > 0)
                        {
                            var nonMatchEndOffset = fileBlockChunkStartOffset - 1;
                            var nonMatchingChunk = new FileChunk
                                                       {
                                                           IsMatch = false,
                                                           BlockLength = nonMatchEndOffset - nonMatchStartOffset,
                                                           SourceOffset = nonMatchStartOffset + fileBlockChunkStartOffset
                                                       };
                            outList.Add(nonMatchingChunk);
                            nonMatchStartOffset = chunkBufferReadOffset + config.BlockLength;
                        }

                        var matchingChunk = new FileChunk
                                                {
                                                    IsMatch = true,
                                                    DestinationOffset = chunkReadOffset,
                                                    SourceOffset = match.Offset,
                                                    BlockLength = config.BlockLength
                                                };
                        outList.Add(matchingChunk);
                        windowWeakChecksum.Reset();
                    }
                }

                if (chunkBufferReadOffset % 100 == 0)
                {
                    long offset = chunkBufferReadOffset;
                    progressReporter.ReportProgress(()=>
                                                         {
                                                             if (DiffBlockScanProgressChanged != null)
                                                                 DiffBlockScanProgressChanged(blockNumber,

                                                                                     ((int)
                                                                                      (offset/chunkLength*100)));

                                                         })
                    ;
                }
                chunkBufferReadOffset += 1;
                chunkReadOffset += 1;
            }
            if (chunkLength - nonMatchStartOffset > 1)
            {
                var nonMatchingChunk = new FileChunk { IsMatch = false, BlockLength = chunkLength - nonMatchStartOffset, SourceOffset = nonMatchStartOffset + chunkBufferReadOffset };
                outList.Add(nonMatchingChunk);
            }
            return outList;
        }
 private byte[] FillBuffer(Stream fileStream, long startOffset, Config config)
 {
     var outArray = new byte[config.BufferSize];
     fileStream.Seek(startOffset, SeekOrigin.Begin);
     fileStream.Read(outArray, 0, outArray.Length);
     return outArray;
 }
        public ConcurrentDictionary<long, FileHash> GetHashesForFile(FileStream file, ProgressReporter progressReporter, Config config)
        {
            var resultDictionary = new ConcurrentDictionary<long, FileHash>();

            var fileLength = file.Length;

            var localBlockLength = config.BlockLength;
            if (fileLength <= localBlockLength)
            {
                localBlockLength = checked((int)fileLength);
            }

            long currentFilePosition = 0;
            var bytesToRead = config.BlockLength;
              var numberOfBlocks = checked((int) fileLength/config.BlockLength);
            var buffer = new byte[bytesToRead];
            var maxTaskCount = config.DegreeOfParalleism * 15;

            if (maxTaskCount >= numberOfBlocks)
                maxTaskCount = numberOfBlocks;

            var taskArray = new List<Task>(maxTaskCount);

                while (currentFilePosition < fileLength)
                {
                    if (currentFilePosition + localBlockLength > fileLength)
                    {
                        bytesToRead = checked((int)(fileLength - currentFilePosition));
                        buffer = new byte[bytesToRead];
                    }
                    var offSetPosition = currentFilePosition;

                    if (file.Read(buffer, 0, bytesToRead) < 0)
                    {
                        break;
                    }

                    currentFilePosition = file.Position;
                    var taskCount = 0;
                    if (taskArray.Count <= maxTaskCount)
                    {
                        taskCount++;
                        byte[] taskBuffer = buffer;
                        int read = bytesToRead;
                        taskArray.Add(Task.Factory.StartNew(() => CalculateHashes(taskBuffer, offSetPosition, read, config))
                                          .ContinueWith(
                                              outHash =>
                                                  {
                                                      resultDictionary.TryAdd(outHash.Result.WeakHash, outHash.Result);

                                                      progressReporter.ReportProgressAsync(
                                                          () =>
                                                              {
                                                                  if (GetHashesForFileBockComplete != null)
                                                                      GetHashesForFileBockComplete(taskCount,
                                                                                                   numberOfBlocks);
                                                              });

                                                  }));
                    }
                    else
                    {
                        var complete = Task.WaitAny(taskArray.ToArray());

                        taskArray.RemoveAt(complete);
                    }
                }

            Task.WaitAll(taskArray.ToArray());

            return resultDictionary;
        }
 public ConcurrentDictionary<long, FileHash> GetHashesForFile(string filepath, ProgressReporter progressReporter, Config config)
 {
     using (var fileStream = File.Open(filepath, FileMode.Open, FileAccess.Read, FileShare.Read))
       {
           return GetHashesForFile(fileStream,progressReporter, config);
       }
 }
 public List<FileChunk> GetDiffBlocksForFile(ConcurrentDictionary<long, FileHash> remoteHashes, string filePath, ProgressReporter progressReporter, Config config)
 {
     using (var fileStream = new FileStream(filePath, FileMode.Open, FileAccess.Read, FileShare.Read))
     {
         return GetDiffBlocksForFile(remoteHashes, fileStream, progressReporter, config);
     }
 }
Example #10
0
        public List<FileChunk> GetDiffBlocksForFile(ConcurrentDictionary<long, FileHash> remoteHashes, FileStream fileStream, ProgressReporter progressReporter, Config config)
        {
            _cancellationSource = new CancellationTokenSource();
               var cancellationToken = _cancellationSource.Token;
               var fileLength = fileStream.Length;

               var lockObj = new object();

               var fileBlockSize = Convert.ToInt64(fileLength / config.DegreeOfParalleism );

               long chunkStart = 0;
               long chunkEnd = 0;
               //really should be concurrentbag but SL doesn't support that.
               var resultBag = new List<FileChunk>();

                   var taskArray = new List<Task>();
                   var chunkCounter = 0;
                   for (var i = 0; i < config.DegreeOfParalleism; i++)
                   {
                       chunkEnd = chunkEnd + fileBlockSize;
                       var chunkOverlap = chunkEnd + config.BlockLength;

                       if (chunkEnd > fileLength)
                       {
                           chunkEnd = fileLength;
                           chunkOverlap = chunkEnd;
                       }

                       if (taskArray.Count() <= config.DegreeOfParalleism)
                       {
                           chunkCounter++;
                           var localChunkStart = chunkStart;
                           var length = chunkOverlap - chunkStart;

                           int counter = chunkCounter;
                           var chunkScanTask = Task.Factory.StartNew(
                               () => GetChunksForFileBlock(counter, cancellationToken, remoteHashes, fileStream, localChunkStart, length, progressReporter, config),
                               cancellationToken, TaskCreationOptions.LongRunning, TaskScheduler.Default)
                               .ContinueWith(
                                   outHash =>
                                       {
                                           lock (lockObj)
                                           {
                                           outHash.Result.ForEach(resultBag.Add);
                                           }
                                       });

                           taskArray.Add(chunkScanTask);

                       }

                       Interlocked.Add(ref chunkStart, fileBlockSize);

                   }
                   Task.WaitAll(taskArray.ToArray());

               return resultBag;
        }