/// <summary>
/// Indexes a single file. When the file exists, its text is read, a code document built from it is
/// passed to <c>CodeIndexPool.UpdateIndex</c> under a term derived from the file path, and one hint
/// document per collected hint word is passed to <c>HintIndexPool.UpdateIndex</c>.
/// </summary>
/// <param name="fileInfo">File to index. A file that does not exist is skipped and still reported as successful.</param>
/// <returns>
/// <c>Successful</c> when no exception was caught, <c>FailedWithIOException</c> when an
/// <see cref="IOException"/> was caught, and <c>FailedWithError</c> for any other caught exception.
/// </returns>
/// <exception cref="OperationCanceledException">Logged and then rethrown instead of being mapped to a result.</exception>
public IndexBuildResults CreateIndex(FileInfo fileInfo)
{
    // Builds the hint document (original word plus its invariant lower-case form) for one word.
    Document ToHintDocument(string hintWord)
    {
        var hintDocument = new Document();
        hintDocument.Add(new StringField(nameof(CodeWord.Word), hintWord, Field.Store.YES));
        hintDocument.Add(new StringField(nameof(CodeWord.WordLower), hintWord.ToLowerInvariant(), Field.Store.YES));
        return hintDocument;
    }

    try
    {
        // The existence check stays inside the try so that failures here go through the same handler.
        if (!fileInfo.Exists)
        {
            return IndexBuildResults.Successful;
        }

        var fileText = FilesContentHelper.ReadAllText(fileInfo.FullName);
        var source = CodeSource.GetCodeSource(fileInfo, fileText);

        var hintWords = new HashSet<string>();
        AddHintWords(hintWords, source.Content);

        // The document is built before the path term, matching the original evaluation order.
        var codeDocument = IndexBuilderHelper.GetDocumentFromSource(source);
        var filePathTerm = GetNoneTokenizeFieldTerm(nameof(CodeSource.FilePath), source.FilePath);
        CodeIndexPool.UpdateIndex(filePathTerm, codeDocument);

        foreach (var hintWord in hintWords)
        {
            var wordTerm = new Term(nameof(CodeWord.Word), hintWord);
            HintIndexPool.UpdateIndex(wordTerm, ToHintDocument(hintWord));
        }

        Log.LogInformation($"{Name}: Create index For {source.FilePath} finished");
        return IndexBuildResults.Successful;
    }
    catch (Exception ex)
    {
        // Every exception is logged first, including the cancellation that is rethrown below.
        Log.LogError($"{Name}: Create index for {fileInfo.FullName} failed, exception: " + ex);

        switch (ex)
        {
            case IOException _:
                return IndexBuildResults.FailedWithIOException;
            case OperationCanceledException _:
                throw;
            default:
                return IndexBuildResults.FailedWithError;
        }
    }
}
/// <summary>
/// Re-indexes a single file. When the file exists, the code document stored under its path term is
/// replaced through <c>CodeIndexPool.UpdateIndex</c>, which also hands back the previously stored
/// documents. The hint words of the first previous document are compared with the hint words of the
/// new content: words that only occurred before are deleted from <c>HintIndexPool</c> unless the code
/// index still contains them, and words that are new are written to <c>HintIndexPool</c>.
/// When no previous document is returned, all hint words of the new content are written.
/// </summary>
/// <param name="fileInfo">File to re-index. A file that does not exist is skipped and still reported as successful.</param>
/// <param name="cancellationToken">Checked once, after the existence check and before the file is read.</param>
/// <returns>
/// <c>Successful</c> when no exception was caught, <c>FailedWithIOException</c> when an
/// <see cref="IOException"/> was caught, and <c>FailedWithError</c> for any other caught exception.
/// </returns>
/// <exception cref="OperationCanceledException">Logged and then rethrown instead of being mapped to a result.</exception>
public IndexBuildResults UpdateIndex(FileInfo fileInfo, CancellationToken cancellationToken)
{
    // Builds the hint document (original word plus its invariant lower-case form) for one word.
    Document ToHintDocument(string hintWord)
    {
        var hintDocument = new Document();
        hintDocument.Add(new StringField(nameof(CodeWord.Word), hintWord, Field.Store.YES));
        hintDocument.Add(new StringField(nameof(CodeWord.WordLower), hintWord.ToLowerInvariant(), Field.Store.YES));
        return hintDocument;
    }

    try
    {
        if (!fileInfo.Exists)
        {
            return IndexBuildResults.Successful;
        }

        cancellationToken.ThrowIfCancellationRequested();

        var fileText = FilesContentHelper.ReadAllText(fileInfo.FullName);
        var source = CodeSource.GetCodeSource(fileInfo, fileText);

        var currentWords = new HashSet<string>();
        AddHintWords(currentWords, source.Content);

        // The document is built before the path term, matching the original evaluation order.
        var codeDocument = IndexBuilderHelper.GetDocumentFromSource(source);
        var filePathTerm = GetNoneTokenizeFieldTerm(nameof(CodeSource.FilePath), source.FilePath);
        CodeIndexPool.UpdateIndex(filePathTerm, codeDocument, out var previousDocuments);

        // Without a previous document, every current word is written to the hint index.
        var wordsToWrite = currentWords;

        if (previousDocuments.Length < 1)
        {
            Log.LogError($"{Name}: Find 0 Document To Update With Path {source.FilePath}, Create New Index");
        }
        else
        {
            // Only the first previous document is used for the comparison.
            var previousWords = new HashSet<string>();
            AddHintWords(previousWords, GetCodeSourceFromDocument(previousDocuments[0]).Content);

            var removalCandidates = previousWords.Except(currentWords).ToArray();
            wordsToWrite = new HashSet<string>(currentWords.Except(previousWords));

            Log.LogInformation($"{Name}: Find {removalCandidates.Length} Delete Candidates Words, {wordsToWrite.Count} Update Candidates Words With Path {source.FilePath}");

            if (previousDocuments.Length > 1)
            {
                Log.LogError($"{Name}: Find {previousDocuments.Length} Documents With Path {source.FilePath} To Update");
            }

            foreach (var candidate in removalCandidates)
            {
                // The code index has already been updated above; a word it still contains is kept as a hint.
                var contentQuery = new TermQuery(new Term(GetCaseSensitiveField(nameof(CodeSource.Content)), candidate));
                if (CodeIndexPool.Exists(contentQuery))
                {
                    continue;
                }

                HintIndexPool.DeleteIndex(new Term(nameof(CodeWord.Word), candidate));
            }
        }

        foreach (var hintWord in wordsToWrite)
        {
            var wordTerm = new Term(nameof(CodeWord.Word), hintWord);
            HintIndexPool.UpdateIndex(wordTerm, ToHintDocument(hintWord));
        }

        Log.LogInformation($"{Name}: Update index For {source.FilePath} finished");
        return IndexBuildResults.Successful;
    }
    catch (Exception ex)
    {
        // Every exception is logged first, including the cancellation that is rethrown below.
        Log.LogError($"{Name}: Update index for {fileInfo.FullName} failed, exception: " + ex);

        switch (ex)
        {
            case IOException _:
                return IndexBuildResults.FailedWithIOException;
            case OperationCanceledException _:
                throw;
            default:
                return IndexBuildResults.FailedWithError;
        }
    }
}
/// <summary>
/// Writes a set of code documents and a set of hint words to their index pools.
/// Code documents are gathered into per-worker lists by <c>Parallel.ForEach</c>, and each non-empty list
/// is passed to <c>CodeIndexPool.BuildIndex</c>. Hint words are handled the same way through
/// <c>HintIndexPool.BuildIndex</c> for a brand new build; otherwise each word is written individually
/// with <c>HintIndexPool.UpdateIndex</c>, followed by <c>HintIndexPool.Commit</c> when any of the three flags is set.
/// </summary>
/// <param name="needCommit">Forwarded to the pools' <c>BuildIndex</c>; also one of the flags that trigger the hint commit.</param>
/// <param name="triggerMerge">Forwarded to the pools' <c>BuildIndex</c>; also one of the flags that trigger the hint commit.</param>
/// <param name="applyAllDeletes">Forwarded to the pools' <c>BuildIndex</c>; also one of the flags that trigger the hint commit.</param>
/// <param name="codeDocuments">Code documents to add to the code index.</param>
/// <param name="newHintWords">Words to add to the hint index.</param>
/// <param name="cancellationToken">Checked once on entry; not passed to the parallel loops.</param>
/// <param name="brandNewBuild">Selects batched hint building (<c>true</c>) or per-word hint updates (<c>false</c>).</param>
void BuildIndex(bool needCommit, bool triggerMerge, bool applyAllDeletes, List<Document> codeDocuments, HashSet<string> newHintWords, CancellationToken cancellationToken, bool brandNewBuild)
{
    cancellationToken.ThrowIfCancellationRequested();

    Log.LogInformation($"{Name}: Build code index start, documents count {codeDocuments.Count}");

    Parallel.ForEach(
        codeDocuments,
        () => new List<Document>(),
        (document, loopState, batch) =>
        {
            batch.Add(document);
            return batch;
        },
        batch =>
        {
            // A worker that received no items has nothing to write.
            if (batch.Count > 0)
            {
                CodeIndexPool.BuildIndex(batch, needCommit, triggerMerge, applyAllDeletes);
            }
        });

    Log.LogInformation($"{Name}: Build code index finished");

    var buildKind = brandNewBuild ? "brand New" : "exist";
    Log.LogInformation($"{Name}: Build {buildKind} hint index start, documents count {newHintWords.Count}");

    if (!brandNewBuild)
    {
        Parallel.ForEach(newHintWords, hintWord =>
        {
            HintIndexPool.UpdateIndex(new Term(nameof(CodeWord.Word), hintWord), ToHintDocument(hintWord));
        });

        var commitRequested = needCommit || triggerMerge || applyAllDeletes;
        if (commitRequested)
        {
            HintIndexPool.Commit();
        }
    }
    else
    {
        Parallel.ForEach(
            newHintWords,
            () => new List<Document>(),
            (hintWord, loopState, batch) =>
            {
                batch.Add(ToHintDocument(hintWord));
                return batch;
            },
            batch =>
            {
                if (batch.Count > 0)
                {
                    HintIndexPool.BuildIndex(batch, needCommit, triggerMerge, applyAllDeletes);
                }
            });
    }

    Log.LogInformation($"{Name}: Build hint index finished");

    // Builds the hint document (original word plus its invariant lower-case form) for one word.
    Document ToHintDocument(string hintWord)
    {
        var hintDocument = new Document();
        hintDocument.Add(new StringField(nameof(CodeWord.Word), hintWord, Field.Store.YES));
        hintDocument.Add(new StringField(nameof(CodeWord.WordLower), hintWord.ToLowerInvariant(), Field.Store.YES));
        return hintDocument;
    }
}