Example #1
0
 /// <summary>
 /// Returns the shared <see cref="Stemming"/> object, creating it the first time the
 /// method is called and handing back the stored object on every later call.
 /// </summary>
 /// <remarks>No locking is performed around the creation of the object.</remarks>
 /// <returns>The <see cref="Stemming"/> object held in the <c>instance</c> field.</returns>
 public static Stemming Instance()
 {
     // Fast path: the object already exists, so return it untouched.
     if (instance != null)
     {
         return instance;
     }

     // First call: build the object and remember it for subsequent callers.
     instance = new Stemming();
     return instance;
 }
Example #2
0
 /// <summary>
 /// Global accessor for the one <see cref="Stemming"/> object kept in the
 /// <c>instance</c> field. The object is constructed on demand by the first call.
 /// </summary>
 /// <returns>The stored <see cref="Stemming"/> object; never a fresh one once it exists.</returns>
 public static Stemming Instance()
 {
     // Reuse the stored object when there is one; otherwise create it, store it and
     // return it in a single expression.
     return instance ?? (instance = new Stemming());
 }
Example #3
0
 /// <summary>
 /// Private constructor, so that only the class itself can create an instance.
 /// Obtains the plugin settings and the connection string, creates the connection
 /// object and the empty word table, and finally calls <c>LoadCache</c>.
 /// </summary>
 private WordsCache()
 {
     // Key handed to the connection string provider to look up this plugin's entry.
     const string connectionStringKey = "CrawlWave.ServerPlugins.WordExtraction";

     // Configuration: the connection string is fetched from the provider and stored
     // in the settings object before anything reads it back.
     settings = PluginSettings.Instance();
     dbProvider = DBConnectionStringProvider.Instance();
     settings.DBConnectionString = dbProvider.ProvideDBConnectionString(connectionStringKey);

     // The connection is only constructed here, from the value kept in the settings;
     // nothing in this constructor opens it.
     dbcon = new SqlConnection(settings.DBConnectionString);

     // In-memory state used by the cache.
     words = new Hashtable();
     stemming = Stemming.Instance();
     culture = new CultureInfo("el-GR");

     // Called last, once every field above has been assigned.
     LoadCache();
 }
Example #4
0
 /// <summary>
 /// Creates the cache object. The constructor is private, which leaves the class
 /// itself as the only code able to instantiate it. All fields are initialized
 /// here and <c>LoadCache</c> is called as the final step.
 /// </summary>
 private WordsCache()
 {
     // Name under which the connection string provider is asked for the connection string.
     const string providerKey = "CrawlWave.ServerPlugins.WordExtraction";

     settings = PluginSettings.Instance();
     dbProvider = DBConnectionStringProvider.Instance();

     // Store the connection string in the settings first; the connection below is
     // built from the value read back from the settings object.
     settings.DBConnectionString = dbProvider.ProvideDBConnectionString(providerKey);
     dbcon = new SqlConnection(settings.DBConnectionString);

     words = new Hashtable();
     stemming = Stemming.Instance();

     // Culture object for Greek (Greece).
     culture = new CultureInfo("el-GR");

     // Runs only after every field above has been set.
     LoadCache();
 }
Example #5
0
 /// <summary>
 /// The private constructor of the WordExtractor class. Creates the mutex, obtains the
 /// plugin settings and the stemming object, builds the regular expressions kept in the
 /// <c>reg*</c> fields, allocates the two stop word lists and then calls
 /// <c>InitializeWordLists</c>.
 /// </summary>
 private WordExtractor()
 {
     // Every expression below is constructed with the same combination of options.
     RegexOptions regexOptions = RegexOptions.CultureInvariant | RegexOptions.Multiline | RegexOptions.IgnoreCase | RegexOptions.Compiled;

     mutex    = new Mutex();
     settings = PluginSettings.Instance();

     // Matches any single markup tag.
     regStripTags = new Regex("<[^>]*>", regexOptions);

     // Matches one complete <script> element. The body uses the lazy quantifier "*?"
     // so that a match ends at the nearest closing tag; a greedy "*" would run from the
     // first <script> to the last </script> and swallow the page text in between.
     regStripScripts = new Regex(@"(?i)<script([^>])*>(\w|\W)*?</script([^>])*>", regexOptions);

     // Matches a <title> element whose content contains no nested tag.
     regTitleTags = new Regex("<\\s*title[^>]*>[^<]*<\\s*/title\\s*>", regexOptions);

     // Match <meta name="keywords" content="..."> and <meta name="description" content="...">.
     regKeywordTags     = new Regex("<meta\\s*name\\s*=\\s*\"keywords\"\\s*content\\s*=\\s*\"[^>]*\">", regexOptions);
     regDescriptionTags = new Regex("<meta\\s*name\\s*=\\s*\"description\"\\s*content\\s*=\\s*\"[^>]*\">", regexOptions);

     stemming = Stemming.Instance();

     // The lists are pre-sized to the length of the corresponding stop word arrays.
     slStopWordsEnglish = new SortedList(arStopWordsEnglish.Length);
     slStopWordsGreek   = new SortedList(arStopWordsGreek.Length);

     culture = new CultureInfo("el-GR");

     // Called last, after the lists and every other field have been created.
     InitializeWordLists();
 }
Example #6
0
 /// <summary>
 /// The private constructor of the WordExtractor class. It initializes the mutex, the
 /// settings and stemming references, the regular expressions used on markup, the stop
 /// word lists and the culture, and finishes by calling <c>InitializeWordLists</c>.
 /// </summary>
 private WordExtractor()
 {
     // Shared by all the regular expressions created in this constructor.
     RegexOptions sharedOptions = RegexOptions.CultureInvariant | RegexOptions.Multiline | RegexOptions.IgnoreCase | RegexOptions.Compiled;

     mutex = new Mutex();
     settings = PluginSettings.Instance();

     // Any markup tag.
     regStripTags = new Regex("<[^>]*>", sharedOptions);

     // A single <script> element including its body. The body is matched lazily ("*?"):
     // with a greedy "*" one match would span from the first opening tag to the last
     // closing tag, taking all the text between separate script elements with it.
     regStripScripts = new Regex(@"(?i)<script([^>])*>(\w|\W)*?</script([^>])*>", sharedOptions);

     // A <title> element with tag-free content.
     regTitleTags = new Regex("<\\s*title[^>]*>[^<]*<\\s*/title\\s*>", sharedOptions);

     // The keywords and description <meta> tags.
     regKeywordTags = new Regex("<meta\\s*name\\s*=\\s*\"keywords\"\\s*content\\s*=\\s*\"[^>]*\">", sharedOptions);
     regDescriptionTags = new Regex("<meta\\s*name\\s*=\\s*\"description\"\\s*content\\s*=\\s*\"[^>]*\">", sharedOptions);

     stemming = Stemming.Instance();

     // Initial capacity of each list equals the length of its stop word array.
     slStopWordsEnglish = new SortedList(arStopWordsEnglish.Length);
     slStopWordsGreek = new SortedList(arStopWordsGreek.Length);

     culture = new CultureInfo("el-GR");

     // Runs once all fields above are in place.
     InitializeWordLists();
 }