示例#1
0
        /// <summary>
        /// Builds the model's frequency vectors from a set of lower-case character counts.
        /// </summary>
        /// <param name="lowerCaseCharCounts">
        /// Character counts to derive the model from; its frequencies vector is stored
        /// as the lower-case model, and each of its characters also seeds the
        /// mixed-case model.
        /// </param>
        /// <param name="upperCaseToLowerCaseFactor">
        /// Multiplier applied to a character's scaled count to obtain the count
        /// assigned to its invariant upper-case form.
        /// </param>
        protected LanguageModel(CharCounters lowerCaseCharCounts, double upperCaseToLowerCaseFactor)
        {
            // Counts are multiplied by this constant before the factor is applied;
            // presumably so that rounding the upper-case count to an integer loses
            // little precision - TODO confirm.
            const int CountScale = 1000;

            lowerCaseFrequencies = lowerCaseCharCounts.ToFrequenciesVector();

            var mixedCaseCounts = new CharCounters();

            foreach (var lowerChar in lowerCaseCharCounts.Chars())
            {
                var scaledLowerCount = lowerCaseCharCounts.CharCount(lowerChar) * CountScale;
                var scaledUpperCount = (int)Math.Round(upperCaseToLowerCaseFactor * scaledLowerCount);

                // NOTE(review): for characters without a distinct upper-case form,
                // ToUpperInvariant returns the character itself, so both calls below
                // target the same character - confirm this is intended.
                mixedCaseCounts.AddChar(lowerChar, scaledLowerCount);
                mixedCaseCounts.AddChar(char.ToUpperInvariant(lowerChar), scaledUpperCount);
            }

            frequencies = mixedCaseCounts.ToFrequenciesVector();

            // The model alphabet is every non-zero component of the mixed-case vector,
            // converted to a char.
            var alphabet = new HashSet<char>();

            foreach (var component in frequencies.NonZeroComponents())
            {
                alphabet.Add((char)component);
            }

            modelChars = alphabet;
        }
示例#2
0
        /// <summary>
        /// Scores how closely the character frequencies of <paramref name="text"/>
        /// match this model's frequencies.
        /// </summary>
        /// <param name="text">Text to evaluate.</param>
        /// <param name="ignoreCase">
        /// When true, the text is lower-cased (invariant culture) and compared against
        /// the lower-case frequencies; otherwise the mixed-case frequencies are used.
        /// </param>
        /// <param name="applyModelFilter">
        /// When true, only characters contained in the model's character set are
        /// counted; otherwise every character of the text is counted.
        /// </param>
        /// <returns>
        /// <c>(sum - deviation) / sum</c>, where <c>sum</c> is the total of the model's
        /// non-zero entries and <c>deviation</c> is the summed absolute difference
        /// between each of those entries and the text's frequency for the same key.
        /// Negative results are replaced by 0, as is the result for a model without
        /// non-zero entries.
        /// </returns>
        public double GetCompliance(string text, bool ignoreCase, bool applyModelFilter)
        {
            var observedCounts = new CharCounters();
            var normalizedText = ignoreCase ? text.ToLowerInvariant() : text;

            if (!applyModelFilter)
            {
                observedCounts.AddAllChars(normalizedText);
            }
            else
            {
                foreach (var symbol in normalizedText)
                {
                    if (!modelChars.Contains(symbol))
                    {
                        continue;
                    }

                    observedCounts.AddChar(symbol);
                }
            }

            var observedFrequencies = observedCounts.ToFrequenciesVector();
            var referenceFrequencies = ignoreCase ? lowerCaseFrequencies : frequencies;

            double referenceTotal = 0;
            double totalDeviation = 0;

            // Only keys with a non-zero entry in the reference vector take part in the score.
            foreach (var reference in referenceFrequencies.NonZeroEntries())
            {
                var expected = reference.Value;

                totalDeviation += Math.Abs(expected - observedFrequencies.Get(reference.Key));
                referenceTotal += expected;
            }

            var score = (referenceTotal - totalDeviation) / referenceTotal;

            // Written as ">= 0" on purpose: when there are no non-zero entries the
            // division is 0/0 = NaN, which fails this comparison and falls through to 0.
            if (score >= 0)
            {
                return score;
            }

            return 0;
        }