示例#1
0
        /// <summary>
        /// Runs the configured clean-up pipeline over a raw text value and returns the result.
        /// </summary>
        /// <remarks>
        /// Steps are applied in this order, each gated by a setting on this instance:
        /// re-encoding (<c>RecodeInput</c>), <c>HtmlEntity.DeEntitize</c> (always applied),
        /// transliteration (when <c>transliteration_setname</c> is set), stop-word removal
        /// (<c>UseStopWords</c>), <c>ExtractorTools.ValueCleanUp</c> (<c>trimInput</c>) and
        /// no-data wildcard matching (<c>UseNoDataWillCards</c>).
        /// </remarks>
        /// <param name="input">Raw text to process. When <c>isNullOrEmpty()</c> reports true, an empty string is returned immediately.</param>
        /// <param name="SourceEncoding">Encoding used to convert the text into bytes. Re-encoding is skipped when this is null.</param>
        /// <param name="TargetEncoding">Encoding used to decode those bytes back into text. Re-encoding is skipped when this is null.</param>
        /// <returns>
        /// The processed text, or an empty string when the input is null/empty or the
        /// processed value is exactly equal to one of the <c>NoDataWillCards</c> entries.
        /// </returns>
        public String ProcessInput(String input, Encoding SourceEncoding, Encoding TargetEncoding)
        {
            String nv = input;

            if (nv.isNullOrEmpty())
            {
                return "";
            }

            // Re-interpret the text: encode with the source encoding, decode with the target one.
            if (RecodeInput && (SourceEncoding != null) && (TargetEncoding != null))
            {
                Byte[] bytes = SourceEncoding.GetBytes(nv);
                nv = TargetEncoding.GetString(bytes);
            }

            nv = HtmlEntity.DeEntitize(nv);

            if (!transliteration_setname.isNullOrEmpty())
            {
                nv = imbNLP.Transliteration.transliterationTool.transliterate(nv, transliteration_setname);
            }

            if (UseStopWords)
            {
                foreach (String wc in StopWords)
                {
                    // String.Replace throws on a null or zero-length search string, so a single
                    // blank entry in the stop-word list must not abort the whole pipeline.
                    if (String.IsNullOrEmpty(wc))
                    {
                        continue;
                    }

                    nv = nv.Replace(wc, "");
                }
            }

            if (trimInput)
            {
                nv = ExtractorTools.ValueCleanUp(nv, preserve_newlines);
            }

            if (UseNoDataWillCards)
            {
                foreach (String wc in NoDataWillCards)
                {
                    // Only an exact, whole-value match counts as "no data".
                    if (nv == wc)
                    {
                        nv = "";
                        break; // further comparisons cannot change the (already empty) result
                    }
                }
            }

            return nv;
        }
示例#2
0
        //public reportExpandedData ExtractorCustomizationSettings { get; set; } = new reportExpandedData();

        /// <summary>
        /// Applies the supplied customization data to this instance by delegating to
        /// <c>ExtractorTools.SetSettingsFromData</c>.
        /// </summary>
        /// <param name="ExtractorCustomizationSettings">Customization data handed to <c>ExtractorTools.SetSettingsFromData</c> together with this instance.</param>
        public virtual void DeployCustomizationSettings(reportExpandedData ExtractorCustomizationSettings)
            => ExtractorTools.SetSettingsFromData(this, ExtractorCustomizationSettings);