C# (CSharp) TextProcessor HTMLWikiProcessor.ProcessDivHTML Beispiele

Programmiersprache: C# (CSharp)

Namespace / Paketname: TextProcessor

Klasse / Typ: HTMLWikiProcessor

Methode / Funktion: ProcessDivHTML

Beispiele auf hotexamples.com: 2

C# (CSharp) TextProcessor HTMLWikiProcessor.ProcessDivHTML - 2 Beispiele gefunden. Dies sind die am besten bewerteten C# (CSharp) Beispiele für die TextProcessor.HTMLWikiProcessor.ProcessDivHTML, die aus Open Source-Projekten extrahiert wurden. Sie können Beispiele bewerten, um die Qualität der Beispiele zu verbessern.

Häufig verwendete Methoden

Anzeigen Verbergen

LoadDecodedTextClass(1)

ProcessDivHTML(1)

ProcessHTML(1)

Beispiel #1

Datei anzeigen

Datei: Program.cs Projekt: markusmobius/WikiPrepSharp

        /// <summary>
        /// Reads the file named by <c>args[0]</c>, runs it through an
        /// <c>HTMLWikiProcessor</c>, and writes three comma-separated token
        /// files to the working directory: <c>words.txt</c> (tokens after
        /// <c>ProcessHTML</c>), <c>title.txt</c> (title tokens) and
        /// <c>specificdiv.txt</c> (tokens after <c>ProcessDivHTML</c> with the
        /// "articleBody" filters).
        /// </summary>
        /// <param name="args">Command-line arguments; <c>args[0]</c> is the path of the input file.</param>
        static void Main(string[] args)
        {
            // Dispose the reader deterministically; the original never closed it.
            string body;
            using (StreamReader stream = new StreamReader(args[0]))
            {
                body = stream.ReadToEnd();
            }

            MemoryManager mem = new MemoryManager(4000000, 4000000);
            DecodedTextClass content = new DecodedTextClass(mem, true);
            HTMLWikiProcessor textproc = new HTMLWikiProcessor(new HashSet<int>(), false);
            textproc.LoadDecodedTextClass(ref content);
            content.resetDecoder();
            textproc.ProcessHTML(body);

            // 'using' guarantees the file handle is released even if Write throws.
            using (StreamWriter sw = new StreamWriter("words.txt"))
            {
                sw.Write(string.Join(",", content.GetTokens()));
            }

            // if text is an html page, we can extract the title
            using (StreamWriter sw = new StreamWriter("title.txt"))
            {
                sw.Write(string.Join(",", content.GetTitleTokens()));
            }

            // if text is an html page, we can extract text only from within div's with a matching id
            content.resetDecoder(); // need to reset to reuse the DecodedTextClass object
            HashSet<string> divfilters = new HashSet<string>();
            divfilters.Add("id=\"articleBody\"");
            divfilters.Add("class=\"articleBody\"");

            textproc.ProcessDivHTML(body, divfilters);

            // Re-read the tokens after the div pass. The original reused the stale
            // title tokens here, so specificdiv.txt was a copy of title.txt.
            // NOTE(review): assumes GetTokens() exposes the ProcessDivHTML result the
            // same way it does after ProcessHTML - confirm against DecodedTextClass.
            using (StreamWriter sw = new StreamWriter("specificdiv.txt"))
            {
                sw.Write(string.Join(",", content.GetTokens()));
            }
        }

Beispiel #2

Datei anzeigen

Datei: Program.cs Projekt: markusmobius/WikiPrepSharp

        /// <summary>
        /// Loads the file given as the first command-line argument, tokenizes it
        /// with an <c>HTMLWikiProcessor</c>, and emits the results as
        /// comma-joined lists into <c>words.txt</c>, <c>title.txt</c> and
        /// <c>specificdiv.txt</c>.
        /// </summary>
        /// <param name="args">Command-line arguments; <c>args[0]</c> is the input file path.</param>
        static void Main(string[] args)
        {
            string body;

            // The reader is only needed to slurp the file; release it right away.
            using (StreamReader stream = new StreamReader(args[0]))
            {
                body = stream.ReadToEnd();
            }

            MemoryManager     mem      = new MemoryManager(4000000, 4000000);
            DecodedTextClass  content  = new DecodedTextClass(mem, true);
            HTMLWikiProcessor textproc = new HTMLWikiProcessor(new HashSet <int>(), false);

            textproc.LoadDecodedTextClass(ref content);
            content.resetDecoder();
            textproc.ProcessHTML(body);

            string[] tokens = content.GetTokens();

            // Each writer lives in its own 'using' so the handle is closed even on failure.
            using (StreamWriter sw = new StreamWriter("words.txt"))
            {
                sw.Write(string.Join(",", tokens));
            }

            // if text is an html page, we can extract the title
            tokens = content.GetTitleTokens();
            using (StreamWriter sw = new StreamWriter("title.txt"))
            {
                sw.Write(string.Join(",", tokens));
            }

            // if text is an html page, we can extract text only from within div's with a matching id
            content.resetDecoder(); // need to reset to reuse the DecodedTextClass object
            HashSet <string> divfilters = new HashSet <string>();

            divfilters.Add("id=\"articleBody\"");
            divfilters.Add("class=\"articleBody\"");

            textproc.ProcessDivHTML(body, divfilters);

            // Refresh the token array: previously the title tokens from the step
            // above were written again, so the div-filtered output was never saved.
            // NOTE(review): presumes GetTokens() returns the tokens produced by
            // ProcessDivHTML, mirroring its use after ProcessHTML - verify.
            tokens = content.GetTokens();
            using (StreamWriter sw = new StreamWriter("specificdiv.txt"))
            {
                sw.Write(string.Join(",", tokens));
            }
        }