C# (CSharp) document_parser DocumentParser示例

编程语言: C# (CSharp)

命名空间/包名称: document_parser

类/类型: DocumentParser

hotexamples.com的示例: 2

C# (CSharp) document_parser DocumentParser - 已找到2个示例。这些是从开源项目中提取的、评价最高的 document_parser.DocumentParser 真实 C# (CSharp) 示例。您可以对示例进行评价，以帮助我们提高示例质量。

常用方法

显示隐藏

CheckDocumentValidityAfterMetaData(1)

InitForParsing(1)

ParseMetaData(1)

SetGutenbergId(1)

示例#1

显示文件

        /// <summary>
        /// Builds a <see cref="DocumentParser"/> from an in-memory phrase: the phrase is
        /// annotated through <c>StanfordPipelineService</c>, wrapped in a parser, and the
        /// parser is initialized via <c>InitForParsing</c>.
        /// </summary>
        /// <param name="phrase">The text to annotate. Must be non-null and non-empty.</param>
        /// <returns>
        /// The initialized parser, or <c>null</c> when the pipeline service returns no
        /// annotated document.
        /// </returns>
        /// <exception cref="ArgumentNullException"><paramref name="phrase"/> is null.</exception>
        /// <exception cref="ArgumentException"><paramref name="phrase"/> is empty.</exception>
        /// <exception cref="InvalidOperationException">
        /// The Stanford service could not be verified as initialized, or
        /// <c>InitForParsing</c> reported failure.
        /// </exception>
        public static DocumentParser FromPhrase(string phrase)
        {
            // Reject null explicitly; previously this surfaced as a NullReferenceException
            // from the Length access below.
            if (phrase == null)
            {
                throw new ArgumentNullException("phrase");
            }

            if (phrase.Length == 0)
            {
                throw new ArgumentException("The phrase is empty!", "phrase");
            }

            // make sure CoreNLP is initialized
            if (!VerifyStanfordServiceIsInitialized())
            {
                throw new InvalidOperationException("Failed to initialize CoreNLP!");
            }

            StanfordDocumentFacade doc =
                StanfordPipelineService.Instance.Annotate(phrase);

            // No annotated document is reported to the caller as null, not as an error.
            if (doc == null)
            {
                return null;
            }

            DocumentParser docParser = new DocumentParser(doc);

            if (!docParser.InitForParsing())
            {
                throw new InvalidOperationException("Empty phrase?!");
            }

            // #fromphrase
            // Record that this parser was built from a phrase, not from a file.
            docParser._fromFile = false;

            return docParser;
        }

示例#2

显示文件

        //--------------------------------------------------------------------------
        /// <summary>
        /// This is how you construct a new DocumentParser from a document file: the file
        /// is annotated through <c>StanfordPipelineService</c>, then the parser's metadata
        /// is parsed, the document is validated, and the Gutenberg id is set from the file.
        /// </summary>
        /// <param name="file">The document file to annotate. Must be non-null and exist.</param>
        /// <returns>
        /// The prepared parser, or <c>null</c> when the pipeline service returns no
        /// annotated document.
        /// </returns>
        /// <exception cref="ArgumentNullException"><paramref name="file"/> is null.</exception>
        /// <exception cref="FileNotFoundException">The file does not exist.</exception>
        /// <exception cref="InvalidDataException">
        /// <c>ParseMetaData</c> or <c>CheckDocumentValidityAfterMetaData</c> reported failure.
        /// </exception>
        /// <exception cref="InvalidOperationException">
        /// The Stanford service could not be verified as initialized, or
        /// <c>SetGutenbergId</c> reported failure.
        /// </exception>
        public static DocumentParser FromFile(FileInfo file)
        {
            // Reject null explicitly; previously this surfaced as a NullReferenceException
            // from the Exists access below.
            if (file == null)
            {
                throw new ArgumentNullException("file");
            }

            if (!file.Exists)
            {
                throw new FileNotFoundException(
                          "The document file doesn't exist!", file.FullName);
            }

            // make sure CoreNLP is initialized
            if (!VerifyStanfordServiceIsInitialized())
            {
                throw new InvalidOperationException("Failed to initialize CoreNLP!");
            }

            StanfordDocumentFacade doc =
                StanfordPipelineService.Instance.Annotate(file);

            // No annotated document is reported to the caller as null, not as an error.
            if (doc == null)
            {
                return null;
            }

            DocumentParser docParser = new DocumentParser(doc);

            if (!docParser.ParseMetaData())
            {
                throw new InvalidDataException("Failed to get document's start mark!");
            }

            if (!docParser.CheckDocumentValidityAfterMetaData())
            {
                throw new InvalidDataException(
                          "The document is invalid - either no content or no end mark!");
            }

            if (!docParser.SetGutenbergId(file))
            {
                throw new InvalidOperationException("Failed setting Gutenberg Id!");
            }

            // Record that this parser was built from a file.
            docParser._fromFile = true;

            return docParser;
        }