C# (CSharp) Docodo WebDataSource.FromHtml示例

编程语言: C# (CSharp)

命名空间/包名称: Docodo

类/类型: WebDataSource

方法/功能: FromHtml

hotexamples.com的示例: 2

C# (CSharp) Docodo WebDataSource.FromHtml - 共找到2个示例。以下是从开源项目中提取的、评价最高的 Docodo.WebDataSource.FromHtml 真实 C# (CSharp) 示例。您可以为示例评分，以帮助我们提高示例质量。

常用方法

显示隐藏

FromHtml(2)

FromUrl(1)

示例#1

显示文件

        /// <summary>
        /// Creates an index document for <paramref name="file"/>, choosing the
        /// document type from the file name extension (case-insensitive).
        /// </summary>
        /// <param name="file">Path of the file to wrap.</param>
        /// <param name="parent">Data source the document belongs to; its Name is passed to the HTML parser.</param>
        /// <returns>
        /// A document for .pdf, .txt, .htm and .html files; <c>null</c> for any other extension.
        /// </returns>
        public static IIndexDocument FromFile(string file, IIndexDataSource parent)
        {
            // Ordinal, case-insensitive comparison avoids culture-dependent lowercasing
            // and an extra string allocation.
            const System.StringComparison IgnoreCase = System.StringComparison.OrdinalIgnoreCase;

            if (file.EndsWith(".pdf", IgnoreCase))
            {
                return new IndexPDFDocument(file, parent);
            }

            if (file.EndsWith(".txt", IgnoreCase))
            {
                return new IndexedTextFile(file, parent);
            }

            // The original tested ".html" twice; the second test was evidently meant to be ".htm".
            if (file.EndsWith(".htm", IgnoreCase) || file.EndsWith(".html", IgnoreCase))
            {
                // NOTE(review): the stream is closed as soon as FromHtml returns, so this
                // assumes FromHtml consumes the stream eagerly - confirm against WebDataSource.
                using (FileStream fs = File.OpenRead(file))
                {
                    return WebDataSource.FromHtml(fs, file, parent.Name);
                }
            }

            return null;
        }

示例#2

显示文件

文件： DBDataSource.cs 项目： alexarchen/Docodo

        /// <summary>
        /// Adds a document from a BLOB: sniffs the content type from the leading bytes of
        /// <paramref name="stream"/> (PDF signature, HTML marker, otherwise charset-detected
        /// text), builds the matching document and enqueues it.
        /// </summary>
        /// <param name="name">Record name, passed on to the created document.</param>
        /// <param name="stream">Record content; must be seekable because it is rewound to the start after sniffing.</param>
        /// <param name="fields">Optional header fields to attach to the document; may be <c>null</c>.</param>
        /// <param name="queue">Queue handed to Enqueue together with the created document.</param>
        /// <exception cref="InvalidDataException">The index type of this data source is not <c>IndexType.Blob</c>.</exception>
        public virtual void AddRecord(string name, Stream stream, string fields, ConcurrentQueue <IIndexDocument> queue)
        {
            IIndexDocument doc = null;

            AddRecordBase(name, fields);

            // The original "(== File) || (!= Blob)" test reduces to exactly this.
            if (indexType != IndexType.Blob)
            {
                throw new InvalidDataException("Adding record of wrong IndexType");
            }

            // Read the sniffing prefix straight from the stream. Wrapping it in a BinaryReader
            // and disposing that reader would also close the stream, which is still needed below.
            byte[] buff = new byte[4000];
            int    read = 0;
            while (read < buff.Length)
            {
                int got = stream.Read(buff, read, buff.Length - read);
                if (got <= 0)
                {
                    break;
                }
                read += got;
            }

            // Decode only the bytes actually read, not the zero-filled tail of the buffer.
            string det = Encoding.UTF8.GetString(buff, 0, read);

            stream.Seek(0, SeekOrigin.Begin);

            // detect type
            if ((read >= 4) && (buff[0] == '%') && (buff[1] == 'P') && (buff[2] == 'D') && (buff[3] == 'F'))
            {
                DocumentsDataSource.IndexPDFDocument pdf = new DocumentsDataSource.IndexPDFDocument(name, stream, this);
                if (fields != null)
                {
                    pdf.headers = () => fields;
                }
                doc = pdf;
            }
            else if (det.IndexOf("<html", StringComparison.OrdinalIgnoreCase) >= 0)
            {
                IndexPagedTextFile file = WebDataSource.FromHtml(stream, name, Name);
                if (fields != null)
                {
                    file.SetHeaders(fields);
                }
                // Previously the parsed HTML document was dropped and never enqueued.
                doc = file;
            }
            else
            {
                // detect charset
                Ude.CharsetDetector detector = new Ude.CharsetDetector();
                detector.Feed(buff, 0, read);
                detector.DataEnd();
                if (detector.Charset != null)
                {
                    Encoding enc = Portable.Text.Encoding.GetEncoding(detector.Charset);
                    using (StreamReader sreader = new StreamReader(stream, enc, false))
                    {
                        doc = new IndexPagedTextFile("", sreader.ReadToEnd(), fields != null ? fields : "");
                    }
                }
            }

            if (doc != null)
            {
                Enqueue(queue, doc);
            }
        }