Example #1
0
        /// <summary>
        /// Loads the page at <c>contentrevision.Content.Contents_URL</c> through <c>webGetutf</c> and
        /// fills the revision's text, HTML and image list from the <c>div</c> whose class is
        /// <c>view_content</c>.
        /// </summary>
        /// <param name="contentrevision">Revision to populate; it is mutated in place.</param>
        /// <remarks>
        /// Outcomes:
        /// <list type="bullet">
        /// <item>No <c>view_content</c> element, or an <see cref="ArgumentNullException"/> during the
        /// attempt: <c>isDepricate</c> is set to <c>true</c> and the method returns.</item>
        /// <item><see cref="UriFormatException"/>: the method returns with whatever was populated so far.</item>
        /// <item>Any other exception: the whole load/parse is retried, at most <c>maxAttempts</c> times
        /// in total; after the last failure the error is written to the console and the method returns
        /// without throwing.</item>
        /// </list>
        /// Images whose <c>src</c> is missing or is not an absolute URI are skipped.
        /// </remarks>
        protected override void ParseContent(ContentRevisionDTO contentrevision)
        {
            // Upper bound on attempts. The earlier version retried by calling itself from
            // catch (Exception), so a failure that repeats on every attempt ended in a stack overflow.
            const int maxAttempts = 3;

            for (var attempt = 1; attempt <= maxAttempts; attempt++)
            {
                try
                {
                    var loadedContent = webGetutf.Load(contentrevision.Content.Contents_URL);

                    // NOTE(review): an earlier, never-enabled draft looked for the text
                    // "해당 게시물이 존재하지 않습니다." inside div.whole_box to detect removed posts.

                    // SelectNodes yields null (not an empty list) when nothing matches; a missing
                    // article container is treated as a removed post.
                    var contentNodes = loadedContent.DocumentNode.SelectNodes("//div[@class = 'view_content']");
                    if (contentNodes == null)
                    {
                        contentrevision.isDepricate = true;
                        return;
                    }

                    // SingleOrDefault throws when more than one container matches; that case goes
                    // through the bounded retry below.
                    var articlecontent = contentNodes.SingleOrDefault();
                    contentrevision.Details      = articlecontent.InnerText.Trim();
                    contentrevision.Details_Html = articlecontent.InnerHtml.Trim();
                    contentrevision.isDepricate  = false;

                    contentrevision.SrcDatas = new List<SrcdataDTO>();

                    var imgnodes = articlecontent.SelectNodes(".//img");
                    if (imgnodes == null)
                    {
                        return;
                    }

                    foreach (var img in imgnodes)
                    {
                        // Skip just this image when src is absent or relative, instead of letting a
                        // UriFormatException abandon every image that follows it.
                        Uri srcurl;
                        if (!Uri.TryCreate(img.GetAttributeValue("src", "default"), UriKind.Absolute, out srcurl))
                        {
                            continue;
                        }

                        var srcdata = new SrcdataDTO
                        {
                            SourceUrl    = srcurl.AbsoluteUri,
                            IsDepricated = false,
                            FileName     = System.IO.Path.GetFileName(srcurl.LocalPath),
                            SrcGuId      = Guid.NewGuid(),
                        };

                        // NOTE(review): Details_Html was captured above, so this attribute is not part
                        // of the stored HTML - confirm whether that is intended.
                        img.SetAttributeValue("guid", srcdata.SrcGuId.ToString());

                        contentrevision.SrcDatas.Add(srcdata);
                    }

                    return;
                }
                catch (ArgumentNullException)
                {
                    contentrevision.isDepricate = true;
                    return;
                }
                catch (UriFormatException)
                {
                    return;
                }
                catch (Exception e)
                {
                    if (attempt == maxAttempts)
                    {
                        Console.WriteLine("ParseContent failed after " + maxAttempts + " attempts: " + e.Message);
                        return;
                    }

                    Console.WriteLine("ReStart");
                }
            }
        }
Example #2
0
        // Original author's note: function that breaks details_html apart.
        /// <summary>
        /// Loads the page at <c>contentrevision.Content.Contents_URL</c> through <c>webGetutf</c> and
        /// fills the revision's text, HTML and image list from the last element whose id is
        /// <c>copy_layer_1</c>.
        /// </summary>
        /// <param name="contentrevision">Revision to populate; it is mutated in place.</param>
        /// <remarks>
        /// Outcomes:
        /// <list type="bullet">
        /// <item>The first <c>li.hx_cate</c> element reads "삭제된 글입니다.", no <c>copy_layer_1</c>
        /// element exists, or an <see cref="ArgumentNullException"/> is raised: <c>isDepricate</c> is
        /// set to <c>true</c> and the method returns.</item>
        /// <item><see cref="UriFormatException"/>: the method returns with whatever was populated so far.</item>
        /// <item>Any other exception: the whole load/parse is retried, at most <c>maxAttempts</c> times
        /// in total; after the last failure the error is written to the console and the method returns
        /// without throwing.</item>
        /// </list>
        /// Images whose <c>src</c> is missing or is not an absolute URI are skipped.
        /// </remarks>
        protected override void ParseContent(ContentRevisionDTO contentrevision)
        {
            // Upper bound on attempts. The earlier version retried by calling itself from
            // catch (Exception), so a failure that repeats on every attempt ended in a stack overflow.
            const int maxAttempts = 3;

            for (var attempt = 1; attempt <= maxAttempts; attempt++)
            {
                try
                {
                    var loadedContent = webGetutf.Load(contentrevision.Content.Contents_URL);

                    // The site shows this exact text in li.hx_cate for a deleted post.
                    var markerNodes   = loadedContent.DocumentNode.SelectNodes("//li[@class = 'hx_cate']");
                    var deletedMarker = markerNodes == null ? null : markerNodes.FirstOrDefault();
                    if (deletedMarker != null && deletedMarker.InnerText.Trim() == "삭제된 글입니다.")
                    {
                        contentrevision.isDepricate = true;
                        return;
                    }

                    // SelectNodes yields null (not an empty list) when nothing matches; a missing
                    // article container is treated as a removed post.
                    var contentNodes = loadedContent.DocumentNode.SelectNodes("//div[@id = 'copy_layer_1']");
                    if (contentNodes == null)
                    {
                        contentrevision.isDepricate = true;
                        return;
                    }

                    var articlecontent = contentNodes.LastOrDefault();
                    contentrevision.Details      = articlecontent.InnerText.Trim();
                    contentrevision.Details_Html = articlecontent.InnerHtml.Trim();
                    contentrevision.isDepricate  = false;

                    contentrevision.SrcDatas = new List<SrcdataDTO>();

                    var imgnodes = articlecontent.SelectNodes(".//img");
                    if (imgnodes == null)
                    {
                        return;
                    }

                    foreach (var img in imgnodes)
                    {
                        // Skip just this image when src is absent or relative, instead of letting a
                        // UriFormatException abandon every image that follows it.
                        Uri srcurl;
                        if (!Uri.TryCreate(img.GetAttributeValue("src", "default"), UriKind.Absolute, out srcurl))
                        {
                            continue;
                        }

                        var srcdata = new SrcdataDTO
                        {
                            SourceUrl    = srcurl.AbsoluteUri,
                            IsDepricated = false,
                            FileName     = System.IO.Path.GetFileName(srcurl.LocalPath),
                            SrcGuId      = Guid.NewGuid(),
                        };

                        // NOTE(review): Details_Html was captured above, so this attribute is not part
                        // of the stored HTML - confirm whether that is intended.
                        img.SetAttributeValue("guid", srcdata.SrcGuId.ToString());

                        contentrevision.SrcDatas.Add(srcdata);
                    }

                    return;
                }
                catch (ArgumentNullException)
                {
                    contentrevision.isDepricate = true;
                    return;
                }
                catch (UriFormatException)
                {
                    return;
                }
                catch (Exception e)
                {
                    if (attempt == maxAttempts)
                    {
                        Console.WriteLine("ParseContent failed after " + maxAttempts + " attempts: " + e.Message);
                        return;
                    }

                    Console.WriteLine("ReStart");
                }
            }
        }
Example #3
0
        // Original author's note: function that fetches the content text and html.
        /// <summary>
        /// Loads the page at <c>contentrevision.Content.Contents_URL</c> through <c>webGetutf</c>,
        /// empties every <c>style</c> element under the first <c>div</c> whose id is <c>body_frame</c>,
        /// and fills the revision's text, HTML and image list from that element.
        /// </summary>
        /// <param name="contentrevision">Revision to populate; it is mutated in place.</param>
        /// <remarks>
        /// Outcomes:
        /// <list type="bullet">
        /// <item>No <c>body_frame</c> element, or an <see cref="ArgumentNullException"/> during the
        /// attempt: <c>isDepricate</c> is set to <c>true</c> and the method returns.</item>
        /// <item><see cref="UriFormatException"/>: the method returns with whatever was populated so far.</item>
        /// <item>Any other exception: the whole load/parse is retried, at most <c>maxAttempts</c> times
        /// in total; after the last failure the error is written to the console and the method returns
        /// without throwing.</item>
        /// </list>
        /// Images whose <c>src</c> is missing or is not an absolute URI are skipped.
        /// </remarks>
        protected override void ParseContent(ContentRevisionDTO contentrevision)
        {
            // Upper bound on attempts. The earlier version retried by calling itself from
            // catch (Exception), so a failure that repeats on every attempt ended in a stack overflow.
            const int maxAttempts = 3;

            for (var attempt = 1; attempt <= maxAttempts; attempt++)
            {
                try
                {
                    var loadedContent = webGetutf.Load(contentrevision.Content.Contents_URL);

                    // SelectNodes yields null (not an empty list) when nothing matches; a missing
                    // article container is treated as a removed post.
                    var contentNodes = loadedContent.DocumentNode.SelectNodes("//div[@id = 'body_frame']");
                    if (contentNodes == null)
                    {
                        contentrevision.isDepricate = true;
                        return;
                    }

                    var articlecontent = contentNodes.FirstOrDefault();

                    // Snapshot the style nodes first so the tree is not modified while Descendants()
                    // is still being enumerated.
                    var styleNodes = articlecontent.Descendants().Where(node => node.Name == "style").ToList();
                    foreach (var styleNode in styleNodes)
                    {
                        styleNode.InnerHtml = "";
                    }

                    contentrevision.Details      = articlecontent.InnerText.Trim();
                    contentrevision.Details_Html = articlecontent.InnerHtml.Trim();
                    contentrevision.isDepricate  = false;

                    contentrevision.SrcDatas = new List<SrcdataDTO>();

                    // "./img" matches only img elements that are direct children of body_frame.
                    // NOTE(review): nested images are not collected - confirm this is intended.
                    var imgnodes = articlecontent.SelectNodes("./img");
                    if (imgnodes == null)
                    {
                        return;
                    }

                    foreach (var img in imgnodes)
                    {
                        // Skip just this image when src is absent or relative, instead of letting a
                        // UriFormatException abandon every image that follows it.
                        Uri srcurl;
                        if (!Uri.TryCreate(img.GetAttributeValue("src", "default"), UriKind.Absolute, out srcurl))
                        {
                            continue;
                        }

                        var srcdata = new SrcdataDTO
                        {
                            SourceUrl    = srcurl.AbsoluteUri,
                            IsDepricated = false,
                            FileName     = System.IO.Path.GetFileName(srcurl.LocalPath),
                            SrcGuId      = Guid.NewGuid(),
                        };

                        // NOTE(review): Details_Html was captured above, so this attribute is not part
                        // of the stored HTML - confirm whether that is intended.
                        img.SetAttributeValue("guid", srcdata.SrcGuId.ToString());

                        contentrevision.SrcDatas.Add(srcdata);
                    }

                    return;
                }
                catch (ArgumentNullException)
                {
                    contentrevision.isDepricate = true;
                    return;
                }
                catch (UriFormatException)
                {
                    return;
                }
                catch (Exception e)
                {
                    if (attempt == maxAttempts)
                    {
                        Console.WriteLine("ParseContent failed after " + maxAttempts + " attempts: " + e.Message);
                        return;
                    }

                    Console.WriteLine("ReStart");
                }
            }
        }
Example #4
0
        /// <summary>
        /// Loads the page at <c>contentrevision.Content.Contents_URL</c> through <c>webGetutf</c> and
        /// fills the revision's text, HTML and image list from the first <c>div</c> whose id is
        /// <c>pann-content</c>.
        /// </summary>
        /// <param name="contentrevision">Revision to populate; it is mutated in place.</param>
        /// <remarks>
        /// Outcomes:
        /// <list type="bullet">
        /// <item>No <c>pann-content</c> element, or an <see cref="ArgumentNullException"/> during the
        /// attempt: <c>isDepricate</c> is set to <c>true</c> and the method returns.</item>
        /// <item><see cref="UriFormatException"/>: the method returns with whatever was populated so far.</item>
        /// <item><see cref="WebException"/>: the failure is written to the console and the method
        /// returns without retrying.</item>
        /// <item>Any other exception: the whole load/parse is retried, at most <c>maxAttempts</c> times
        /// in total; after the last failure the error is written to the console and the method returns
        /// without throwing.</item>
        /// </list>
        /// Images whose <c>src</c> is missing or is not an absolute URI are skipped.
        /// </remarks>
        protected override void ParseContent(ContentRevisionDTO contentrevision)
        {
            // Upper bound on attempts. The earlier version retried by calling itself from
            // catch (Exception), so a failure that repeats on every attempt ended in a stack overflow.
            const int maxAttempts = 3;

            for (var attempt = 1; attempt <= maxAttempts; attempt++)
            {
                try
                {
                    var loadedContent = webGetutf.Load(contentrevision.Content.Contents_URL);

                    // SelectNodes yields null (not an empty list) when nothing matches; a missing
                    // article container is treated as a removed post.
                    var contentNodes = loadedContent.DocumentNode.SelectNodes("//div[@id = 'pann-content']");
                    if (contentNodes == null)
                    {
                        contentrevision.isDepricate = true;
                        return;
                    }

                    var articlecontent = contentNodes.FirstOrDefault();
                    contentrevision.Details      = articlecontent.InnerText.Trim();
                    contentrevision.Details_Html = articlecontent.InnerHtml.Trim();
                    contentrevision.isDepricate  = false;

                    contentrevision.SrcDatas = new List<SrcdataDTO>();

                    var imgnodes = articlecontent.SelectNodes(".//img");
                    if (imgnodes == null)
                    {
                        return;
                    }

                    foreach (var img in imgnodes)
                    {
                        // Skip just this image when src is absent or relative, instead of letting a
                        // UriFormatException abandon every image that follows it.
                        Uri srcurl;
                        if (!Uri.TryCreate(img.GetAttributeValue("src", "default"), UriKind.Absolute, out srcurl))
                        {
                            continue;
                        }

                        var srcdata = new SrcdataDTO
                        {
                            SourceUrl    = srcurl.AbsoluteUri,
                            IsDepricated = false,
                            FileName     = System.IO.Path.GetFileName(srcurl.LocalPath),
                            SrcGuId      = Guid.NewGuid(),
                        };

                        // NOTE(review): Details_Html was captured above, so this attribute is not part
                        // of the stored HTML - confirm whether that is intended.
                        img.SetAttributeValue("guid", srcdata.SrcGuId.ToString());

                        contentrevision.SrcDatas.Add(srcdata);
                    }

                    return;
                }
                catch (ArgumentNullException)
                {
                    contentrevision.isDepricate = true;
                    return;
                }
                catch (UriFormatException)
                {
                    return;
                }
                catch (WebException wex)
                {
                    // Response is null when no HTTP response was received at all, so it must not be
                    // cast and dereferenced blindly: an exception thrown inside this handler would
                    // escape the method.
                    var response = wex.Response as HttpWebResponse;
                    var reason   = response != null ? response.StatusCode.ToString() : wex.Status.ToString();

                    // TODO: the original left a placeholder for dedicated 404 (HttpStatusCode.NotFound)
                    // handling; none is defined yet, so every web failure is only reported.
                    Console.WriteLine("ParseContent request failed: " + reason);
                    return;
                }
                catch (Exception e)
                {
                    if (attempt == maxAttempts)
                    {
                        Console.WriteLine("ParseContent failed after " + maxAttempts + " attempts: " + e.Message);
                        return;
                    }

                    Console.WriteLine("ReStart");
                }
            }
        }
Example #5
0
        /// <summary>
        /// Loads the page at <c>contentrevision.Content.Contents_URL</c> through <c>webGetkr</c> and
        /// fills the revision's text, HTML and image list from the <c>div</c> whose id is
        /// <c>DocContent</c>.
        /// </summary>
        /// <param name="contentrevision">Revision to populate; it is mutated in place.</param>
        /// <remarks>
        /// Outcomes:
        /// <list type="bullet">
        /// <item>The first <c>td.te2</c> element reads "이미 삭제 된 게시글 입니다.", no <c>DocContent</c>
        /// element exists, or an <see cref="ArgumentNullException"/> is raised: <c>isDepricate</c> is
        /// set to <c>true</c> and the method returns.</item>
        /// <item><see cref="UriFormatException"/>: the method returns with whatever was populated so far.</item>
        /// <item>Any other exception: the whole load/parse is retried, at most <c>maxAttempts</c> times
        /// in total; after the last failure the error is written to the console and the method returns
        /// without throwing.</item>
        /// </list>
        /// Images whose <c>src</c> is missing or is not an absolute URI are skipped.
        /// </remarks>
        protected override void ParseContent(ContentRevisionDTO contentrevision)
        {
            // Upper bound on attempts. The earlier version retried by calling itself from
            // catch (Exception), so a failure that repeats on every attempt ended in a stack overflow.
            const int maxAttempts = 3;

            for (var attempt = 1; attempt <= maxAttempts; attempt++)
            {
                try
                {
                    var ruiwebContents = webGetkr.Load(contentrevision.Content.Contents_URL);

                    // The site shows this exact text in td.te2 for a deleted post.
                    var markerNodes   = ruiwebContents.DocumentNode.SelectNodes("//td[@class = 'te2']");
                    var deletedMarker = markerNodes == null ? null : markerNodes.FirstOrDefault();
                    if (deletedMarker != null && deletedMarker.InnerText.Trim() == "이미 삭제 된 게시글 입니다.")
                    {
                        contentrevision.isDepricate = true;
                        return;
                    }

                    // SelectNodes yields null (not an empty list) when nothing matches; a missing
                    // article container is treated as a removed post.
                    var contentNodes = ruiwebContents.DocumentNode.SelectNodes("//div[@id = 'DocContent']");
                    if (contentNodes == null)
                    {
                        contentrevision.isDepricate = true;
                        return;
                    }

                    // SingleOrDefault throws when more than one container matches; that case goes
                    // through the bounded retry below.
                    var content = contentNodes.SingleOrDefault();
                    contentrevision.Details = content.InnerText.Trim();
                    contentrevision.Details_Html = content.InnerHtml.Trim();
                    contentrevision.isDepricate = false;

                    contentrevision.SrcDatas = new List<SrcdataDTO>();

                    var imgnodes = content.SelectNodes(".//img");
                    if (imgnodes == null)
                    {
                        return;
                    }

                    foreach (var img in imgnodes)
                    {
                        // Skip just this image when src is absent or relative, instead of letting a
                        // UriFormatException abandon every image that follows it.
                        Uri srcurl;
                        if (!Uri.TryCreate(img.GetAttributeValue("src", "default"), UriKind.Absolute, out srcurl))
                        {
                            continue;
                        }

                        var srcdata = new SrcdataDTO
                        {
                            SourceUrl = srcurl.AbsoluteUri,
                            IsDepricated = false,
                            FileName = System.IO.Path.GetFileName(srcurl.LocalPath),
                            SrcGuId = Guid.NewGuid(),
                        };

                        // NOTE(review): Details_Html was captured above, so this attribute is not part
                        // of the stored HTML - confirm whether that is intended.
                        img.SetAttributeValue("guid", srcdata.SrcGuId.ToString());

                        contentrevision.SrcDatas.Add(srcdata);
                    }

                    return;
                }
                catch (ArgumentNullException)
                {
                    contentrevision.isDepricate = true;
                    return;
                }
                catch (UriFormatException)
                {
                    return;
                }
                catch (Exception e)
                {
                    if (attempt == maxAttempts)
                    {
                        Console.WriteLine("ParseContent failed after " + maxAttempts + " attempts: " + e.Message);
                        return;
                    }

                    Console.WriteLine("ReStart");
                }
            }
        }