/// <summary>
/// Loads the page at <c>contentrevision.Content.Contents_URL</c> through <c>webGetutf</c>,
/// copies the text and HTML of its <c>div[@class = 'view_content']</c> element into the
/// revision, and records one <see cref="SrcdataDTO"/> per image found inside that element.
/// </summary>
/// <param name="contentrevision">
/// Revision to populate. On success <c>Details</c>, <c>Details_Html</c>, <c>SrcDatas</c> are
/// set and <c>isDepricate</c> is false. When the content container is missing,
/// <c>isDepricate</c> is set to true and nothing else is written.
/// </param>
/// <remarks>
/// Unexpected failures are retried a bounded number of times; after the last attempt the
/// error is written to the console and the method returns without throwing.
/// </remarks>
protected override void ParseContent(ContentRevisionDTO contentrevision)
{
    // Retries are bounded so that a failure which never clears cannot retry forever.
    const int maxAttempts = 3;

    for (int attempt = 1; attempt <= maxAttempts; attempt++)
    {
        try
        {
            var loadedContent = webGetutf.Load(contentrevision.Content.Contents_URL);

            // SelectNodes yields null when nothing matches; a page without the content
            // container is treated as a deprecated (removed) post.
            var matches = loadedContent.DocumentNode.SelectNodes("//div[@class = 'view_content']");
            var articlecontent = matches == null ? null : matches.SingleOrDefault();
            if (articlecontent == null)
            {
                contentrevision.isDepricate = true;
                return;
            }

            contentrevision.Details = articlecontent.InnerText.Trim();
            contentrevision.Details_Html = articlecontent.InnerHtml.Trim();
            contentrevision.isDepricate = false;

            var imgnodes = articlecontent.SelectNodes(".//img");
            contentrevision.SrcDatas = new List<SrcdataDTO>();
            if (imgnodes == null)
            {
                return;
            }

            foreach (var img in imgnodes)
            {
                // Skip images whose src is missing or not an absolute URL instead of
                // abandoning every image that follows.
                Uri srcurl;
                if (!Uri.TryCreate(img.GetAttributeValue("src", "default"), UriKind.Absolute, out srcurl))
                {
                    continue;
                }

                var srcdata = new SrcdataDTO
                {
                    SourceUrl = srcurl.AbsoluteUri,
                    IsDepricated = false,
                    FileName = System.IO.Path.GetFileName(srcurl.LocalPath),
                    SrcGuId = Guid.NewGuid(),
                };

                // NOTE(review): Details_Html was captured above, so this attribute is not
                // part of the stored HTML - confirm whether that is intended.
                img.SetAttributeValue("guid", srcdata.SrcGuId.ToString());
                contentrevision.SrcDatas.Add(srcdata);
            }

            return;
        }
        catch (ArgumentNullException)
        {
            contentrevision.isDepricate = true;
            return;
        }
        catch (UriFormatException)
        {
            return;
        }
        catch (Exception e)
        {
            if (attempt < maxAttempts)
            {
                Console.WriteLine("ReStart");
            }
            else
            {
                Console.WriteLine("ParseContent gave up after " + maxAttempts + " attempts: " + e);
            }
        }
    }
}
/// <summary>
/// Loads the page at <c>contentrevision.Content.Contents_URL</c> through <c>webGetutf</c>,
/// copies the text and HTML of the last <c>div[@id = 'copy_layer_1']</c> element into the
/// revision, and records one <see cref="SrcdataDTO"/> per image found inside that element.
/// </summary>
/// <param name="contentrevision">
/// Revision to populate. On success <c>Details</c>, <c>Details_Html</c>, <c>SrcDatas</c> are
/// set and <c>isDepricate</c> is false. When the page shows the deleted-post notice or the
/// content container is missing, <c>isDepricate</c> is set to true and nothing else is written.
/// </param>
/// <remarks>
/// Unexpected failures are retried a bounded number of times; after the last attempt the
/// error is written to the console and the method returns without throwing.
/// </remarks>
protected override void ParseContent(ContentRevisionDTO contentrevision)
{
    // Retries are bounded so that a failure which never clears cannot retry forever.
    const int maxAttempts = 3;

    for (int attempt = 1; attempt <= maxAttempts; attempt++)
    {
        try
        {
            var loadedContent = webGetutf.Load(contentrevision.Content.Contents_URL);

            // The first li.hx_cate carries the "deleted post" notice on removed articles.
            var checkifdeprecated = loadedContent.DocumentNode.SelectNodes("//li[@class = 'hx_cate']");
            var notice = checkifdeprecated == null ? null : checkifdeprecated.FirstOrDefault();
            if (notice != null && notice.InnerText.Trim() == "삭제된 글입니다.")
            {
                contentrevision.isDepricate = true;
                return;
            }

            // SelectNodes yields null when nothing matches; a page without the content
            // container is treated as a deprecated (removed) post.
            var matches = loadedContent.DocumentNode.SelectNodes("//div[@id = 'copy_layer_1']");
            var articlecontent = matches == null ? null : matches.LastOrDefault();
            if (articlecontent == null)
            {
                contentrevision.isDepricate = true;
                return;
            }

            contentrevision.Details = articlecontent.InnerText.Trim();
            contentrevision.Details_Html = articlecontent.InnerHtml.Trim();
            contentrevision.isDepricate = false;

            var imgnodes = articlecontent.SelectNodes(".//img");
            contentrevision.SrcDatas = new List<SrcdataDTO>();
            if (imgnodes == null)
            {
                return;
            }

            foreach (var img in imgnodes)
            {
                // Skip images whose src is missing or not an absolute URL instead of
                // abandoning every image that follows.
                Uri srcurl;
                if (!Uri.TryCreate(img.GetAttributeValue("src", "default"), UriKind.Absolute, out srcurl))
                {
                    continue;
                }

                var srcdata = new SrcdataDTO
                {
                    SourceUrl = srcurl.AbsoluteUri,
                    IsDepricated = false,
                    FileName = System.IO.Path.GetFileName(srcurl.LocalPath),
                    SrcGuId = Guid.NewGuid(),
                };

                // NOTE(review): Details_Html was captured above, so this attribute is not
                // part of the stored HTML - confirm whether that is intended.
                img.SetAttributeValue("guid", srcdata.SrcGuId.ToString());
                contentrevision.SrcDatas.Add(srcdata);
            }

            return;
        }
        catch (ArgumentNullException)
        {
            contentrevision.isDepricate = true;
            return;
        }
        catch (UriFormatException)
        {
            return;
        }
        catch (Exception e)
        {
            if (attempt < maxAttempts)
            {
                Console.WriteLine("ReStart");
            }
            else
            {
                Console.WriteLine("ParseContent gave up after " + maxAttempts + " attempts: " + e);
            }
        }
    }
}
/// <summary>
/// Fetches the content text and HTML: loads the page at
/// <c>contentrevision.Content.Contents_URL</c> through <c>webGetutf</c>, blanks every
/// <c>style</c> element inside the first <c>div[@id = 'body_frame']</c>, copies that
/// element's text and HTML into the revision, and records one <see cref="SrcdataDTO"/>
/// per image selected by <c>./img</c>.
/// </summary>
/// <param name="contentrevision">
/// Revision to populate. On success <c>Details</c>, <c>Details_Html</c>, <c>SrcDatas</c> are
/// set and <c>isDepricate</c> is false. When the content container is missing,
/// <c>isDepricate</c> is set to true and nothing else is written.
/// </param>
/// <remarks>
/// Unexpected failures are retried a bounded number of times; after the last attempt the
/// error is written to the console and the method returns without throwing.
/// </remarks>
protected override void ParseContent(ContentRevisionDTO contentrevision)
{
    // Retries are bounded so that a failure which never clears cannot retry forever.
    const int maxAttempts = 3;

    for (int attempt = 1; attempt <= maxAttempts; attempt++)
    {
        try
        {
            var loadedContent = webGetutf.Load(contentrevision.Content.Contents_URL);

            // SelectNodes yields null when nothing matches; a page without the content
            // container is treated as a deprecated (removed) post.
            var matches = loadedContent.DocumentNode.SelectNodes("//div[@id = 'body_frame']");
            var articlecontent = matches == null ? null : matches.FirstOrDefault();
            if (articlecontent == null)
            {
                contentrevision.isDepricate = true;
                return;
            }

            // Snapshot the style nodes first so the tree is not edited while it is
            // still being walked, then empty them so CSS does not leak into Details.
            var styleNodes = articlecontent.Descendants().Where(node => node.Name == "style").ToList();
            foreach (var styleNode in styleNodes)
            {
                styleNode.InnerHtml = "";
            }

            contentrevision.Details = articlecontent.InnerText.Trim();
            contentrevision.Details_Html = articlecontent.InnerHtml.Trim();
            contentrevision.isDepricate = false;

            // NOTE(review): "./img" matches only direct children of body_frame; nested
            // images are not collected - confirm this is intended (".//img" would match all).
            var imgnodes = articlecontent.SelectNodes("./img");
            contentrevision.SrcDatas = new List<SrcdataDTO>();
            if (imgnodes == null)
            {
                return;
            }

            foreach (var img in imgnodes)
            {
                // Skip images whose src is missing or not an absolute URL instead of
                // abandoning every image that follows.
                Uri srcurl;
                if (!Uri.TryCreate(img.GetAttributeValue("src", "default"), UriKind.Absolute, out srcurl))
                {
                    continue;
                }

                var srcdata = new SrcdataDTO
                {
                    SourceUrl = srcurl.AbsoluteUri,
                    IsDepricated = false,
                    FileName = System.IO.Path.GetFileName(srcurl.LocalPath),
                    SrcGuId = Guid.NewGuid(),
                };

                // NOTE(review): Details_Html was captured above, so this attribute is not
                // part of the stored HTML - confirm whether that is intended.
                img.SetAttributeValue("guid", srcdata.SrcGuId.ToString());
                contentrevision.SrcDatas.Add(srcdata);
            }

            return;
        }
        catch (ArgumentNullException)
        {
            contentrevision.isDepricate = true;
            return;
        }
        catch (UriFormatException)
        {
            return;
        }
        catch (Exception e)
        {
            if (attempt < maxAttempts)
            {
                Console.WriteLine("ReStart");
            }
            else
            {
                Console.WriteLine("ParseContent gave up after " + maxAttempts + " attempts: " + e);
            }
        }
    }
}
/// <summary>
/// Loads the page at <c>contentrevision.Content.Contents_URL</c> through <c>webGetutf</c>,
/// copies the text and HTML of the first <c>div[@id = 'pann-content']</c> element into the
/// revision, and records one <see cref="SrcdataDTO"/> per image found inside that element.
/// </summary>
/// <param name="contentrevision">
/// Revision to populate. On success <c>Details</c>, <c>Details_Html</c>, <c>SrcDatas</c> are
/// set and <c>isDepricate</c> is false. When the content container is missing,
/// <c>isDepricate</c> is set to true and nothing else is written.
/// </param>
/// <remarks>
/// A <see cref="WebException"/> is logged and ends the call without a retry. Other
/// unexpected failures are retried a bounded number of times; after the last attempt the
/// error is written to the console and the method returns without throwing.
/// </remarks>
protected override void ParseContent(ContentRevisionDTO contentrevision)
{
    // Retries are bounded so that a failure which never clears cannot retry forever.
    const int maxAttempts = 3;

    for (int attempt = 1; attempt <= maxAttempts; attempt++)
    {
        try
        {
            var loadedContent = webGetutf.Load(contentrevision.Content.Contents_URL);

            // SelectNodes yields null when nothing matches; a page without the content
            // container is treated as a deprecated (removed) post.
            var matches = loadedContent.DocumentNode.SelectNodes("//div[@id = 'pann-content']");
            var articlecontent = matches == null ? null : matches.FirstOrDefault();
            if (articlecontent == null)
            {
                contentrevision.isDepricate = true;
                return;
            }

            contentrevision.Details = articlecontent.InnerText.Trim();
            contentrevision.Details_Html = articlecontent.InnerHtml.Trim();
            contentrevision.isDepricate = false;

            var imgnodes = articlecontent.SelectNodes(".//img");
            contentrevision.SrcDatas = new List<SrcdataDTO>();
            if (imgnodes == null)
            {
                return;
            }

            foreach (var img in imgnodes)
            {
                // Skip images whose src is missing or not an absolute URL instead of
                // abandoning every image that follows.
                Uri srcurl;
                if (!Uri.TryCreate(img.GetAttributeValue("src", "default"), UriKind.Absolute, out srcurl))
                {
                    continue;
                }

                var srcdata = new SrcdataDTO
                {
                    SourceUrl = srcurl.AbsoluteUri,
                    IsDepricated = false,
                    FileName = System.IO.Path.GetFileName(srcurl.LocalPath),
                    SrcGuId = Guid.NewGuid(),
                };

                // NOTE(review): Details_Html was captured above, so this attribute is not
                // part of the stored HTML - confirm whether that is intended.
                img.SetAttributeValue("guid", srcdata.SrcGuId.ToString());
                contentrevision.SrcDatas.Add(srcdata);
            }

            return;
        }
        catch (ArgumentNullException)
        {
            contentrevision.isDepricate = true;
            return;
        }
        catch (UriFormatException)
        {
            return;
        }
        catch (WebException wex)
        {
            // Response is null when no HTTP response was received (timeout, DNS failure,
            // refused connection), so it must not be dereferenced unconditionally.
            var response = wex.Response as HttpWebResponse;
            if (response != null && response.StatusCode == HttpStatusCode.NotFound)
            {
                // TODO(review): decide how a 404 should be reflected on the revision
                // (e.g. marking it deprecated); currently it is only logged.
                Console.WriteLine("ParseContent: 404 Not Found");
            }
            else
            {
                Console.WriteLine("ParseContent: web request failed (" + wex.Status + ")");
            }

            return;
        }
        catch (Exception e)
        {
            if (attempt < maxAttempts)
            {
                Console.WriteLine("ReStart");
            }
            else
            {
                Console.WriteLine("ParseContent gave up after " + maxAttempts + " attempts: " + e);
            }
        }
    }
}
/// <summary>
/// Loads the page at <c>contentrevision.Content.Contents_URL</c> through <c>webGetkr</c>,
/// copies the text and HTML of its <c>div[@id = 'DocContent']</c> element into the
/// revision, and records one <see cref="SrcdataDTO"/> per image found inside that element.
/// </summary>
/// <param name="contentrevision">
/// Revision to populate. On success <c>Details</c>, <c>Details_Html</c>, <c>SrcDatas</c> are
/// set and <c>isDepricate</c> is false. When the page shows the deleted-post notice or the
/// content container is missing, <c>isDepricate</c> is set to true and nothing else is written.
/// </param>
/// <remarks>
/// Unexpected failures are retried a bounded number of times; after the last attempt the
/// error is written to the console and the method returns without throwing.
/// </remarks>
protected override void ParseContent(ContentRevisionDTO contentrevision)
{
    // Retries are bounded so that a failure which never clears cannot retry forever.
    const int maxAttempts = 3;

    for (int attempt = 1; attempt <= maxAttempts; attempt++)
    {
        try
        {
            var ruiwebContents = webGetkr.Load(contentrevision.Content.Contents_URL);

            // The first td.te2 carries the "already deleted" notice on removed posts.
            var checkifdeprecated = ruiwebContents.DocumentNode.SelectNodes("//td[@class = 'te2']");
            var notice = checkifdeprecated == null ? null : checkifdeprecated.FirstOrDefault();
            if (notice != null && notice.InnerText.Trim() == "이미 삭제 된 게시글 입니다.")
            {
                contentrevision.isDepricate = true;
                return;
            }

            // SelectNodes yields null when nothing matches; a page without the content
            // container is treated as a deprecated (removed) post.
            var matches = ruiwebContents.DocumentNode.SelectNodes("//div[@id = 'DocContent']");
            var content = matches == null ? null : matches.SingleOrDefault();
            if (content == null)
            {
                contentrevision.isDepricate = true;
                return;
            }

            contentrevision.Details = content.InnerText.Trim();
            contentrevision.Details_Html = content.InnerHtml.Trim();
            contentrevision.isDepricate = false;

            var imgnodes = content.SelectNodes(".//img");
            contentrevision.SrcDatas = new List<SrcdataDTO>();
            if (imgnodes == null)
            {
                return;
            }

            foreach (var img in imgnodes)
            {
                // Skip images whose src is missing or not an absolute URL instead of
                // abandoning every image that follows.
                Uri srcurl;
                if (!Uri.TryCreate(img.GetAttributeValue("src", "default"), UriKind.Absolute, out srcurl))
                {
                    continue;
                }

                var srcdata = new SrcdataDTO
                {
                    SourceUrl = srcurl.AbsoluteUri,
                    IsDepricated = false,
                    FileName = System.IO.Path.GetFileName(srcurl.LocalPath),
                    SrcGuId = Guid.NewGuid(),
                };

                // NOTE(review): Details_Html was captured above, so this attribute is not
                // part of the stored HTML - confirm whether that is intended.
                img.SetAttributeValue("guid", srcdata.SrcGuId.ToString());
                contentrevision.SrcDatas.Add(srcdata);
            }

            return;
        }
        catch (ArgumentNullException)
        {
            contentrevision.isDepricate = true;
            return;
        }
        catch (UriFormatException)
        {
            return;
        }
        catch (Exception e)
        {
            if (attempt < maxAttempts)
            {
                Console.WriteLine("ReStart");
            }
            else
            {
                Console.WriteLine("ParseContent gave up after " + maxAttempts + " attempts: " + e);
            }
        }
    }
}