static int CompareDeleteLogEvents(DeleteLogEvent x, DeleteLogEvent y) { return y.Timestamp.CompareTo(x.Timestamp); }
public void Run(Wiki wiki) { Directory.CreateDirectory(_cacheDir); Console.Out.WriteLine("Updating " + _page); Regex wikiLinkRE = new Regex(@"\[{2}(.+?)(\|.+?)?]{2}"); Regex timeRE = new Regex(@"(\d{2}:\d{2}\, \d\d? [а-я]+ \d{4}) \(UTC\)"); ParameterCollection parameters = new ParameterCollection(); parameters.Add("prop", "info|revisions"); parameters.Add("intoken", "edit"); XmlDocument doc = wiki.Query(QueryBy.Titles, parameters, _page); XmlNode page = doc.SelectSingleNode("//page"); string queryTimestamp = DateTime.Now.ToUniversalTime().ToString("yyyy-MM-ddTHH:mm:ssZ"); string pageName = page.Attributes["title"].Value; string basetimestamp = page.FirstChild.FirstChild.Attributes["timestamp"].Value; string editToken = page.Attributes["edittoken"].Value; string starttimestamp = queryTimestamp; string text = ""; string fileName = _cacheDir + WikiCache.EscapePath(_page); if (File.Exists(fileName)) { using (FileStream fs = new FileStream(fileName, FileMode.Open)) using (GZipStream gs = new GZipStream(fs, CompressionMode.Decompress)) using (TextReader sr = new StreamReader(gs)) { string revid = sr.ReadLine(); if (revid == page.Attributes["lastrevid"].Value) { Console.Out.WriteLine("Loading " + pageName + "..."); text = sr.ReadToEnd(); } } } if (string.IsNullOrEmpty(text)) { Console.Out.WriteLine("Downloading " + pageName + "..."); text = wiki.LoadText(pageName); starttimestamp = DateTime.Now.ToUniversalTime().ToString("yyyy-MM-ddTHH:mm:ssZ"); using (FileStream fs = new FileStream(fileName, FileMode.Create)) using (GZipStream gs = new GZipStream(fs, CompressionMode.Compress)) using (StreamWriter sw = new StreamWriter(gs)) { sw.WriteLine(page.Attributes["lastrevid"].Value); sw.Write(text); } } Dictionary<string, List<WikiPageSection>> titles = new Dictionary<string, List<WikiPageSection>>(); WikiPage wikiPage = WikiPage.Parse(pageName, text); foreach (WikiPageSection section in wikiPage.Sections) { if (section.Subsections.Count(s => s.Title.ToLower(CultureInfo.CreateSpecificCulture("ru-RU")).Trim() == "итог") == 0) { Match m = wikiLinkRE.Match(section.Title); if (m.Success) { string title = m.Groups[1].Value.Trim(); if (titles.ContainsKey(title)) { titles[title].Add(section); } else { titles.Add(title, new List<WikiPageSection>()); titles[title].Add(section); } } } } parameters.Clear(); parameters.Add("prop", "info"); Dictionary<string, string> normalizedTitles = new Dictionary<string, string>(); XmlDocument xml = wiki.Query(QueryBy.Titles, parameters, titles.Keys); foreach (XmlNode node in xml.SelectNodes("//n")) { normalizedTitles.Add(node.Attributes["to"].Value, node.Attributes["from"].Value); } List<string> notificationList = new List<string>(); XmlNodeList missingTitles = xml.SelectNodes("//page"); foreach (XmlNode node in missingTitles) { string title = node.Attributes["title"].Value; IEnumerable<WikiPageSection> sections; if (titles.ContainsKey(title)) { sections = titles[title]; } else { sections = titles[normalizedTitles[title]]; } if (node.Attributes["missing"] != null) { parameters.Clear(); parameters.Add("list", "logevents"); parameters.Add("letype", "delete"); parameters.Add("lemlimit", "max"); parameters.Add("ledir", "newer"); parameters.Add("letitle", title); parameters.Add("leprop", "comment|type|user|timestamp"); XmlDocument log = wiki.Enumerate(parameters, true); XmlNodeList items = log.SelectNodes("//item"); List<DeleteLogEvent> events = new List<DeleteLogEvent>(); foreach (XmlNode item in items) { DeleteLogEvent ev = new DeleteLogEvent(); ev.Comment = item.Attributes["comment"].Value; ev.Deleted = item.Attributes["action"].Value == "delete"; ev.User = item.Attributes["user"].Value; ev.Timestamp = DateTime.Parse(item.Attributes["timestamp"].Value, null, DateTimeStyles.AssumeUniversal); events.Add(ev); } events.Sort(CompareDeleteLogEvents); if (events.Count > 0 && events[0].Deleted) { string comment = FilterWikiMarkup(events[0].Comment); string message = string.Format("Страница была удалена {1} администратором [[User:{0}|]]. Была указана следующая причина: «{2}». Данное сообщение было автоматически сгенерировано ботом ~~~~.\n", events[0].User, events[0].Timestamp.ToUniversalTime().ToString("d MMMM yyyy в HH:mm (UTC)", CultureInfo.CreateSpecificCulture("ru-RU")), comment); var pageSections = titles.ContainsKey(title) ? titles[title] : titles[normalizedTitles[title]]; foreach (WikiPageSection section in pageSections) { WikiPageSection verdict = new WikiPageSection(" Итог ", section.Level + 1, message); section.AddSubsection(verdict); } } } } string newText = wikiPage.Text; if (newText.Trim() == text.Trim()) { return; } Console.Out.WriteLine("Updating " + pageName + "..."); string id = wiki.Save(pageName, "", newText, "автоматическое подведение итогов", MinorFlags.Minor, CreateFlags.NoCreate, WatchFlags.None, SaveFlags.Replace, true, basetimestamp, "", editToken); using (FileStream fs = new FileStream(fileName, FileMode.Create)) using (GZipStream gs = new GZipStream(fs, CompressionMode.Compress)) using (StreamWriter sw = new StreamWriter(gs)) { sw.WriteLine(id); sw.Write(newText); } }
public void UpdatePages(Wiki wiki) { Console.Out.WriteLine("Updating articles for deletion..."); Regex wikiLinkRE = new Regex(@"\[{2}(.+?)(\|.+?)?]{2}"); Regex timeRE = new Regex(@"(\d{2}:\d{2}\, \d\d? [а-я]+ \d{4}) \(UTC\)"); ParameterCollection parameters = new ParameterCollection(); parameters.Add("generator", "categorymembers"); parameters.Add("gcmtitle", _l10i.Category); parameters.Add("gcmlimit", "max"); parameters.Add("gcmnamespace", "4"); parameters.Add("prop", "info|revisions"); parameters.Add("intoken", "edit"); XmlDocument doc = wiki.Enumerate(parameters, true); string queryTimestamp = DateTime.Now.ToUniversalTime().ToString("yyyy-MM-ddTHH:mm:ssZ"); XmlNodeList pages = doc.SelectNodes("//page"); foreach (XmlNode page in pages) { string starttimestamp = queryTimestamp; int results = 0; string prefix = _l10i.MainPage + "/"; string pageName = page.Attributes["title"].Value; string basetimestamp = page.FirstChild.FirstChild.Attributes["timestamp"].Value; string editToken = page.Attributes["edittoken"].Value; if (pageName.Length < prefix.Length) { continue; } string date = pageName.Substring(prefix.Length); Day day = new Day(); if (!DateTime.TryParse(date, CultureInfo.CreateSpecificCulture(_l10i.Culture), DateTimeStyles.AssumeUniversal, out day.Date)) { continue; } string text = ""; string fileName = _cacheDir + date + ".bin"; if (File.Exists(fileName)) { using (FileStream fs = new FileStream(fileName, FileMode.Open)) using (GZipStream gs = new GZipStream(fs, CompressionMode.Decompress)) using (TextReader sr = new StreamReader(gs)) { string revid = sr.ReadLine(); if (revid == page.Attributes["lastrevid"].Value) { Console.Out.WriteLine("Loading " + pageName + "..."); text = sr.ReadToEnd(); } } } if (string.IsNullOrEmpty(text)) { try { Console.Out.WriteLine("Downloading " + pageName + "..."); text = wiki.LoadText(pageName); starttimestamp = DateTime.Now.ToUniversalTime().ToString("yyyy-MM-ddTHH:mm:ssZ"); } catch (WikiPageNotFound) { continue; } using (FileStream fs = new FileStream(fileName, FileMode.Create)) using (GZipStream gs = new GZipStream(fs, CompressionMode.Compress)) using (StreamWriter sw = new StreamWriter(gs)) { sw.WriteLine(page.Attributes["lastrevid"].Value); sw.Write(text); } } List<string> titlesWithResults = new List<string>(); Dictionary<string, List<WikiPageSection>> titles = new Dictionary<string, List<WikiPageSection>>(); day.Page = WikiPage.Parse(pageName, text); foreach (WikiPageSection section in day.Page.Sections) { ReplaceEmptyResults(section); RemoveStrikeOut(section); StrikeOutSection(section); if (section.Subsections.Count(s => _l10i.Processor != null ? _l10i.Results.Any(r => r == _l10i.Processor(s).Trim()) : _l10i.Results.Any(r => r == s.Title.Trim())) == 0 && section.Subsections.Count(s => s.Title.Trim() == _l10i.ChallengedResult) == 0) { Match m = wikiLinkRE.Match(section.Title); if (m.Success) { string title = m.Groups[1].Value.Trim(); if (titles.ContainsKey(title)) { titles[title].Add(section); } else { titles.Add(title, new List<WikiPageSection>()); titles[title].Add(section); } } } { Match m = wikiLinkRE.Match(section.Title); if (m.Success && section.Title.Contains("<s>")) { titlesWithResults.Add(m.Groups[1].Value.Trim()); } List<WikiPageSection> sections = new List<WikiPageSection>(); section.Reduce(sections, SubsectionsList); foreach (WikiPageSection subsection in sections) { m = wikiLinkRE.Match(subsection.Title); if (m.Success && subsection.Title.Contains("<s>")) { titlesWithResults.Add(m.Groups[1].Value.Trim()); } if (m.Success && !subsection.Title.Contains("<s>") && subsection.Subsections.Count(s => s.Title.Trim() == _l10i.ChallengedResult) == 0 && subsection.Subsections.Count(s => _l10i.Processor != null ? _l10i.Results.Any(r => r == _l10i.Processor(s).Trim()) : _l10i.Results.Any(r => r == s.Title.Trim())) == 0) { string title = m.Groups[1].Value.Trim(); if (titles.ContainsKey(title)) { titles[title].Add(subsection); } else { titles.Add(title, new List<WikiPageSection>()); titles[title].Add(subsection); } } } } } parameters.Clear(); parameters.Add("prop", "info"); Dictionary<string, string> normalizedTitles = new Dictionary<string, string>(); XmlDocument xml = wiki.Query(QueryBy.Titles, parameters, titles.Keys); foreach (XmlNode node in xml.SelectNodes("//n")) { normalizedTitles.Add(node.Attributes["to"].Value, node.Attributes["from"].Value); } List<string> notificationList = new List<string>(); XmlNodeList missingTitles = xml.SelectNodes("//page"); foreach (XmlNode node in missingTitles) { string title = node.Attributes["title"].Value; IEnumerable<WikiPageSection> sections; if (titles.ContainsKey(title)) { sections = titles[title]; } else { sections = titles[normalizedTitles[title]]; } if (node.Attributes["missing"] != null) { DateTime start = day.Date; //foreach (WikiPageSection section in sections) //{ // Match m = timeRE.Match(section.Text); // if (m.Success) // { // start = DateTime.Parse(m.Groups[1].Value, // CultureInfo.CreateSpecificCulture(_l10i.Culture), // DateTimeStyles.AssumeUniversal); // } //} parameters.Clear(); parameters.Add("list", "logevents"); parameters.Add("letype", "delete"); parameters.Add("lemlimit", "max"); parameters.Add("lestart", start.ToUniversalTime().ToString("yyyy-MM-ddTHH:mm:ssZ")); parameters.Add("ledir", "newer"); parameters.Add("letitle", title); parameters.Add("leprop", "comment|type|user|timestamp"); XmlDocument log = wiki.Enumerate(parameters, true); XmlNodeList items = log.SelectNodes("//item"); List<DeleteLogEvent> events = new List<DeleteLogEvent>(); foreach (XmlNode item in items) { DeleteLogEvent ev = new DeleteLogEvent(); ev.Comment = item.Attributes["comment"].Value; ev.Deleted = item.Attributes["action"].Value == "delete"; ev.User = item.Attributes["user"].Value; ev.Timestamp = DateTime.Parse(item.Attributes["timestamp"].Value, null, DateTimeStyles.AssumeUniversal); events.Add(ev); } events.Sort(CompareDeleteLogEvents); if (events.Count > 0 && events[0].Deleted && (DateTime.Now - events[0].Timestamp).TotalHours > 2) { string comment = FilterWikiMarkup(events[0].Comment); string message = string.Format(_l10i.AutoResultMessage, events[0].User, events[0].Timestamp.ToUniversalTime().ToString(_l10i.DateFormat, CultureInfo.CreateSpecificCulture(_l10i.Culture)), comment); var pageSections = titles.ContainsKey(title) ? titles[title] : titles[normalizedTitles[title]]; foreach (WikiPageSection section in pageSections) { WikiPageSection verdict = new WikiPageSection(" " + _l10i.AutoResultSection + " ", section.Level + 1, message); section.AddSubsection(verdict); StrikeOutSection(section); ++results; } } } } if (_l10i.Culture != "ru-RU") { parameters.Clear(); parameters.Add("prop", "info"); xml = wiki.Query(QueryBy.Titles, parameters, titlesWithResults); foreach (XmlNode node in xml.SelectNodes("//page")) { if (node.Attributes["missing"] == null && node.Attributes["redirect"] == null && node.Attributes["ns"].Value == "0") { notificationList.Add(node.Attributes["title"].Value); } } if (notificationList.Count > 0) { parameters.Clear(); parameters.Add("list", "backlinks"); parameters.Add("bltitle", pageName); parameters.Add("blfilterredir", "nonredirects"); parameters.Add("blnamespace", "1"); parameters.Add("bllimit", "max"); XmlDocument backlinks = wiki.Enumerate(parameters, true); foreach (string title in notificationList) { string talkPage = wiki.GetNamespace(1) + ":" + title; if (backlinks.SelectSingleNode("//bl[@title=" + GenerateConcatForXPath(talkPage) + "]") == null) { PutNotification(wiki, title, date); } } } } string newText = day.Page.Text; if (newText.Trim() == text.Trim()) { continue; } try { Console.Out.WriteLine("Updating " + pageName + "..."); string revid = wiki.Save(pageName, "", newText, _l10i.StrikeOutComment + (results > 0 ? _l10i.AutoResultComment : ""), MinorFlags.Minor, CreateFlags.NoCreate, WatchFlags.None, SaveFlags.Replace, true, basetimestamp, "", editToken); using (FileStream fs = new FileStream(fileName, FileMode.Create)) using (GZipStream gs = new GZipStream(fs, CompressionMode.Compress)) using (StreamWriter sw = new StreamWriter(gs)) { sw.WriteLine(revid); sw.Write(newText); } } catch (WikiException) { } } }
internal void UpdatePages(Wiki wiki) { ParameterCollection parameters = new ParameterCollection(); parameters.Add("generator", "categorymembers"); parameters.Add("gcmtitle", "Категория:Википедия:Незакрытые обсуждения восстановления страниц"); parameters.Add("gcmlimit", "max"); parameters.Add("gcmnamespace", "4"); parameters.Add("prop", "info|revisions"); parameters.Add("intoken", "edit"); XmlDocument doc = wiki.Enumerate(parameters, true); string queryTimestamp = DateTime.Now.ToUniversalTime().ToString("yyyy-MM-ddTHH:mm:ssZ"); XmlNodeList pages = doc.SelectNodes("//page"); foreach (XmlNode page in pages) { string starttimestamp = queryTimestamp; int results = 0; string prefix = "Википедия:К восстановлению/"; string pageName = page.Attributes["title"].Value; string basetimestamp = page.FirstChild.FirstChild.Attributes["timestamp"].Value; string editToken = page.Attributes["edittoken"].Value; string date = pageName.Substring(prefix.Length); Day day = new Day(); if (!DateTime.TryParse(date, CultureInfo.CreateSpecificCulture("ru-RU"), DateTimeStyles.AssumeUniversal, out day.Date)) { continue; } string text = ""; string fileName = _cacheDir + date + ".bin"; if (File.Exists(fileName)) { using (FileStream fs = new FileStream(fileName, FileMode.Open)) using (GZipStream gs = new GZipStream(fs, CompressionMode.Decompress)) using (TextReader sr = new StreamReader(gs)) { string revid = sr.ReadLine(); if (revid == page.Attributes["lastrevid"].Value) { Console.Out.WriteLine("Loading " + pageName + "..."); text = sr.ReadToEnd(); } } } if (string.IsNullOrEmpty(text)) { try { Console.Out.WriteLine("Downloading " + pageName + "..."); text = wiki.LoadText(pageName); starttimestamp = DateTime.Now.ToUniversalTime().ToString("yyyy-MM-ddTHH:mm:ssZ"); } catch (WikiPageNotFound) { continue; } using (FileStream fs = new FileStream(fileName, FileMode.Create)) using (GZipStream gs = new GZipStream(fs, CompressionMode.Compress)) using (StreamWriter sw = new StreamWriter(gs)) { sw.WriteLine(page.Attributes["lastrevid"].Value); sw.Write(text); } } Dictionary<string, List<WikiPageSection>> titles = new Dictionary<string, List<WikiPageSection>>(); day.Page = WikiPage.Parse(pageName, text); foreach (WikiPageSection section in day.Page.Sections) { RemoveStrikeOut(section); StrikeOutSection(section); if (section.Subsections.Count(s => _results.Any(r => r.ToLower() == s.Title.Trim().ToLower())) == 0) { Match m = _wikiLinkRE.Match(section.Title); if (m.Success) { string title = m.Groups[1].Value.Trim(); if (titles.ContainsKey(title)) { titles[title].Add(section); } else { titles.Add(title, new List<WikiPageSection>()); titles[title].Add(section); } } } { List<WikiPageSection> sections = new List<WikiPageSection>(); section.Reduce(sections, SubsectionsList); foreach (WikiPageSection subsection in sections) { Match m = _wikiLinkRE.Match(subsection.Title); if (m.Success && !subsection.Title.Contains("<s>") && subsection.Subsections.Count(s => _results.Any(r => r.ToLower() == s.Title.Trim().ToLower())) == 0) { string title = m.Groups[1].Value.Trim(); if (titles.ContainsKey(title)) { titles[title].Add(subsection); } else { titles.Add(title, new List<WikiPageSection>()); titles[title].Add(subsection); } } } } } parameters.Clear(); parameters.Add("prop", "info"); Dictionary<string, string> normalizedTitles = new Dictionary<string, string>(); XmlDocument xml = wiki.Query(QueryBy.Titles, parameters, titles.Keys); foreach (XmlNode node in xml.SelectNodes("//n")) { normalizedTitles.Add(node.Attributes["to"].Value, node.Attributes["from"].Value); } List<string> notificationList = new List<string>(); XmlNodeList missingTitles = xml.SelectNodes("//page"); foreach (XmlNode node in missingTitles) { string title = node.Attributes["title"].Value; IEnumerable<WikiPageSection> sections; if (titles.ContainsKey(title)) { sections = titles[title]; } else { sections = titles[normalizedTitles[title]]; } if (node.Attributes["missing"] == null) { DateTime start = day.Date; parameters.Clear(); parameters.Add("list", "logevents"); parameters.Add("letype", "delete"); parameters.Add("lemlimit", "max"); parameters.Add("lestart", start.ToUniversalTime().ToString("yyyy-MM-ddTHH:mm:ssZ")); parameters.Add("ledir", "newer"); parameters.Add("letitle", title); parameters.Add("leprop", "comment|type|user|timestamp"); XmlDocument log = wiki.Enumerate(parameters, true); XmlNodeList items = log.SelectNodes("//item"); List<DeleteLogEvent> events = new List<DeleteLogEvent>(); foreach (XmlNode item in items) { DeleteLogEvent ev = new DeleteLogEvent(); ev.Comment = item.Attributes["comment"].Value; ev.Restored = item.Attributes["action"].Value == "restore"; ev.Deleted = item.Attributes["action"].Value == "delete"; ev.User = item.Attributes["user"].Value; ev.Timestamp = DateTime.Parse(item.Attributes["timestamp"].Value, null, DateTimeStyles.AssumeUniversal); events.Add(ev); } events.Sort(CompareDeleteLogEvents); if (events.Count > 0 && events[0].Restored && (DateTime.Now - events[0].Timestamp).TotalHours > 2) { Regex commentRE = new Regex(@" восстановлено: (.+)"); Match m = commentRE.Match(events[0].Comment); string comment; if (m.Success) { comment = m.Groups[1].Value; } else { comment = "<nowiki>" + events[0].Comment + "</nowiki>"; } string message = string.Format("Страница была восстановлена {1} администратором [[User:{0}|]]. Была указана следующая причина: «{2}». Данное сообщение было автоматически сгенерировано ботом ~~~~.\n", events[0].User, events[0].Timestamp.ToUniversalTime().ToString("d MMMM yyyy в HH:mm (UTC)"), comment); if (!titles.ContainsKey(title)) { continue; } foreach (WikiPageSection section in titles[title]) { WikiPageSection verdict = new WikiPageSection(" Автоматический итог ", section.Level + 1, message); section.AddSubsection(verdict); StrikeOutSection(section); ++results; } } else if (events.Count > 0 && events[0].Deleted) { parameters.Clear(); parameters.Add("prop", "revisions"); parameters.Add("rvprop", "timestamp|user"); parameters.Add("rvdir", "newer"); parameters.Add("rvlimit", "1"); parameters.Add("redirects"); log = wiki.Query(QueryBy.Titles, parameters, new string[] { title }); XmlNode revision = log.SelectSingleNode("//rev"); if (revision != null) { string user = revision.Attributes["user"].Value; string timestamp = revision.Attributes["timestamp"].Value; DateTime time = DateTime.Parse(timestamp, null, DateTimeStyles.AssumeUniversal); string message = string.Format("Страница была создана заново {1} участником [[User:{0}|]]. Данное сообщение было автоматически сгенерировано ботом ~~~~.\n", user, time.ToUniversalTime().ToString("d MMMM yyyy в HH:mm (UTC)")); if (!titles.ContainsKey(title)) { continue; } foreach (WikiPageSection section in titles[title]) { WikiPageSection verdict = new WikiPageSection(" Автоматический итог ", section.Level + 1, message); section.AddSubsection(verdict); StrikeOutSection(section); ++results; } } } } } string newText = day.Page.Text; if (newText.Trim() == text.Trim()) { continue; } try { Console.Out.WriteLine("Updating " + pageName + "..."); string revid = wiki.Save(pageName, "", newText, "зачёркивание заголовков" + (results > 0 ? " и подведение итогов" : ""), MinorFlags.Minor, CreateFlags.NoCreate, WatchFlags.None, SaveFlags.Replace, true, basetimestamp, "", editToken); using (FileStream fs = new FileStream(fileName, FileMode.Create)) using (GZipStream gs = new GZipStream(fs, CompressionMode.Compress)) using (StreamWriter sw = new StreamWriter(gs)) { sw.WriteLine(revid); sw.Write(newText); } } catch (WikiException) { } } }