Example #1
0
        private void Redownload_Click(object sender, EventArgs e)
        {
            TheNumbersDataContext dc = new TheNumbersDataContext();
            var errors = dc.Errors.DistinctBy(x => x.link);

            foreach (var error in errors)
            {
                dc.ExecuteCommand("TRUNCATE TABLE [dbo].[log]"); // clears the log first.
                SingleMovieLink tempsml = new SingleMovieLink(error.link, error.year);
                dc.Connection.Close();
                tempsml.GetMovie();
                if (dc.Connection.State.Equals(ConnectionState.Closed))
                {
                    dc.Connection.Open();
                }
                if (!dc.IsThereAnyError())
                {
                    var tempdelete = dc.Errors.Where(err => err.link.Equals(error.link));
                    dc.Errors.DeleteAllOnSubmit(tempdelete);
                    dc.SubmitChanges();
                }
            }
        }
Example #2
0
        private void btnDownload_Click(object sender, EventArgs e)
        {
            TheNumbersDataContext dc = new TheNumbersDataContext();

            dc.ExecuteCommand("TRUNCATE TABLE [dbo].[log]"); // clears the log first.

            Helper.WriteToLog(ProgramStatus.Start);
            if (rbAll.Checked)
            {
                // get all years listed
                List <String> years = new List <string>();

                var  yearListPage = new HtmlAgilityPack.HtmlDocument();
                bool downloaded   = false;
                int  count        = 0;
                while (!downloaded)
                {
                    try
                    {
                        yearListPage.LoadHtml(Helper.GetHTML(@"http://www.the-numbers.com/movies/#tab=year"));
                        downloaded = true;
                    }
                    catch
                    {
                        downloaded = false;
                        count++;
                        if (count >= 3)
                        {
                            Helper.WriteToLog(ProgramStatus.Error, "error loading the entire page");
                        }
                        else
                        {
                            Task.Delay(5000); // add sleep for 5 sec to delay the fetch
                        }
                    }
                }
                // download all
                if (downloaded)
                {
                    // get year list.
                    var table = yearListPage.DocumentNode.Descendants("div").Single(
                        o => o.HasAttributes && o.Attributes.Any(p => p.Name.Equals("id")) &&
                        o.Attributes["id"].Value.Equals("year"))
                                .Descendants("table").FirstOrDefault();
                    var trs = table.Descendants("tr").Reverse().ToList();
                    trs.Remove(trs.Last());

                    foreach (var tr in trs)
                    {
                        years.Add(tr.Descendants("td").FirstOrDefault().Descendants("b")
                                  .FirstOrDefault().Descendants("a")
                                  .FirstOrDefault().InnerText.Trim());
                    }

                    foreach (string year in years)
                    {
                        this.GetASingleYear(year);
                    }
                    MessageBox.Show("Whole database successfully stored to DB!");
                }
                MessageBox.Show("All successfully stored to DB!");
            }
            else
            {
                this.GetASingleYear(txtYear.Text);
                MessageBox.Show("Year " + txtYear.Text + " successfully stored to DB!");
            }
            if (dc.Errors.Count() > 0)
            {
                MessageBox.Show("Scrapping completed with error. Please send the entire log from DB to [email protected]");
            }
            Helper.WriteToLog(ProgramStatus.End);
        }