Exemplo n.º 1
0
        static void Main(string[] args)
        {
            DiningWebpageParser parser = new DiningWebpageParser("http://www.davenport.edu/dining/dining-hall/weeks-menu");
            MenuPdfParser pdfParser = new MenuPdfParser(parser.PdfList);

            foreach (var menu in pdfParser.Menus)
            {
                Console.WriteLine(menu);
            }

            Console.ReadLine();
        }
Exemplo n.º 2
0
        public void UpdateMenus()
        {
            DiningWebpageParser parser = new DiningWebpageParser("http://www.davenport.edu/dining/dining-hall/weeks-menu");
            this.Log().Info("Webpage parser completed, {0} pdfs found", parser.PdfList.Count);

            MenuPdfParser pdfParser = new MenuPdfParser(parser.PdfList);
            this.Log().Info("PDF Parser completed, {0} menus loaded with {1} items", pdfParser.Menus.Count, pdfParser.Menus.Sum(d=>d.AllMeals.Count));

            if (!MenuDbRepository.Current.IsInitialized)
            {
                return;
            }

            foreach (var m in pdfParser.Menus)
            {
                MenuDbRepository.Current.UpsertMenu(m.Date, JsonConvert.SerializeObject(m.DailyMeals));

                using (WebClient client = new WebClient())
                {
                    Directory.CreateDirectory("images");

                    foreach (string srcItem in m.AllMeals.Where(item => !File.Exists(Path.Combine("images", item + ".jpg"))))
                    {
                        if (SkipImages)
                        {
                            this.Log().Info("Skipping image for {0}", srcItem);
                            continue;
                        }

                        Regex rgx = new Regex("[^a-zA-Z0-9 -]", RegexOptions.Compiled);
                        string item = rgx.Replace(srcItem, "");

                        try
                        {
                            int resultCount = 0;
                            List<string> results = SearchResult.FindImageForQuery(item);

                            if (results == null || results.Count == 0)
                            {
                                this.Log().Error("Could not find any results for " + item);
                                continue;
                            }

                            string result = results[resultCount];

                            while (!DownloadImage(item, result))
                            {
                                this.Log().Error("Could not download image for " + item + ", try "+(resultCount + 1));
                                resultCount++;
                                result = results[resultCount];
                            }
                        }
                        catch (WebException)
                        {
                            this.Log().Error("Could not query image for "+item);
                        }

                    }
                }
            }
        }