-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathUpdateDb.cs
94 lines (71 loc) · 2.91 KB
/
UpdateDb.cs
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
using System;
using System.Collections.Generic;
using System.IO;
using System.Linq;
using System.Net;
using System.Text;
using HtmlAgilityPack;
namespace randombg_dotnet{
public static class UpdateDb{
public static void Run(Database db){
List<ImageRecord> recs = GetWebBasedRecords();
db.InsertNewRecords("images", recs.Cast<IDbRecord>());
db.Save();
}
private static List<ImageRecord> GetWebBasedRecords(){
List<ImageRecord> result = new List<ImageRecord>();
foreach(string cat in Globals.SourceImageCategories)
result.AddRange(GetCategoryImageRecords(cat));
return result;
}
private static IEnumerable<ImageRecord> GetCategoryImageRecords(string cat){
LinkedList<ImageRecord> result = new LinkedList<ImageRecord>();
Console.WriteLine($"Fetching {cat}...");
int pagenum = 1;
bool keepGoing = true;
do{
try{
string pageUrl = GetPageUrl(cat, pagenum);
IEnumerable<string> imgPaths = GetPageImagePaths(pageUrl);
foreach(string path in imgPaths)
result.AddLast(CreateImageRecord(cat, path));
pagenum++;
} catch (Exception ex){
keepGoing = false;
}
}while(keepGoing);
return result;
}
private static string GetPageUrl(string cat, int pagenum)
{
string result =
$"{Globals.WEB_SOURCE_BASE_URL}/wallcat/{cat}/?";
result = (pagenum > 1) ?
result.Replace("?", $"index{pagenum}.html"):
result.Replace("?", "index.html");
return result;
}
private static IEnumerable<string> GetPageImagePaths(string url){
LinkedList<string> result = new LinkedList<string>();
var web = new HtmlWeb();
var body = web.Load(url).DocumentNode.SelectSingleNode("//body");
var imgnodes = body.SelectNodes("//div/table/tr/td/table/tr/td/a");
foreach(var node in imgnodes){
var img = node.Elements("img").FirstOrDefault();
if (img != null){
var tmbPath = img.Attributes["src"].Value;
var imgPath = tmbPath
.Replace("tmb/","img/")
.Replace("/tmb","/img");
result.AddLast(imgPath);
}
}
return result;
}
private static ImageRecord CreateImageRecord(string cat, string path){
string fullUrl = $"{Globals.WEB_SOURCE_BASE_URL}{path}";
string imgName = path.Substring(path.IndexOf('_') + 1);
return new ImageRecord(false, imgName, fullUrl);
}
}
}