-
Notifications
You must be signed in to change notification settings - Fork 1
/
Copy pathDataParser.cs
81 lines (65 loc) · 2.2 KB
/
DataParser.cs
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
using System;
using System.Collections.Generic;
using System.Linq;
using System.Net.Http;
using System.Threading.Tasks;
namespace cgamos
{
internal static class DataParser
{
public static async ValueTask<PageData> GetPageData(ArchiveRecord record)
{
var client = new HttpClient();
var urlVariants = UrlMutatuinHelper.GetUrlVariants(record).ToArray();
foreach (var urlVariant in urlVariants)
{
try
{
var body = await client.GetStringAsync(urlVariant);
var pageUrls = GetPageUrls(body);
if (!pageUrls.Any())
{
continue;
}
return new PageData(pageUrls, pageUrls.Count, urlVariant);
}
catch (HttpRequestException)
{
continue;
}
catch (Exception)
{
return null;
}
}
return null;
}
private static IReadOnlyCollection<string> GetPageUrls(string body)
{
var urls = new List<string>();
const string dataSrcToken = "<img data-src=\"";
const string resizeToken = "resize";
var position = 0;
while (position >= 0)
{
//<li class="swiper-slide" data-count="5" style="width: 596px; margin-right: 12px;" role="group" aria-label="6 / 1612">
//<img data-src="/images/MB_LS/01-0203-0745-001743/00000006.jpg">
//</li>
position = body.IndexOf(dataSrcToken, position + dataSrcToken.Length);
if (position == -1)
{
break;
}
var start = position + dataSrcToken.Length;
var end = body.IndexOf("\"", start);
var str = body[start..end];
if (str.Contains(resizeToken))
{
continue;
}
urls.Add(str);
}
return urls;
}
}
}