-
Notifications
You must be signed in to change notification settings - Fork 1k
/
Copy pathBaseUsageSpider.cs
56 lines (50 loc) · 1.58 KB
/
BaseUsageSpider.cs
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
using System.ComponentModel;
using System.Threading;
using System.Threading.Tasks;
using DotnetSpider.DataFlow;
using DotnetSpider.DataFlow.Parser;
using DotnetSpider.Http;
using DotnetSpider.Selector;
using Microsoft.Extensions.Hosting;
using Microsoft.Extensions.Logging;
using Microsoft.Extensions.Options;
using Serilog;
namespace DotnetSpider.Sample.samples;
[DisplayName(displayName: "博客园")]
public class BaseUsageSpider(
IOptions<SpiderOptions> options,
DependenceServices services,
ILogger<Spider> logger)
: Spider(options, services, logger)
{
public static async Task RunAsync()
{
var builder = Builder.CreateDefaultBuilder<BaseUsageSpider>(x =>
{
x.Speed = 5;
});
builder.UseSerilog();
await builder.Build().RunAsync();
}
class MyDataParser : DataParser
{
protected override Task ParseAsync(DataFlowContext context)
{
context.AddData("URL", context.Request.RequestUri);
context.AddData("Title", context.Selectable.XPath(".//title")?.Value);
return Task.CompletedTask;
}
public override Task InitializeAsync()
{
AddRequiredValidator("cnblogs\\.com");
AddFollowRequestQuerier(Selectors.XPath("."));
return Task.CompletedTask;
}
}
protected override async Task InitializeAsync(CancellationToken stoppingToken = default)
{
await AddRequestsAsync(new Request("http://www.cnblogs.com/"));
AddDataFlow<MyDataParser>();
AddDataFlow<ConsoleStorage>();
}
}