forked from kc3hack/2024_H
-
Notifications
You must be signed in to change notification settings - Fork 0
Commit
This commit does not belong to any branch on this repository, and may belong to a fork outside of the repository.
Browse files
Browse the repository at this point in the history
#19 スクレイピング用クライアントを作成
- Loading branch information
Showing
5 changed files
with
149 additions
and
3 deletions.
There are no files selected for viewing
18 changes: 18 additions & 0 deletions
18
Epub/KoeBook.Epub/Contracts/Services/IScrapingClientService.cs
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,18 @@ | ||
using System.Net.Http.Headers; | ||
|
||
namespace KoeBook.Epub.Contracts.Services; | ||
|
||
public interface IScrapingClientService | ||
{ | ||
/// <summary> | ||
/// スクレイピングでGETする用 | ||
/// APIを叩く際は不要 | ||
/// </summary> | ||
Task<string> GetAsStringAsync(string url, CancellationToken ct); | ||
|
||
/// <summary> | ||
/// スクレイピングでGETする用 | ||
/// APIを叩く際は不要 | ||
/// </summary> | ||
Task<ContentDispositionHeaderValue?> GetAsStreamAsync(string url, Stream destination, CancellationToken ct); | ||
} |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,116 @@ | ||
using System.Net.Http.Headers; | ||
using KoeBook.Epub.Contracts.Services; | ||
|
||
namespace KoeBook.Epub.Services; | ||
|
||
public sealed class ScrapingClientService : IScrapingClientService, IDisposable | ||
{ | ||
private readonly IHttpClientFactory _httpClientFactory; | ||
private readonly PeriodicTimer _periodicTimer; | ||
private readonly Queue<Func<HttpClient, Task>> _actionQueue = []; | ||
private bool _workerActivated; | ||
|
||
public ScrapingClientService(IHttpClientFactory httpClientFactory, TimeProvider timeProvider) | ||
{ | ||
_httpClientFactory = httpClientFactory; | ||
_periodicTimer = new(TimeSpan.FromSeconds(10), timeProvider); | ||
} | ||
|
||
public Task<string> GetAsStringAsync(string url, CancellationToken ct) | ||
{ | ||
var taskCompletion = new TaskCompletionSource<string>(); | ||
|
||
lock (_actionQueue) | ||
_actionQueue.Enqueue(async httpClient => | ||
{ | ||
if (ct.IsCancellationRequested) | ||
taskCompletion.SetCanceled(ct); | ||
try | ||
{ | ||
var response = await httpClient.GetAsync(url, ct).ConfigureAwait(false); | ||
taskCompletion.SetResult(await response.Content.ReadAsStringAsync(ct).ConfigureAwait(false)); | ||
} | ||
catch (Exception ex) | ||
{ | ||
taskCompletion.SetException(ex); | ||
} | ||
}); | ||
|
||
EnsureWorkerActivated(); | ||
|
||
return taskCompletion.Task; | ||
} | ||
|
||
public Task<ContentDispositionHeaderValue?> GetAsStreamAsync(string url, Stream destination, CancellationToken ct) | ||
{ | ||
var taskCompletion = new TaskCompletionSource<ContentDispositionHeaderValue?>(); | ||
|
||
lock (_actionQueue) | ||
_actionQueue.Enqueue(async httpClient => | ||
{ | ||
if (ct.IsCancellationRequested) | ||
taskCompletion.SetCanceled(ct); | ||
try | ||
{ | ||
var response = await httpClient.GetAsync(url, ct).ConfigureAwait(false); | ||
await response.Content.CopyToAsync(destination, ct).ConfigureAwait(false); | ||
taskCompletion.SetResult(response.Content.Headers.ContentDisposition); | ||
} | ||
catch (Exception ex) | ||
{ | ||
taskCompletion.SetException(ex); | ||
} | ||
}); | ||
|
||
EnsureWorkerActivated(); | ||
|
||
return taskCompletion.Task; | ||
} | ||
|
||
/// <summary> | ||
/// <see cref="Worker"/>が起動していない場合は起動します | ||
/// </summary> | ||
private void EnsureWorkerActivated() | ||
{ | ||
bool activateWorker; | ||
lock (_actionQueue) activateWorker = !_workerActivated; | ||
|
||
if (activateWorker) | ||
Worker(); | ||
} | ||
|
||
/// <summary> | ||
/// <see cref="_actionQueue"/>のConsumer | ||
/// 別スレッドでループさせるためにvoid | ||
/// </summary> | ||
private async void Worker() | ||
{ | ||
lock (_actionQueue) | ||
_workerActivated = true; | ||
|
||
try | ||
{ | ||
while (await _periodicTimer.WaitForNextTickAsync().ConfigureAwait(false) && _actionQueue.Count > 0) | ||
{ | ||
Func<HttpClient, Task>? action; | ||
lock (_actionQueue) | ||
if (!_actionQueue.TryDequeue(out action)) | ||
continue; | ||
|
||
await action(_httpClientFactory.CreateClient()).ConfigureAwait(ConfigureAwaitOptions.SuppressThrowing); | ||
} | ||
} | ||
finally | ||
{ | ||
lock (_actionQueue) | ||
_workerActivated = false; | ||
} | ||
} | ||
|
||
public void Dispose() | ||
{ | ||
_periodicTimer.Dispose(); | ||
} | ||
} |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters