From 3573f6ff5ada02b72b536e23aad3b178a12b8620 Mon Sep 17 00:00:00 2001
From: ErrorNoInternet
Date: Sun, 20 Oct 2024 00:16:21 -0400
Subject: [PATCH] feat(cli): add page argument to start scraping from a specific page

The page number given on the command line is 1-based, while the scraping
loop index is 0-based. Convert with saturating_sub so that `--page 0`
starts at the first page instead of underflowing usize (a panic in debug
builds, a wrapped index in release builds).

Also switch `jobs` to `default_value_t` so both numeric defaults are
written as typed literals.

---
 src/args/mod.rs | 6 +++++-
 src/main.rs     | 3 ++-
 2 files changed, 7 insertions(+), 2 deletions(-)

diff --git a/src/args/mod.rs b/src/args/mod.rs
index 1056a42..2d1ca97 100644
--- a/src/args/mod.rs
+++ b/src/args/mod.rs
@@ -14,8 +14,12 @@ pub struct Args {
     #[arg(short, long)]
     pub tags: Option<Vec<String>>,
 
+    /// Page to start scraping from
+    #[arg(short, long, default_value_t = 1)]
+    pub page: usize,
+
     /// Async jobs to use for fetching
-    #[arg(short, long, default_value = "4")]
+    #[arg(short, long, default_value_t = 4)]
     pub jobs: usize,
 
     /// Delay for rate-limits (ms)
diff --git a/src/main.rs b/src/main.rs
index c00734c..133dcab 100644
--- a/src/main.rs
+++ b/src/main.rs
@@ -39,7 +39,8 @@ async fn main() -> ExitCode {
         .build()
         .unwrap();
 
-    for page in 0.. {
+    // --page is 1-based, the loop index is 0-based; saturate so 0 cannot underflow.
+    for page in args.page.saturating_sub(1).. {
         println!("now scraping page {}", page + 1);
         println!(
             "https://rule34.xxx/index.php?page=post&s=list&tags={uri_tags}&pid={}",