-
Notifications
You must be signed in to change notification settings - Fork 206
Expand file tree
/
Copy pathgemini.rs
More file actions
78 lines (67 loc) · 2.52 KB
/
gemini.rs
File metadata and controls
78 lines (67 loc) · 2.52 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
//! `GEMINI_API_KEY=$MYAPI_KEY cargo run --example gemini --features "spider/sync spider/gemini"`
extern crate spider;
use std::time::Duration;
use spider::configuration::{GeminiConfigs, WaitForIdleNetwork};
use spider::features::chrome_common::RequestInterceptConfiguration;
use spider::hashbrown::{HashMap, HashSet};
use spider::website::Website;
use spider::{tokio, CaseInsensitiveString};
#[tokio::main]
async fn main() {
let _ = tokio::fs::create_dir_all("./storage/").await;
let screenshot_params =
spider::configuration::ScreenshotParams::new(Default::default(), Some(true), Some(false));
let screenshot_config =
spider::configuration::ScreenShotConfig::new(screenshot_params, true, true, None);
let website_url = "https://www.google.com";
let mut gemini_config = GeminiConfigs::default();
let prompt_url_map = HashMap::from([
(
CaseInsensitiveString::new(website_url),
Box::new(GeminiConfigs::new(
"gemini-flash-latest",
"Search for Movies",
500,
)),
),
(
CaseInsensitiveString::new(
&((website_url.to_owned()) + "/search/howsearchworks/?fg=1"),
),
Box::new(GeminiConfigs::new(
"gemini-flash-latest",
"Change the background blue",
500,
)),
),
]);
gemini_config.prompt_url_map = Some(Box::new(prompt_url_map));
let mut website: Website = Website::new(website_url)
.with_chrome_intercept(RequestInterceptConfiguration::new(true))
.with_wait_for_idle_network(Some(WaitForIdleNetwork::new(Some(Duration::from_secs(30)))))
.with_screenshot(Some(screenshot_config))
.with_limit(2)
.with_stealth(true)
.with_fingerprint(true)
.with_gemini(Some(gemini_config))
.build()
.unwrap();
let mut rx2 = website.subscribe(16);
website.set_extra_links(HashSet::from([(website_url.to_owned()
+ "/search/howsearchworks/?fg=1")
.into()]));
tokio::spawn(async move {
while let Ok(page) = rx2.recv().await {
println!("{}\n{}", page.get_url(), page.get_html());
}
});
let start = crate::tokio::time::Instant::now();
website.crawl().await;
let duration = start.elapsed();
let links = website.get_all_links_visited().await;
println!(
"Time elapsed in website.crawl() is: {:?} for total pages: {:?}",
duration,
links.len()
)
}