1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
|
use crate::cookies::CookieStore;
use anyhow::Context;
use anyhow::Result;
use reqwest::header::{
    HeaderMap, HeaderValue, ACCEPT, ACCEPT_ENCODING, COOKIE, REFERER, USER_AGENT,
};
use reqwest::Client;
/// Minimal HTTP client wrapper.
///
/// - Cookies are injected into the default `Cookie:` header.
/// - A few "browser-like" headers are pre-set (matching the spirit of the Python script).
///
/// The `Debug` implementation is written by hand so that the cookie string,
/// which carries the session credentials, is never printed.
pub struct HttpClient {
    /// Underlying reqwest client that requests are sent through.
    client: Client,
    /// Kept for tests and internal checks; **do not log** this in production logs.
    cookie_header: String,
}

impl std::fmt::Debug for HttpClient {
    /// Formats the wrapper with the cookie value redacted.
    ///
    /// The inner client is deliberately left out: its own `Debug` output may
    /// include the default headers, and those contain the cookies as well.
    fn fmt(&self, f: &mut std::fmt::Formatter<'_>) -> std::fmt::Result {
        f.debug_struct("HttpClient")
            .field("cookie_header", &"<redacted>")
            .finish_non_exhaustive()
    }
}
impl HttpClient {
    /// Build the default header set sent with every request: fixed
    /// browser-like values plus the caller's cookies.
    ///
    /// `cookie_header` is the bare header *value* (for example `a=1; b=2`),
    /// without the leading `Cookie:` name. A blank value is skipped instead of
    /// being sent as an empty `Cookie:` header.
    ///
    /// # Errors
    ///
    /// Returns an error when `cookie_header` contains bytes that are not legal
    /// in an HTTP header value (for example a newline). The error message never
    /// includes the cookie value itself.
    fn build_default_headers(cookie_header: &str) -> Result<HeaderMap> {
        let mut headers = HeaderMap::new();

        // User-Agent: a modern desktop UA string (no device-specific flags).
        headers.insert(
            USER_AGENT,
            HeaderValue::from_static(
                "Mozilla/5.0 (X11; Linux x86_64) AppleWebKit/537.36 \
                 (KHTML, like Gecko) Chrome/122.0.0.0 Safari/537.36",
            ),
        );

        // Accept: prefer HTML, XML; also allow images and generic types.
        headers.insert(
            ACCEPT,
            HeaderValue::from_static(
                "text/html,application/xhtml+xml,application/xml;q=0.9,image/webp,*/*;q=0.8",
            ),
        );

        // Accept-Encoding: tell the server we can accept gzip/deflate.
        // NOTE(review): reqwest only decodes compressed bodies when the
        // matching Cargo features (`gzip`, `deflate`) are enabled — confirm
        // they are on, otherwise responses arrive still compressed.
        headers.insert(ACCEPT_ENCODING, HeaderValue::from_static("gzip, deflate"));

        // Referer: mirrors the original script's "login entry" intent
        // (safe placeholder for now).
        headers.insert(
            REFERER,
            HeaderValue::from_static("https://learning.oreilly.com/login/unified/?next=/home/"),
        );

        // Cookie: **all authentication lives here** (cookies-only flow).
        // An empty `Cookie:` header is not meaningful, so a blank value is
        // simply not sent.
        if !cookie_header.trim().is_empty() {
            // `HeaderValue::from_str` validates and rejects invalid bytes.
            let mut cookie_value = HeaderValue::from_str(cookie_header)
                .context("cookie header contains bytes that are not valid in an HTTP header value")?;
            // Mark as sensitive so the credentials are redacted in `Debug`
            // output of the header map and anything that embeds it.
            cookie_value.set_sensitive(true);
            headers.insert(COOKIE, cookie_value);
        }

        Ok(headers)
    }

    /// Create an HttpClient from a CookieStore (preferred path).
    ///
    /// The store is rendered to a single header value and passed to
    /// [`HttpClient::new`].
    ///
    /// # Errors
    ///
    /// Fails under the same conditions as [`HttpClient::new`].
    pub fn from_store(store: &CookieStore) -> Result<Self> {
        let cookie_header = store.to_header_value();
        Self::new(&cookie_header)
    }

    /// Create an HttpClient from a pre-rendered cookie header value.
    ///
    /// `cookie_header` is the value only (for example `a=1; b=2`), not the
    /// full `Cookie: ...` line.
    ///
    /// # Errors
    ///
    /// Returns an error when the cookie value is not a valid HTTP header value
    /// or when the underlying reqwest client cannot be built.
    pub fn new(cookie_header: &str) -> Result<Self> {
        let headers = Self::build_default_headers(cookie_header)?;
        let client = Client::builder()
            .default_headers(headers)
            .build()
            .context("failed to build the HTTP client")?;
        Ok(Self {
            client,
            cookie_header: cookie_header.to_string(),
        })
    }

    /// Access the underlying reqwest client (read-only).
    pub fn client(&self) -> &Client {
        &self.client
    }

    /// Expose the cookie header for tests/diagnostics (do **not** log this in production).
    pub fn cookie_header(&self) -> &str {
        &self.cookie_header
    }
}
#[cfg(test)]
mod tests {
    use super::*;
    use crate::cookies::CookieStore;
    use serde_json::json;

    /// Parse `cookies_json` into a store, build a client from it, and return
    /// the cookie header the client kept.
    fn rendered_cookie_header(cookies_json: serde_json::Value) -> String {
        let store = CookieStore::from_value(cookies_json).unwrap();
        let http = HttpClient::from_store(&store).unwrap();
        http.cookie_header().to_owned()
    }

    #[test]
    fn builds_client_with_cookie_header_from_map() {
        let rendered = rendered_cookie_header(json!({ "sess": "abc", "OptanonConsent": "xyz" }));
        // The header is expected in a deterministic order (sorted by name).
        // Checking the stored value is enough here; reqwest's internal header
        // map is not inspected.
        assert_eq!(rendered, "OptanonConsent=xyz; sess=abc");
    }

    #[test]
    fn builds_client_with_cookie_header_from_list() {
        let rendered = rendered_cookie_header(json!([
            {"name": "a", "value": "1"},
            {"name": "b", "value": "2"}
        ]));
        assert_eq!(rendered, "a=1; b=2");
    }
}
|