Source code

Revision control

Copy as Markdown

Other Tools

/* This Source Code Form is subject to the terms of the Mozilla Public
* License, v. 2.0. If a copy of the MPL was not distributed with this
* file, You can obtain one at https://mozilla.org/MPL/2.0/. */
//! Interface to HTTP requests/responses which will transparently use various backends to send the
//! data.
//!
//! This is far from a general implementation, instead implementing the sort of requests that we
//! need.
use crate::std::{fs::File, path::Path, process::Child};
use anyhow::Context;
use std::io::Read;
#[cfg(mock)]
use crate::std::mock::{mock_key, MockKey};
#[cfg(mock)]
mock_key! {
/// The outer Result is for RequestBuilder::build(), the inner is for Request::send().
pub struct MockHttp => Box<dyn Fn(&RequestBuilder, &str) -> std::io::Result<std::io::Result<Vec<u8>>> + Send + Sync>
}
#[cfg(mock)]
impl MockHttp {
/// If returned from a MockHttp callback, other transports will be attempted.
#[allow(unused)]
pub fn try_others() -> std::io::Result<std::io::Result<Vec<u8>>> {
Err(std::io::ErrorKind::Interrupted.into())
}
}
/// The user agent used by this application.
pub const USER_AGENT: &str = concat!(env!("CARGO_PKG_NAME"), "/", env!("CARGO_PKG_VERSION"));
// TODO set reasonable connect timeout and low speed limit?
/// Types of requests that can be created.
#[derive(Debug, Clone, PartialEq, Eq)]
pub enum RequestBuilder<'a> {
/// Send a POST with multiple mime parts.
MimePost { parts: Vec<MimePart<'a>> },
/// Gzip and POST a file's contents.
#[allow(unused)]
GzipAndPostFile { file: &'a Path },
/// Send a POST.
Post {
body: &'a [u8],
headers: &'a [(String, String)],
},
}
/// A single mime part to send.
#[derive(Debug, Clone, PartialEq, Eq)]
pub struct MimePart<'a> {
pub name: &'a str,
pub content: MimePartContent<'a>,
pub filename: Option<&'a str>,
pub mime_type: Option<&'a str>,
}
/// The content of a mime part.
#[derive(Debug, Clone, PartialEq, Eq)]
pub enum MimePartContent<'a> {
/// Send a file's contents.
File(&'a Path),
/// Send a specific string as the contents.
String(&'a str),
}
/// A request that is ready to be sent.
pub enum Request {
CurlChild {
child: Child,
stdin: Option<Box<dyn Read + Send + 'static>>,
},
LibCurl {
easy: super::libcurl::Easy<'static>,
},
#[cfg(mock)]
Mock {
response: std::io::Result<Vec<u8>>,
},
}
/// Format a `time::Date` using the date format described by RFC 7231, section 7.1.1.2, for use in
/// the HTTP Date header.
fn format_rfc7231_datetime(datetime: time::OffsetDateTime) -> anyhow::Result<String> {
let format = time::macros::format_description!(
"[weekday repr:short], [day] [month repr:short] [year] [hour]:[minute]:[second] GMT"
);
datetime
.to_offset(time::UtcOffset::UTC)
.format(format)
.context("failed to format datetime")
}
fn now_date_header() -> Option<String> {
match format_rfc7231_datetime(time::OffsetDateTime::now_utc()) {
Err(e) => {
log::warn!("failed to format Date header, omitting: {e}");
None
}
Ok(s) => Some(format!("Date: {s}")),
}
}
impl RequestBuilder<'_> {
/// Build the request with the given url.
pub fn build(&self, url: &str) -> std::io::Result<Request> {
// When mocking is enabled, check for that first.
#[cfg(mock)]
if let Some(r) = self.try_send_with_mock(url) {
return r;
}
// Windows 10+ and macOS 10.15+ contain `curl` 7.64.1+ as a system-provided executable, so
// `send_with_curl_executable` should not fail.
//
// Linux distros generally do not contain `curl`, but `libcurl` is very likely to be
// incidentally installed (if not outright part of the distro base packages). Based on a
// cursory look at the debian repositories as an exemplar, the curl executable (rather than
// library) is much less likely to be incidentally installed.
//
// For uniformity, we always will try the curl executable first, then try libcurl if that
// fails.
let curl_err = match self.send_with_curl_executable(url) {
Ok(r) => return Ok(r),
Err(e) => e,
};
// When mocking is enabled, default to _not_ using libcurl (because there is no mock
// interface; it will really use libcurl). However we add a hook to use libcurl for tests
// which want to send real data to some server (which may be a local test server).
#[cfg(mock)]
if !crate::std::mock::try_hook(false, "use_system_libcurl") {
log::error!("use_system_libcurl not enabled and curl failed: {curl_err}");
panic!("no mock handler available to build http request");
}
log::info!("failed to invoke curl ({curl_err}), trying libcurl");
self.send_with_libcurl(url)
}
/// Send the request with the `curl` executable.
fn send_with_curl_executable(&self, url: &str) -> std::io::Result<Request> {
let mut cmd = crate::process::background_command("curl");
let mut stdin: Option<Box<dyn Read + Send + 'static>> = None;
cmd.args(["--user-agent", USER_AGENT]);
match self {
Self::MimePost { parts } => {
for part in parts {
part.curl_command_args(&mut cmd, &mut stdin)?;
}
}
Self::GzipAndPostFile { file } => {
cmd.args(["--header", "Content-Encoding: gzip", "--data-binary", "@-"]);
if let Some(header) = now_date_header() {
cmd.args(["--header", &header]);
}
let encoder = flate2::read::GzEncoder::new(File::open(file)?, Default::default());
stdin = Some(Box::new(encoder));
}
Self::Post { body, headers } => {
for (k, v) in headers.iter() {
cmd.args(["--header", &format!("{k}: {v}")]);
}
cmd.args(["--data-binary", "@-"]);
stdin = Some(Box::new(std::io::Cursor::new(body.to_vec())));
}
}
cmd.arg(url);
cmd.stdin(std::process::Stdio::piped());
cmd.stdout(std::process::Stdio::piped());
cmd.stderr(std::process::Stdio::piped());
cmd.spawn()
.map(move |child| Request::CurlChild { child, stdin })
}
/// Send the request with the `curl` library.
fn send_with_libcurl(&self, url: &str) -> std::io::Result<Request> {
let curl = super::libcurl::load()?;
let mut easy = curl.easy()?;
easy.set_url(url)?;
easy.set_user_agent(USER_AGENT)?;
easy.set_max_redirs(30)?;
match self {
Self::MimePost { parts } => {
let mut mime = easy.mime()?;
for part in parts {
part.curl_mime(&mut mime)?;
}
easy.set_mime_post(mime)?;
}
Self::GzipAndPostFile { file } => {
let mut headers = easy.slist();
headers.append("Content-Encoding: gzip")?;
if let Some(header) = now_date_header() {
headers.append(&header)?;
}
easy.set_headers(headers)?;
let mut encoder =
flate2::read::GzEncoder::new(File::open(file)?, Default::default());
let mut data = Vec::new();
encoder.read_to_end(&mut data)?;
easy.set_postfields(data)?;
}
Self::Post { body, headers } => {
let mut header_list = easy.slist();
for (k, v) in headers.iter() {
header_list.append(&format!("{k}: {v}"))?;
}
easy.set_headers(header_list)?;
easy.set_postfields(*body)?;
}
}
Ok(Request::LibCurl { easy })
}
#[cfg(mock)]
fn try_send_with_mock(&self, url: &str) -> Option<std::io::Result<Request>> {
let result = MockHttp.try_get(|f| f(self, url))?;
if result
.as_ref()
.err()
.map(|e| e.kind() == std::io::ErrorKind::Interrupted)
.unwrap_or(false)
{
None
} else {
Some(result.map(|response| Request::Mock { response }))
}
}
}
impl MimePart<'_> {
fn curl_command_args(
&self,
cmd: &mut crate::std::process::Command,
stdin: &mut Option<Box<dyn Read + Send + 'static>>,
) -> std::io::Result<()> {
use std::fmt::Write;
let mut formarg = format!("{}=", self.name);
match self.content {
MimePartContent::File(f) => {
write!(formarg, "@{}", CurlQuote(&f.display().to_string())).unwrap()
}
MimePartContent::String(s) => {
// `@-` causes the data to be read from stdin, which is desirable to
// not have to worry about process argument string length limitations
// (though they are generally pretty high limits).
write!(formarg, "@-").unwrap();
if stdin
.replace(Box::new(std::io::Cursor::new(s.to_owned())))
.is_some()
{
return Err(std::io::Error::other(
"only one MimePartContent::String supported",
));
}
}
}
if let Some(filename) = self.filename {
write!(formarg, ";filename={}", filename).unwrap();
}
if let Some(mime_type) = self.mime_type {
write!(formarg, ";type={}", mime_type).unwrap();
}
cmd.arg("--form");
cmd.arg(formarg);
Ok(())
}
fn curl_mime(&self, mime: &mut super::libcurl::Mime) -> std::io::Result<()> {
let mut p = mime.add_part()?;
p.set_name(&self.name)?;
match self.content {
MimePartContent::File(f) => {
p.set_filename(&f.display().to_string())?;
p.set_filedata(f)?;
}
MimePartContent::String(s) => {
p.set_data(s.as_bytes())?;
}
}
if let Some(filename) = self.filename {
p.set_filename(filename)?;
}
if let Some(mime_type) = self.mime_type {
p.set_type(mime_type)?;
}
Ok(())
}
}
impl Request {
/// Send the request, returning the response body (if any).
pub fn send(self) -> anyhow::Result<Vec<u8>> {
Ok(match self {
Self::CurlChild { mut child, stdin } => {
if let Some(mut stdin) = stdin {
let mut child_stdin = child
.stdin
.take()
.context("failed to get curl process stdin")?;
std::io::copy(&mut stdin, &mut child_stdin)
.context("failed to write to stdin of curl process")?;
// stdin is dropped at the end of this scope so that the stream gets an EOF,
// otherwise curl will wait for more input.
}
let output = child
.wait_with_output()
.context("failed to wait on curl process")?;
anyhow::ensure!(
output.status.success(),
"process failed (exit status {}) with stderr: {}",
output.status,
String::from_utf8_lossy(&output.stderr)
);
output.stdout
}
Self::LibCurl { easy } => {
let response = easy.perform()?;
let response_code = easy.get_response_code()?;
anyhow::ensure!(
response_code == 200,
"unexpected response code ({response_code}): {}",
String::from_utf8_lossy(&response).as_ref()
);
response
}
#[cfg(mock)]
Self::Mock { response } => response?,
})
}
}
/// Quote a string per https://curl.se/docs/manpage.html#-F.
/// That is, add quote characters and escape " and \ with backslashes.
struct CurlQuote<'a>(&'a str);
impl CurlQuote<'_> {
fn quoted(&self) -> String {
let quote = std::iter::once(&b'"');
let escaped = self.0.as_bytes().iter().flat_map(|b| match b {
b'"' => br#"\""#.as_slice(),
b'\\' => br#"\\"#.as_slice(),
other => std::slice::from_ref(other),
});
let bytes = quote.clone().chain(escaped).chain(quote).copied().collect();
// # Safety
// The source bytes came from a `str`, so must have been valid utf8. We are inserting valid
// utf8 characters (quotes and backslashes, which are single bytes in utf8) at character
// boundaries (at the beginning/end of the string and before other backslash/quote
// characters).
unsafe { String::from_utf8_unchecked(bytes) }
}
}
impl std::fmt::Display for CurlQuote<'_> {
fn fmt(&self, f: &mut std::fmt::Formatter<'_>) -> std::fmt::Result {
write!(f, "{}", self.quoted())
}
}
#[cfg(test)]
mod test {
use super::*;
#[test]
fn curl_quote() {
assert_eq!(
CurlQuote(r#"hello "world""#).to_string(),
r#""hello \"world\"""#
);
assert_eq!(
CurlQuote(r#"C:\dir\\"\""dir""#).to_string(),
r#""C:\\dir\\\\\"\\\"\"dir\"""#
);
}
}