2017-01-25 18:51:41 +01:00
|
|
|
// Copyright 2015-2017 Parity Technologies (UK) Ltd.
|
2016-09-27 16:27:06 +02:00
|
|
|
// This file is part of Parity.
|
|
|
|
|
|
|
|
// Parity is free software: you can redistribute it and/or modify
|
|
|
|
// it under the terms of the GNU General Public License as published by
|
|
|
|
// the Free Software Foundation, either version 3 of the License, or
|
|
|
|
// (at your option) any later version.
|
|
|
|
|
|
|
|
// Parity is distributed in the hope that it will be useful,
|
|
|
|
// but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
|
|
// MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
|
|
// GNU General Public License for more details.
|
|
|
|
|
|
|
|
// You should have received a copy of the GNU General Public License
|
|
|
|
// along with Parity. If not, see <http://www.gnu.org/licenses/>.
|
|
|
|
|
2018-03-14 13:40:54 +01:00
|
|
|
use futures::future::{self, Loop};
|
|
|
|
use futures::sync::{mpsc, oneshot};
|
|
|
|
use futures::{self, Future, Async, Sink, Stream};
|
|
|
|
use futures_timer::FutureExt;
|
|
|
|
use hyper::header::{UserAgent, Location, ContentLength, ContentType};
|
|
|
|
use hyper::mime::Mime;
|
|
|
|
use hyper::{self, Request, Method, StatusCode};
|
|
|
|
use hyper_rustls;
|
|
|
|
use std;
|
|
|
|
use std::cmp::min;
|
2016-12-22 18:26:39 +01:00
|
|
|
use std::sync::Arc;
|
2018-03-14 13:40:54 +01:00
|
|
|
use std::sync::atomic::{AtomicBool, AtomicUsize, Ordering};
|
|
|
|
use std::sync::mpsc::RecvTimeoutError;
|
|
|
|
use std::thread;
|
|
|
|
use std::time::Duration;
|
|
|
|
use std::{io, fmt};
|
|
|
|
use tokio_core::reactor;
|
|
|
|
use url::{self, Url};
|
|
|
|
|
|
|
|
/// Default limit for the response body size in bytes (64 MiB).
const MAX_SIZE: usize = 64 * 1024 * 1024;
/// Default limit for the total request duration in seconds.
const MAX_SECS: u64 = 5;
/// Default limit for the number of redirects to follow.
const MAX_REDR: usize = 5;

/// Cancellation flag plus the limits that apply to a request.
///
/// A request ends early either because one of the thresholds stored
/// here (maximum response size, maximum duration, maximum number of
/// redirects) has been reached, or because the calling code has
/// explicitly called `abort`. Clones share the same abort flag.
#[derive(Clone, Debug)]
pub struct Abort {
    abort: Arc<AtomicBool>,
    size: usize,
    time: Duration,
    redir: usize,
}

impl Default for Abort {
    /// A fresh, not yet aborted handle with the default limits.
    fn default() -> Abort {
        Abort::from(Arc::new(AtomicBool::new(false)))
    }
}

impl From<Arc<AtomicBool>> for Abort {
    /// Wrap an existing flag, applying the default limits.
    fn from(a: Arc<AtomicBool>) -> Abort {
        let time = Duration::from_secs(MAX_SECS);
        Abort { abort: a, size: MAX_SIZE, time: time, redir: MAX_REDR }
    }
}

impl Abort {
    /// True if `abort` has been invoked.
    pub fn is_aborted(&self) -> bool {
        let flag: &AtomicBool = &self.abort;
        flag.load(Ordering::SeqCst)
    }

    /// The maximum response body size.
    pub fn max_size(&self) -> usize {
        self.size
    }

    /// The maximum total time, including redirects.
    pub fn max_duration(&self) -> Duration {
        self.time
    }

    /// The maximum number of redirects to allow.
    pub fn max_redirects(&self) -> usize {
        self.redir
    }

    /// Mark as aborted.
    pub fn abort(&self) {
        let flag: &AtomicBool = &self.abort;
        flag.store(true, Ordering::SeqCst)
    }

    /// Set the maximum response body size.
    pub fn with_max_size(self, n: usize) -> Abort {
        let mut updated = self;
        updated.size = n;
        updated
    }

    /// Set the maximum duration (including redirects).
    pub fn with_max_duration(self, d: Duration) -> Abort {
        let mut updated = self;
        updated.time = d;
        updated
    }

    /// Set the maximum number of redirects to follow.
    pub fn with_max_redirects(self, n: usize) -> Abort {
        let mut updated = self;
        updated.redir = n;
        updated
    }
}
|
|
|
|
|
2018-03-14 13:40:54 +01:00
|
|
|
/// Types which retrieve content from some URL.
|
|
|
|
pub trait Fetch: Clone + Send + Sync + 'static {
|
|
|
|
/// The result future.
|
|
|
|
type Result: Future<Item=Response, Error=Error> + Send + 'static;
|
|
|
|
|
|
|
|
/// Get content from some URL.
|
|
|
|
fn fetch(&self, url: &str, abort: Abort) -> Self::Result;
|
|
|
|
}
|
2017-02-02 19:11:28 +01:00
|
|
|
|
2018-03-14 13:40:54 +01:00
|
|
|
type TxResponse = oneshot::Sender<Result<Response, Error>>;
|
|
|
|
type TxStartup = std::sync::mpsc::SyncSender<Result<(), io::Error>>;
|
|
|
|
type ChanItem = Option<(Url, Abort, TxResponse)>;
|
|
|
|
|
|
|
|
/// An implementation of `Fetch` using a `hyper` client.
|
|
|
|
// Due to the `Send` bound of `Fetch` we spawn a background thread for
|
|
|
|
// actual request/response processing as `hyper::Client` itself does
|
|
|
|
// not implement `Send` currently.
|
|
|
|
#[derive(Debug)]
|
2016-09-27 16:27:06 +02:00
|
|
|
pub struct Client {
|
2018-03-14 13:40:54 +01:00
|
|
|
core: mpsc::Sender<ChanItem>,
|
|
|
|
refs: Arc<AtomicUsize>,
|
2016-09-27 16:27:06 +02:00
|
|
|
}
|
|
|
|
|
2018-03-14 13:40:54 +01:00
|
|
|
// When cloning a client we increment the internal reference counter.
|
2017-02-02 19:11:28 +01:00
|
|
|
impl Clone for Client {
|
2018-03-14 13:40:54 +01:00
|
|
|
fn clone(&self) -> Client {
|
|
|
|
self.refs.fetch_add(1, Ordering::SeqCst);
|
2017-02-02 19:11:28 +01:00
|
|
|
Client {
|
2018-03-14 13:40:54 +01:00
|
|
|
core: self.core.clone(),
|
|
|
|
refs: self.refs.clone(),
|
2017-02-02 19:11:28 +01:00
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2018-03-14 13:40:54 +01:00
|
|
|
// When dropping a client, we decrement the reference counter.
|
|
|
|
// Once it reaches 0 we terminate the background thread.
|
|
|
|
impl Drop for Client {
|
|
|
|
fn drop(&mut self) {
|
|
|
|
if self.refs.fetch_sub(1, Ordering::SeqCst) == 1 {
|
|
|
|
// ignore send error as it means the background thread is gone already
|
|
|
|
let _ = self.core.clone().send(None).wait();
|
|
|
|
}
|
2017-02-02 19:11:28 +01:00
|
|
|
}
|
2018-03-14 13:40:54 +01:00
|
|
|
}
|
2016-12-22 18:26:39 +01:00
|
|
|
|
2018-03-14 13:40:54 +01:00
|
|
|
impl Client {
|
|
|
|
/// Create a new fetch client.
|
|
|
|
pub fn new() -> Result<Self, Error> {
|
|
|
|
let (tx_start, rx_start) = std::sync::mpsc::sync_channel(1);
|
|
|
|
let (tx_proto, rx_proto) = mpsc::channel(64);
|
2017-02-02 19:11:28 +01:00
|
|
|
|
2018-03-14 13:40:54 +01:00
|
|
|
Client::background_thread(tx_start, rx_proto)?;
|
2018-02-22 11:22:25 +01:00
|
|
|
|
2018-03-14 13:40:54 +01:00
|
|
|
match rx_start.recv_timeout(Duration::from_secs(10)) {
|
|
|
|
Err(RecvTimeoutError::Timeout) => {
|
|
|
|
error!(target: "fetch", "timeout starting background thread");
|
|
|
|
return Err(Error::BackgroundThreadDead)
|
2017-02-02 19:11:28 +01:00
|
|
|
}
|
2018-03-14 13:40:54 +01:00
|
|
|
Err(RecvTimeoutError::Disconnected) => {
|
|
|
|
error!(target: "fetch", "background thread gone");
|
|
|
|
return Err(Error::BackgroundThreadDead)
|
|
|
|
}
|
|
|
|
Ok(Err(e)) => {
|
|
|
|
error!(target: "fetch", "error starting background thread: {}", e);
|
|
|
|
return Err(e.into())
|
|
|
|
}
|
|
|
|
Ok(Ok(())) => {}
|
2017-02-02 19:11:28 +01:00
|
|
|
}
|
|
|
|
|
2018-03-14 13:40:54 +01:00
|
|
|
Ok(Client {
|
|
|
|
core: tx_proto,
|
|
|
|
refs: Arc::new(AtomicUsize::new(1)),
|
|
|
|
})
|
2017-02-02 19:11:28 +01:00
|
|
|
}
|
2017-07-11 12:23:46 +02:00
|
|
|
|
2018-03-14 13:40:54 +01:00
|
|
|
fn background_thread(tx_start: TxStartup, rx_proto: mpsc::Receiver<ChanItem>) -> io::Result<thread::JoinHandle<()>> {
|
|
|
|
thread::Builder::new().name("fetch".into()).spawn(move || {
|
|
|
|
let mut core = match reactor::Core::new() {
|
|
|
|
Ok(c) => c,
|
|
|
|
Err(e) => return tx_start.send(Err(e)).unwrap_or(())
|
|
|
|
};
|
|
|
|
|
|
|
|
let handle = core.handle();
|
|
|
|
let hyper = hyper::Client::configure()
|
|
|
|
.connector(hyper_rustls::HttpsConnector::new(4, &core.handle()))
|
|
|
|
.build(&core.handle());
|
|
|
|
|
|
|
|
let future = rx_proto.take_while(|item| Ok(item.is_some()))
|
|
|
|
.map(|item| item.expect("`take_while` is only passing on channel items != None; qed"))
|
|
|
|
.for_each(|(url, abort, sender)|
|
|
|
|
{
|
|
|
|
trace!(target: "fetch", "new request to {}", url);
|
|
|
|
if abort.is_aborted() {
|
|
|
|
return future::ok(sender.send(Err(Error::Aborted)).unwrap_or(()))
|
|
|
|
}
|
|
|
|
let ini = (hyper.clone(), url, abort, 0);
|
|
|
|
let fut = future::loop_fn(ini, |(client, url, abort, redirects)| {
|
|
|
|
let url2 = url.clone();
|
|
|
|
let abort2 = abort.clone();
|
|
|
|
client.request(get(&url))
|
|
|
|
.map(move |resp| Response::new(url2, resp, abort2))
|
|
|
|
.from_err()
|
|
|
|
.and_then(move |resp| {
|
|
|
|
if abort.is_aborted() {
|
|
|
|
debug!(target: "fetch", "fetch of {} aborted", url);
|
|
|
|
return Err(Error::Aborted)
|
|
|
|
}
|
|
|
|
if let Some(next_url) = redirect_location(url, &resp) {
|
|
|
|
if redirects >= abort.max_redirects() {
|
|
|
|
return Err(Error::TooManyRedirects)
|
|
|
|
}
|
|
|
|
Ok(Loop::Continue((client, next_url, abort, redirects + 1)))
|
|
|
|
} else {
|
|
|
|
let content_len = resp.headers.get::<ContentLength>().cloned();
|
|
|
|
if content_len.map(|n| *n > abort.max_size() as u64).unwrap_or(false) {
|
|
|
|
return Err(Error::SizeLimit)
|
|
|
|
}
|
|
|
|
Ok(Loop::Break(resp))
|
|
|
|
}
|
|
|
|
})
|
|
|
|
})
|
|
|
|
.then(|result| {
|
|
|
|
future::ok(sender.send(result).unwrap_or(()))
|
|
|
|
});
|
|
|
|
handle.spawn(fut);
|
|
|
|
trace!(target: "fetch", "waiting for next request ...");
|
|
|
|
future::ok(())
|
|
|
|
});
|
|
|
|
|
|
|
|
tx_start.send(Ok(())).unwrap_or(());
|
|
|
|
|
|
|
|
debug!(target: "fetch", "processing requests ...");
|
|
|
|
if let Err(()) = core.run(future) {
|
|
|
|
error!(target: "fetch", "error while executing future")
|
|
|
|
}
|
|
|
|
debug!(target: "fetch", "fetch background thread finished")
|
|
|
|
})
|
2017-07-11 12:23:46 +02:00
|
|
|
}
|
2016-12-22 18:26:39 +01:00
|
|
|
}
|
|
|
|
|
|
|
|
impl Fetch for Client {
|
2018-03-14 13:40:54 +01:00
|
|
|
type Result = Box<Future<Item=Response, Error=Error> + Send>;
|
|
|
|
|
|
|
|
fn fetch(&self, url: &str, abort: Abort) -> Self::Result {
|
|
|
|
debug!(target: "fetch", "fetching: {:?}", url);
|
|
|
|
if abort.is_aborted() {
|
|
|
|
return Box::new(future::err(Error::Aborted))
|
2017-02-02 19:11:28 +01:00
|
|
|
}
|
2018-03-14 13:40:54 +01:00
|
|
|
let url: Url = match url.parse() {
|
|
|
|
Ok(u) => u,
|
|
|
|
Err(e) => return Box::new(future::err(e.into()))
|
|
|
|
};
|
|
|
|
let (tx_res, rx_res) = oneshot::channel();
|
|
|
|
let maxdur = abort.max_duration();
|
|
|
|
let sender = self.core.clone();
|
|
|
|
let future = sender.send(Some((url.clone(), abort, tx_res)))
|
|
|
|
.map_err(|e| {
|
|
|
|
error!(target: "fetch", "failed to schedule request: {}", e);
|
|
|
|
Error::BackgroundThreadDead
|
|
|
|
})
|
|
|
|
.and_then(|_| rx_res.map_err(|oneshot::Canceled| Error::BackgroundThreadDead))
|
|
|
|
.and_then(future::result)
|
|
|
|
.timeout(maxdur)
|
|
|
|
.map_err(|err| {
|
|
|
|
if let Error::Io(ref e) = err {
|
|
|
|
if let io::ErrorKind::TimedOut = e.kind() {
|
|
|
|
return Error::Timeout
|
|
|
|
}
|
|
|
|
}
|
|
|
|
err.into()
|
|
|
|
});
|
|
|
|
Box::new(future)
|
2016-09-27 16:27:06 +02:00
|
|
|
}
|
2016-12-22 18:26:39 +01:00
|
|
|
}
|
2016-09-27 16:27:06 +02:00
|
|
|
|
2018-03-14 13:40:54 +01:00
|
|
|
// Extract redirect location from response.
|
|
|
|
fn redirect_location(u: Url, r: &Response) -> Option<Url> {
|
|
|
|
use hyper::StatusCode::*;
|
|
|
|
match r.status() {
|
|
|
|
MovedPermanently
|
|
|
|
| PermanentRedirect
|
|
|
|
| TemporaryRedirect
|
|
|
|
| Found
|
|
|
|
| SeeOther => {
|
|
|
|
if let Some(loc) = r.headers.get::<Location>() {
|
|
|
|
u.join(loc).ok()
|
|
|
|
} else {
|
|
|
|
None
|
|
|
|
}
|
|
|
|
}
|
|
|
|
_ => None
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
// Build a simple GET request for the given Url.
|
|
|
|
fn get(u: &Url) -> hyper::Request {
|
|
|
|
let uri = u.as_ref().parse().expect("Every valid URL is aso a URI.");
|
|
|
|
let mut rq = Request::new(Method::Get, uri);
|
|
|
|
rq.headers_mut().set(UserAgent::new("Parity Fetch Neo"));
|
|
|
|
rq
|
|
|
|
}
|
|
|
|
|
|
|
|
/// An HTTP response.
|
|
|
|
#[derive(Debug)]
|
|
|
|
pub struct Response {
|
|
|
|
url: Url,
|
|
|
|
status: StatusCode,
|
|
|
|
headers: hyper::Headers,
|
|
|
|
body: hyper::Body,
|
2016-12-22 18:26:39 +01:00
|
|
|
abort: Abort,
|
2018-03-14 13:40:54 +01:00
|
|
|
nread: usize,
|
2016-12-22 18:26:39 +01:00
|
|
|
}
|
|
|
|
|
2018-03-14 13:40:54 +01:00
|
|
|
impl Response {
|
|
|
|
/// Create a new response, wrapping a hyper response.
|
|
|
|
pub fn new(u: Url, r: hyper::Response, a: Abort) -> Response {
|
|
|
|
Response {
|
|
|
|
url: u,
|
|
|
|
status: r.status(),
|
|
|
|
headers: r.headers().clone(),
|
|
|
|
body: r.body(),
|
|
|
|
abort: a,
|
|
|
|
nread: 0,
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
/// The response status.
|
|
|
|
pub fn status(&self) -> StatusCode {
|
|
|
|
self.status
|
|
|
|
}
|
|
|
|
|
|
|
|
/// Status code == OK (200)?
|
|
|
|
pub fn is_success(&self) -> bool {
|
|
|
|
self.status() == StatusCode::Ok
|
|
|
|
}
|
|
|
|
|
|
|
|
/// Is the content-type text/html?
|
|
|
|
pub fn is_html(&self) -> bool {
|
|
|
|
if let Some(ref mime) = self.content_type() {
|
|
|
|
mime.type_() == "text" && mime.subtype() == "html"
|
|
|
|
} else {
|
|
|
|
false
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
/// The conten-type header value.
|
|
|
|
pub fn content_type(&self) -> Option<Mime> {
|
|
|
|
self.headers.get::<ContentType>().map(|ct| ct.0.clone())
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
impl Stream for Response {
|
|
|
|
type Item = hyper::Chunk;
|
2016-12-22 18:26:39 +01:00
|
|
|
type Error = Error;
|
|
|
|
|
2018-03-14 13:40:54 +01:00
|
|
|
fn poll(&mut self) -> futures::Poll<Option<Self::Item>, Self::Error> {
|
2016-12-22 18:26:39 +01:00
|
|
|
if self.abort.is_aborted() {
|
2018-03-14 13:40:54 +01:00
|
|
|
debug!(target: "fetch", "fetch of {} aborted", self.url);
|
|
|
|
return Err(Error::Aborted)
|
|
|
|
}
|
|
|
|
match try_ready!(self.body.poll()) {
|
|
|
|
None => Ok(Async::Ready(None)),
|
|
|
|
Some(c) => {
|
|
|
|
if self.nread + c.len() > self.abort.max_size() {
|
|
|
|
debug!(target: "fetch", "size limit {:?} for {} exceeded", self.abort.max_size(), self.url);
|
|
|
|
return Err(Error::SizeLimit)
|
|
|
|
}
|
|
|
|
self.nread += c.len();
|
|
|
|
Ok(Async::Ready(Some(c)))
|
|
|
|
}
|
2016-12-22 18:26:39 +01:00
|
|
|
}
|
2018-03-14 13:40:54 +01:00
|
|
|
}
|
|
|
|
}
|
2016-12-22 18:26:39 +01:00
|
|
|
|
2018-03-14 13:40:54 +01:00
|
|
|
/// `BodyReader` serves as an adapter from async to sync I/O.
|
|
|
|
///
|
|
|
|
/// It implements `io::Read` by repedately waiting for the next `Chunk`
|
|
|
|
/// of hyper's response `Body` which blocks the current thread.
|
|
|
|
pub struct BodyReader {
|
|
|
|
chunk: hyper::Chunk,
|
|
|
|
body: Option<hyper::Body>,
|
|
|
|
abort: Abort,
|
|
|
|
offset: usize,
|
|
|
|
count: usize,
|
|
|
|
}
|
2016-12-22 18:26:39 +01:00
|
|
|
|
2018-03-14 13:40:54 +01:00
|
|
|
impl BodyReader {
|
|
|
|
/// Create a new body reader for the given response.
|
|
|
|
pub fn new(r: Response) -> BodyReader {
|
|
|
|
BodyReader {
|
|
|
|
body: Some(r.body),
|
|
|
|
chunk: Default::default(),
|
|
|
|
abort: r.abort,
|
|
|
|
offset: 0,
|
|
|
|
count: 0,
|
|
|
|
}
|
2016-09-27 16:27:06 +02:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2018-03-14 13:40:54 +01:00
|
|
|
impl io::Read for BodyReader {
|
|
|
|
fn read(&mut self, buf: &mut [u8]) -> io::Result<usize> {
|
|
|
|
let mut n = 0;
|
|
|
|
while self.body.is_some() {
|
|
|
|
// Can we still read from the current chunk?
|
|
|
|
if self.offset < self.chunk.len() {
|
|
|
|
let k = min(self.chunk.len() - self.offset, buf.len() - n);
|
|
|
|
if self.count + k > self.abort.max_size() {
|
|
|
|
debug!(target: "fetch", "size limit {:?} exceeded", self.abort.max_size());
|
|
|
|
return Err(io::Error::new(io::ErrorKind::PermissionDenied, "size limit exceeded"))
|
|
|
|
}
|
|
|
|
let c = &self.chunk[self.offset .. self.offset + k];
|
|
|
|
(&mut buf[n .. n + k]).copy_from_slice(c);
|
|
|
|
self.offset += k;
|
|
|
|
self.count += k;
|
|
|
|
n += k;
|
|
|
|
if n == buf.len() {
|
|
|
|
break
|
|
|
|
}
|
|
|
|
} else {
|
|
|
|
let body = self.body.take().expect("loop condition ensures `self.body` is always defined; qed");
|
|
|
|
match body.into_future().wait() { // wait for next chunk
|
|
|
|
Err((e, _)) => {
|
|
|
|
error!(target: "fetch", "failed to read chunk: {}", e);
|
|
|
|
return Err(io::Error::new(io::ErrorKind::Other, "failed to read body chunk"))
|
|
|
|
}
|
|
|
|
Ok((None, _)) => break, // body is exhausted, break out of the loop
|
|
|
|
Ok((Some(c), b)) => {
|
|
|
|
self.body = Some(b);
|
|
|
|
self.chunk = c;
|
|
|
|
self.offset = 0
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
Ok(n)
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
/// Fetch error cases.
|
2016-12-22 18:26:39 +01:00
|
|
|
#[derive(Debug)]
|
|
|
|
pub enum Error {
|
2018-03-14 13:40:54 +01:00
|
|
|
/// Hyper gave us an error.
|
|
|
|
Hyper(hyper::Error),
|
|
|
|
/// Some I/O error occured.
|
|
|
|
Io(io::Error),
|
|
|
|
/// Invalid URLs where attempted to parse.
|
|
|
|
Url(url::ParseError),
|
|
|
|
/// Calling code invoked `Abort::abort`.
|
2016-12-22 18:26:39 +01:00
|
|
|
Aborted,
|
2018-03-14 13:40:54 +01:00
|
|
|
/// Too many redirects have been encountered.
|
|
|
|
TooManyRedirects,
|
|
|
|
/// The maximum duration was reached.
|
|
|
|
Timeout,
|
|
|
|
/// The response body is too large.
|
|
|
|
SizeLimit,
|
|
|
|
/// The background processing thread does not run.
|
|
|
|
BackgroundThreadDead,
|
2016-12-22 18:26:39 +01:00
|
|
|
}
|
|
|
|
|
2017-07-11 12:23:46 +02:00
|
|
|
impl fmt::Display for Error {
|
|
|
|
fn fmt(&self, fmt: &mut fmt::Formatter) -> fmt::Result {
|
|
|
|
match *self {
|
|
|
|
Error::Aborted => write!(fmt, "The request has been aborted."),
|
2018-03-14 13:40:54 +01:00
|
|
|
Error::Hyper(ref e) => write!(fmt, "{}", e),
|
|
|
|
Error::Url(ref e) => write!(fmt, "{}", e),
|
|
|
|
Error::Io(ref e) => write!(fmt, "{}", e),
|
|
|
|
Error::BackgroundThreadDead => write!(fmt, "background thread gond"),
|
|
|
|
Error::TooManyRedirects => write!(fmt, "too many redirects"),
|
|
|
|
Error::Timeout => write!(fmt, "request timed out"),
|
|
|
|
Error::SizeLimit => write!(fmt, "size limit reached"),
|
2017-07-11 12:23:46 +02:00
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2018-03-14 13:40:54 +01:00
|
|
|
impl From<hyper::Error> for Error {
|
|
|
|
fn from(e: hyper::Error) -> Self {
|
|
|
|
Error::Hyper(e)
|
2016-09-27 16:27:06 +02:00
|
|
|
}
|
2016-12-22 18:26:39 +01:00
|
|
|
}
|
|
|
|
|
2018-03-14 13:40:54 +01:00
|
|
|
impl From<io::Error> for Error {
|
|
|
|
fn from(e: io::Error) -> Self {
|
|
|
|
Error::Io(e)
|
|
|
|
}
|
2016-12-22 18:26:39 +01:00
|
|
|
}
|
2016-09-27 16:27:06 +02:00
|
|
|
|
2018-03-14 13:40:54 +01:00
|
|
|
impl From<url::ParseError> for Error {
|
|
|
|
fn from(e: url::ParseError) -> Self {
|
|
|
|
Error::Url(e)
|
2016-12-22 18:26:39 +01:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2018-03-14 13:40:54 +01:00
|
|
|
#[cfg(test)]
mod test {
    use super::*;
    use futures::future;
    use futures::sync::mpsc;
    use futures_timer::Delay;
    use hyper::StatusCode;
    use hyper::server::{Http, Request, Response, Service};
    use std;
    use std::io::Read;
    use std::net::SocketAddr;

    // Port 0: bind to whatever free port is available.
    const ADDRESS: &str = "127.0.0.1:0";

    #[test]
    fn it_should_fetch() {
        let server = TestServer::run();
        let client = Client::new().unwrap();
        let url = format!("http://{}?123", server.addr());
        let resp = client.fetch(&url, Default::default()).wait().unwrap();
        assert!(resp.is_success());
        let body = resp.concat2().wait().unwrap();
        assert_eq!(&body[..], b"123")
    }

    #[test]
    fn it_should_timeout() {
        let server = TestServer::run();
        let client = Client::new().unwrap();
        let abort = Abort::default().with_max_duration(Duration::from_secs(1));
        let url = format!("http://{}/delay?3", server.addr());
        match client.fetch(&url, abort).wait() {
            Err(Error::Timeout) => {}
            other => panic!("expected timeout, got {:?}", other)
        }
    }

    #[test]
    fn it_should_follow_redirects() {
        let server = TestServer::run();
        let client = Client::new().unwrap();
        let abort = Abort::default();
        let url = format!("http://{}/redirect?http://{}/", server.addr(), server.addr());
        let resp = client.fetch(&url, abort).wait().unwrap();
        assert!(resp.is_success())
    }

    #[test]
    fn it_should_follow_relative_redirects() {
        let server = TestServer::run();
        let client = Client::new().unwrap();
        let abort = Abort::default().with_max_redirects(4);
        let url = format!("http://{}/redirect?/", server.addr());
        let resp = client.fetch(&url, abort).wait().unwrap();
        assert!(resp.is_success())
    }

    #[test]
    fn it_should_not_follow_too_many_redirects() {
        let server = TestServer::run();
        let client = Client::new().unwrap();
        let abort = Abort::default().with_max_redirects(3);
        let url = format!("http://{}/loop", server.addr());
        match client.fetch(&url, abort).wait() {
            Err(Error::TooManyRedirects) => {}
            other => panic!("expected too many redirects error, got {:?}", other)
        }
    }

    #[test]
    fn it_should_read_data() {
        let server = TestServer::run();
        let client = Client::new().unwrap();
        let abort = Abort::default();
        let url = format!("http://{}?abcdefghijklmnopqrstuvwxyz", server.addr());
        let resp = client.fetch(&url, abort).wait().unwrap();
        assert!(resp.is_success());
        let body = resp.concat2().wait().unwrap();
        assert_eq!(&body[..], b"abcdefghijklmnopqrstuvwxyz")
    }

    #[test]
    fn it_should_not_read_too_much_data() {
        let server = TestServer::run();
        let client = Client::new().unwrap();
        let abort = Abort::default().with_max_size(3);
        let url = format!("http://{}/?1234", server.addr());
        let resp = client.fetch(&url, abort).wait().unwrap();
        assert!(resp.is_success());
        match resp.concat2().wait() {
            Err(Error::SizeLimit) => {}
            other => panic!("expected size limit error, got {:?}", other)
        }
    }

    #[test]
    fn it_should_not_read_too_much_data_sync() {
        let server = TestServer::run();
        let client = Client::new().unwrap();
        let abort = Abort::default().with_max_size(3);
        let url = format!("http://{}/?1234", server.addr());
        let resp = client.fetch(&url, abort).wait().unwrap();
        assert!(resp.is_success());
        let mut reader = BodyReader::new(resp);
        let mut buffer = Vec::new();
        match reader.read_to_end(&mut buffer) {
            Err(ref e) if e.kind() == io::ErrorKind::PermissionDenied => {}
            other => panic!("expected size limit error, got {:?}", other)
        }
    }

    // Minimal HTTP service the tests talk to:
    //   /           replies with the query string as body
    //   /redirect   301 to the location given in the query string (default "/")
    //   /loop       301 to itself
    //   /delay      replies after the number of seconds given in the query string
    //   otherwise   404
    struct TestServer;

    impl Service for TestServer {
        type Request = Request;
        type Response = Response;
        type Error = hyper::Error;
        type Future = Box<Future<Item=Self::Response, Error=Self::Error>>;

        fn call(&self, req: Request) -> Self::Future {
            match req.uri().path() {
                "/" => {
                    let body = req.uri().query().unwrap_or("").to_string();
                    let resp = Response::new().with_body(body);
                    Box::new(future::ok(resp))
                }
                "/redirect" => {
                    let target = req.uri().query().unwrap_or("/").to_string();
                    let resp = Response::new()
                        .with_status(StatusCode::MovedPermanently)
                        .with_header(Location::new(target));
                    Box::new(future::ok(resp))
                }
                "/loop" => {
                    let resp = Response::new()
                        .with_status(StatusCode::MovedPermanently)
                        .with_header(Location::new("/loop".to_string()));
                    Box::new(future::ok(resp))
                }
                "/delay" => {
                    let secs = req.uri().query().unwrap_or("0").parse().unwrap();
                    let d = Duration::from_secs(secs);
                    Box::new(Delay::new(d).from_err().map(|_| Response::new()))
                }
                _ => Box::new(future::ok(Response::new().with_status(StatusCode::NotFound)))
            }
        }
    }

    impl TestServer {
        // Start the server on its own thread and return a handle carrying
        // the bound address; dropping the handle signals the server to stop.
        fn run() -> Handle {
            let (tx_start, rx_start) = std::sync::mpsc::sync_channel(1);
            let (tx_end, rx_end) = mpsc::channel(0);
            let shutdown = rx_end.into_future().map(|_| ()).map_err(|_| ());
            thread::spawn(move || {
                let addr = ADDRESS.parse().unwrap();
                let server = Http::new().bind(&addr, || Ok(TestServer)).unwrap();
                tx_start.send(server.local_addr().unwrap()).unwrap_or(());
                server.run_until(shutdown).unwrap();
            });
            let addr = rx_start.recv().unwrap();
            Handle(addr, tx_end)
        }
    }

    // Address of a running test server plus the channel used to stop it.
    struct Handle(SocketAddr, mpsc::Sender<()>);

    impl Handle {
        fn addr(&self) -> SocketAddr {
            self.0
        }
    }

    impl Drop for Handle {
        fn drop(&mut self) {
            let stop = self.1.clone();
            stop.send(()).wait().unwrap();
        }
    }
}
|