// Static file server that can plug into the PTTH reverse server

// I'm not sure if I like this lint, so it is allowed for the whole module
#![allow (clippy::enum_glob_use)]
use std::{
    borrow::Cow,
    cmp::min,
    collections::HashMap,
    convert::{Infallible, TryFrom, TryInto},
    fmt::Debug,
    io::SeekFrom,
    path::{Path, PathBuf},
};

use handlebars::Handlebars;
use percent_encoding::{
    percent_decode,
};
use serde::Serialize;
use tokio::{
    fs::{
        DirEntry,
        File,
        read_dir,
        ReadDir,
    },
    io::AsyncReadExt,
    sync::mpsc::{
        channel,
    },
};
use tracing::instrument;

#[cfg (test)]
use always_equal::test::AlwaysEqual;

#[cfg (not (test))]
use always_equal::prod::AlwaysEqual;

use ptth_core::{
    http_serde::{
        Method,
        Response,
        StatusCode,
    },
    prelude::*,
    prefix_match,
};

pub mod errors;
mod markdown;
mod range;

use errors::FileServerError;
use markdown::render_styled;
// Emoji used as icons in the directory listing. They are written as
// escapes so the source file stays plain ASCII. `\u{fe0f}` is Unicode
// "variation selector-16", which requests emoji-style rendering of the
// preceding character.
mod emoji {
// U+1F39E FILM FRAMES
pub const VIDEO: &str = "\u{1f39e}\u{fe0f}";
// U+1F4F7 CAMERA
pub const PICTURE: &str = "\u{1f4f7}";
// U+1F4C4 PAGE FACING UP
pub const FILE: &str = "\u{1f4c4}";
// U+1F4C1 FILE FOLDER
pub const FOLDER: &str = "\u{1f4c1}";
// U+26A0 WARNING SIGN
pub const ERROR: &str = "\u{26a0}\u{fe0f}";
}
/// Information about this server that is made available to the HTML
/// templates: it is the whole context of the root page and is flattened
/// into the context of every directory page.
#[derive (Debug, Serialize)]
pub struct ServerInfo {
/// Name of the server, exposed to the templates as `server_name`.
pub server_name: String,
}
/// One row of a directory listing, in the shape the directory template
/// consumes.
#[derive (Serialize)]
struct TemplateDirEntry {
// One of the `emoji` constants
icon: &'static str,
// "/" for directories, "" for everything else
trailing_slash: &'static str,
// Unfortunately file_name will allocate as long as some platforms
// (Windows!) aren't UTF-8. Cause I don't want to write separate code
// for such a small problem.
file_name: String,
// Percent-encoded form of file_name.
// This could be a Cow with file_name if no encoding was done but
// it's simpler to allocate.
encoded_file_name: String,
// Human-readable size; empty for directories and for error rows
size: Cow <'static, str>,
// True when the entry could not be read; file_name then holds an
// error message instead of a real name
error: bool,
}
/// Template context for a whole directory listing page.
#[derive (Serialize)]
struct TemplateDirPage <'a> {
// Flattened, so the fields of ServerInfo appear at the top level of the
// template context next to `path` and `entries`
#[serde (flatten)]
server_info: &'a ServerInfo,
// Path of the directory being listed, as passed in by the caller
path: Cow <'a, str>,
// One element per directory entry
entries: Vec <TemplateDirEntry>,
}
2020-10-30 22:38:23 +00:00
2020-11-25 00:16:14 +00:00
fn get_icon (file_name: &str) -> &'static str {
if
file_name.ends_with (".mp4") ||
file_name.ends_with (".avi") ||
file_name.ends_with (".mkv") ||
file_name.ends_with (".webm")
{
emoji::VIDEO
2020-11-25 00:16:14 +00:00
}
else if
file_name.ends_with (".jpg") ||
file_name.ends_with (".jpeg") ||
file_name.ends_with (".png") ||
file_name.ends_with (".bmp")
{
emoji::PICTURE
2020-11-25 00:16:14 +00:00
}
else {
emoji::FILE
2020-11-25 00:16:14 +00:00
}
}
async fn read_dir_entry (entry: DirEntry) -> TemplateDirEntry
{
2020-11-29 19:05:28 +00:00
use percent_encoding::{
CONTROLS,
utf8_percent_encode,
};
let file_name = match entry.file_name ().into_string () {
Ok (x) => x,
Err (_) => return TemplateDirEntry {
icon: emoji::ERROR,
trailing_slash: "",
file_name: "File / directory name is not UTF-8".into (),
encoded_file_name: "".into (),
size: "".into (),
error: true,
},
};
let metadata = match entry.metadata ().await {
Ok (x) => x,
Err (_) => return TemplateDirEntry {
icon: emoji::ERROR,
trailing_slash: "",
file_name: "Could not fetch metadata".into (),
encoded_file_name: "".into (),
size: "".into (),
error: true,
},
};
let (trailing_slash, icon, size) = {
let t = metadata.file_type ();
if t.is_dir () {
("/", emoji::FOLDER, "".into ())
}
else {
2020-11-25 00:16:14 +00:00
("", get_icon (&file_name), pretty_print_bytes (metadata.len ()).into ())
}
};
let encoded_file_name = utf8_percent_encode (&file_name, CONTROLS).to_string ();
TemplateDirEntry {
icon,
trailing_slash: &trailing_slash,
file_name,
encoded_file_name,
size,
error: false,
}
}
/// Renders the "file_server_root" template with the server info as its
/// context and wraps the result in an HTML response.
///
/// Returns an error if the template fails to render.
async fn serve_root (
    handlebars: &Handlebars <'static>,
    server_info: &ServerInfo
) -> Result <Response, FileServerError>
{
    let rendered = handlebars.render ("file_server_root", &server_info)?;
    let response = serve_html (rendered);
    Ok (response)
}
/// Wraps an already-rendered HTML document in a response with a UTF-8
/// HTML content type. The status code is left at the response's default.
fn serve_html (s: String) -> Response {
    let content_type = b"text/html; charset=UTF-8".to_vec ();

    let mut html_response = Response::default ();
    html_response.header (String::from ("content-type"), content_type);
    html_response.body_bytes (s.into_bytes ());
    html_response
}
#[instrument (level = "debug", skip (handlebars, dir))]
async fn serve_dir (
handlebars: &Handlebars <'static>,
server_info: &ServerInfo,
path: Cow <'_, str>,
mut dir: ReadDir
2020-11-29 19:47:40 +00:00
) -> Result <Response, FileServerError>
{
let mut entries = vec! [];
2020-10-30 22:38:23 +00:00
while let Ok (Some (entry)) = dir.next_entry ().await {
entries.push (read_dir_entry (entry).await);
}
2020-10-30 22:38:23 +00:00
2020-11-29 19:47:40 +00:00
entries.sort_unstable_by (|a, b| a.file_name.cmp (&b.file_name));
let s = handlebars.render ("file_server_dir", &TemplateDirPage {
path,
entries,
server_info,
2020-11-29 19:47:40 +00:00
})?;
2020-10-30 22:38:23 +00:00
2020-11-29 19:47:40 +00:00
Ok (serve_html (s))
2020-10-30 22:38:23 +00:00
}
#[instrument (level = "debug", skip (f))]
2020-10-30 22:38:23 +00:00
async fn serve_file (
mut f: File,
should_send_body: bool,
2020-11-29 22:41:48 +00:00
range: range::ValidParsed
)
2020-11-29 19:47:40 +00:00
-> Result <Response, FileServerError>
{
let (tx, rx) = channel (1);
2020-10-30 22:38:23 +00:00
let body = if should_send_body {
Some (rx)
2020-10-30 22:38:23 +00:00
}
else {
None
};
2020-11-29 22:31:54 +00:00
let (range, range_requested) = (range.range, range.range_requested);
info! ("Serving range {}-{}", range.start, range.end);
2020-10-30 22:38:23 +00:00
let content_length = range.end - range.start;
2020-10-30 22:38:23 +00:00
let seek = SeekFrom::Start (range.start);
2020-11-29 19:47:40 +00:00
f.seek (seek).await?;
2020-10-30 22:38:23 +00:00
if should_send_body {
tokio::spawn (async move {
let mut tx = tx;
let mut bytes_sent = 0;
let mut bytes_left = content_length;
2020-10-30 22:38:23 +00:00
2020-11-09 16:33:13 +00:00
let mark_interval = 200_000;
let mut next_mark = mark_interval;
2020-10-30 22:38:23 +00:00
loop {
2020-11-29 19:05:28 +00:00
let mut buffer = vec! [0_u8; 65_536];
let bytes_read = f.read (&mut buffer).await.expect ("Couldn't read from file");
2020-10-30 22:38:23 +00:00
if bytes_read == 0 {
break;
}
buffer.truncate (bytes_read);
let bytes_read_64 = u64::try_from (bytes_read).expect ("Couldn't fit usize into u64");
let bytes_read_64 = min (bytes_left, bytes_read_64);
if tx.send (Ok::<_, Infallible> (buffer)).await.is_err () {
warn! ("Cancelling file stream (Sent {} out of {} bytes)", bytes_sent, content_length);
2020-10-30 22:38:23 +00:00
break;
}
bytes_left -= bytes_read_64;
2020-10-30 22:38:23 +00:00
if bytes_left == 0 {
debug! ("Finished");
2020-10-30 22:38:23 +00:00
break;
}
bytes_sent += bytes_read_64;
2020-11-09 16:33:13 +00:00
while next_mark <= bytes_sent {
trace! ("Sent {} bytes", next_mark);
next_mark += mark_interval;
}
2020-10-30 22:38:23 +00:00
//delay_for (Duration::from_millis (50)).await;
}
});
}
let mut response = Response::default ();
2020-10-30 22:38:23 +00:00
response.header (String::from ("accept-ranges"), b"bytes".to_vec ());
if range_requested {
response.status_code (StatusCode::PartialContent);
response.header (String::from ("content-range"), format! ("bytes {}-{}/{}", range.start, range.end - 1, range.end).into_bytes ());
}
else {
response.status_code (StatusCode::Ok);
response.header (String::from ("content-length"), range.end.to_string ().into_bytes ());
}
2020-11-29 19:05:28 +00:00
if should_send_body {
response.content_length = Some (content_length);
2020-10-30 22:38:23 +00:00
}
else {
2020-11-29 19:05:28 +00:00
response.status_code (StatusCode::NoContent);
}
2020-10-30 22:38:23 +00:00
if let Some (body) = body {
response.body (body);
}
2020-11-29 19:47:40 +00:00
Ok (response)
2020-10-30 22:38:23 +00:00
}
// Sort of an internal API endpoint to make testing work better.
// Eventually we could expose this as JSON or Msgpack or whatever. For now
// it's just a Rust struct that we can test on without caring about
// human-readable HTML

/// Everything needed to render a directory listing.
#[derive (Debug, PartialEq)]
struct ServeDirParams {
// Path of the directory as joined onto the server root
path: PathBuf,
// Open directory handle, wrapped in AlwaysEqual so this struct can
// still derive PartialEq
dir: AlwaysEqual <ReadDir>,
}
#[derive (Debug, PartialEq)]
struct ServeFileParams {
send_body: bool,
2020-11-29 22:41:48 +00:00
range: range::ValidParsed,
file: AlwaysEqual <File>,
}
/// The routing decision for a request, before it is turned into an actual
/// HTTP response. Keeping this separate from the HTTP response lets the
/// routing logic be compared with `PartialEq`.
#[derive (Debug, PartialEq)]
enum InternalResponse {
// The request was for /favicon.ico
Favicon,
// The requested file must not be served
Forbidden,
// The query string doesn't make sense for the requested object
InvalidQuery,
// Any method other than GET or HEAD
MethodNotAllowed,
// Neither a directory nor a file could be opened at the path
NotFound,
// The range header can't be satisfied; carries the file length
RangeNotSatisfiable (u64),
// Redirect to the contained (relative) location
Redirect (String),
// The request was not under /files, so show the root page
Root,
ServeDir (ServeDirParams),
ServeFile (ServeFileParams),
// Markdown preview was requested but could not be produced
MarkdownErr (markdown::Error),
// Rendered Markdown preview, as HTML
MarkdownPreview (String),
}
/// Decides how to answer a request whose path turned out to be a directory.
///
/// * A non-empty path without a trailing slash is redirected to
///   `<last component>/`.
/// * Any query string is rejected, since directories take no queries.
/// * Otherwise the open directory is handed on for listing.
///
/// Returns an error if a redirect is needed but the path has no final
/// component, or that component is not UTF-8.
fn internal_serve_dir (
    path_s: &str,
    path: &Path,
    dir: tokio::fs::ReadDir,
    full_path: PathBuf,
    uri: &http::Uri
)
-> Result <InternalResponse, FileServerError>
{
    let needs_redirect = ! (path_s.is_empty () || path_s.ends_with ('/'));

    if needs_redirect {
        let last_component = path
            .file_name ()
            .ok_or (FileServerError::NoFileNameRequested)?
            .to_str ()
            .ok_or (FileServerError::FilePathNotUtf8)?;

        return Ok (InternalResponse::Redirect (format! ("{}/", last_component)));
    }

    match uri.query () {
        Some (_) => Ok (InternalResponse::InvalidQuery),
        None => Ok (InternalResponse::ServeDir (ServeDirParams {
            dir: dir.into (),
            path: full_path,
        })),
    }
}
async fn internal_serve_file (
mut file: tokio::fs::File,
uri: &http::Uri,
send_body: bool,
headers: &HashMap <String, Vec <u8>>
)
-> Result <InternalResponse, FileServerError>
{
use std::os::unix::fs::PermissionsExt;
let file_md = file.metadata ().await.map_err (FileServerError::CantGetFileMetadata)?;
if file_md.permissions ().mode () == super::load_toml::CONFIG_PERMISSIONS_MODE
{
return Ok (InternalResponse::Forbidden);
}
let file_len = file_md.len ();
let range_header = headers.get ("range").and_then (|v| std::str::from_utf8 (v).ok ());
2020-11-29 22:41:48 +00:00
Ok (match range::check (range_header, file_len) {
range::Parsed::NotSatisfiable (file_len) => InternalResponse::RangeNotSatisfiable (file_len),
range::Parsed::Valid (range) => {
if uri.query () == Some ("as_markdown") {
2020-11-29 22:41:48 +00:00
const MAX_BUF_SIZE: u32 = 1_000_000;
2020-11-29 22:31:54 +00:00
if range.range_requested {
return Ok (InternalResponse::InvalidQuery);
}
if file_len > MAX_BUF_SIZE.into () {
InternalResponse::MarkdownErr (markdown::Error::TooBig)
}
else {
let mut buffer = vec! [0_u8; MAX_BUF_SIZE.try_into ().expect ("Couldn't fit u32 into usize")];
let bytes_read = file.read (&mut buffer).await?;
buffer.truncate (bytes_read);
match render_styled (&buffer) {
Ok (x) => InternalResponse::MarkdownPreview (x),
Err (x) => InternalResponse::MarkdownErr (x),
}
}
}
else {
let file = file.into ();
InternalResponse::ServeFile (ServeFileParams {
file,
send_body,
range,
})
}
},
})
}
async fn internal_serve_all (
root: &Path,
method: Method,
uri: &str,
headers: &HashMap <String, Vec <u8>>,
hidden_path: Option <&Path>
2020-10-30 22:38:23 +00:00
)
2020-11-29 19:47:40 +00:00
-> Result <InternalResponse, FileServerError>
2020-10-30 22:38:23 +00:00
{
use std::str::FromStr;
use InternalResponse::*;
info! ("Client requested {}", uri);
2020-10-30 22:38:23 +00:00
let uri = http::Uri::from_str (uri).map_err (FileServerError::InvalidUri)?;
let send_body = match &method {
Method::Get => true,
Method::Head => false,
m => {
debug! ("Unsupported method {:?}", m);
2020-11-29 19:47:40 +00:00
return Ok (MethodNotAllowed);
}
};
2020-10-30 22:38:23 +00:00
if uri.path () == "/favicon.ico" {
2020-11-29 19:47:40 +00:00
return Ok (Favicon);
}
let path = match prefix_match ("/files", uri.path ()) {
Some (x) => x,
2020-11-29 19:47:40 +00:00
None => return Ok (Root),
};
2020-10-30 22:38:23 +00:00
if path == "" {
2020-11-29 19:47:40 +00:00
return Ok (Redirect ("files/".to_string ()));
}
// TODO: There is totally a dir traversal attack in here somewhere
let encoded_path = &path [1..];
2020-11-29 19:47:40 +00:00
let path_s = percent_decode (encoded_path.as_bytes ()).decode_utf8 ().map_err (FileServerError::PathNotUtf8)?;
let path = Path::new (&*path_s);
2020-10-30 22:38:23 +00:00
let full_path = root.join (path);
2020-10-30 22:38:23 +00:00
debug! ("full_path = {:?}", full_path);
if let Some (hidden_path) = hidden_path {
if full_path == hidden_path {
2020-11-29 19:47:40 +00:00
return Ok (Forbidden);
}
}
if let Ok (dir) = read_dir (&full_path).await {
internal_serve_dir (
&path_s,
path,
dir,
full_path,
&uri
)
2020-10-30 22:38:23 +00:00
}
else if let Ok (file) = File::open (&full_path).await {
internal_serve_file (
file,
&uri,
send_body,
headers
).await
2020-10-30 22:38:23 +00:00
}
else {
Ok (NotFound)
}
}
#[instrument (level = "debug", skip (handlebars, headers))]
pub async fn serve_all (
handlebars: &Handlebars <'static>,
server_info: &ServerInfo,
root: &Path,
method: Method,
uri: &str,
headers: &HashMap <String, Vec <u8>>,
hidden_path: Option <&Path>
)
-> Result <Response, FileServerError>
{
use InternalResponse::*;
fn serve_error <S: Into <Vec <u8>>> (
status_code: StatusCode,
msg: S
)
-> Response
{
let mut resp = Response::default ();
resp.status_code (status_code);
resp.body_bytes (msg.into ());
resp
}
2020-11-29 19:47:40 +00:00
Ok (match internal_serve_all (root, method, uri, headers, hidden_path).await? {
Favicon => serve_error (StatusCode::NotFound, ""),
Forbidden => serve_error (StatusCode::Forbidden, "403 Forbidden"),
InvalidQuery => serve_error (StatusCode::BadRequest, "Query is invalid for this object"),
MethodNotAllowed => serve_error (StatusCode::MethodNotAllowed, "Unsupported method"),
NotFound => serve_error (StatusCode::NotFound, "404 Not Found"),
RangeNotSatisfiable (file_len) => {
let mut resp = Response::default ();
resp.status_code (StatusCode::RangeNotSatisfiable)
.header ("content-range".to_string (), format! ("bytes */{}", file_len).into_bytes ());
resp
},
Redirect (location) => {
let mut resp = Response::default ();
resp.status_code (StatusCode::TemporaryRedirect);
resp.header ("location".to_string (), location.into_bytes ());
resp.body_bytes (b"Redirecting...".to_vec ());
resp
},
Root => serve_root (handlebars, server_info).await?,
ServeDir (ServeDirParams {
path,
dir,
2020-11-29 19:47:40 +00:00
}) => serve_dir (handlebars, server_info, path.to_string_lossy (), dir.into_inner ()).await?,
ServeFile (ServeFileParams {
file,
send_body,
range,
2020-11-29 22:31:54 +00:00
}) => serve_file (file.into_inner (), send_body, range).await?,
MarkdownErr (e) => {
use markdown::Error::*;
let code = match &e {
TooBig => StatusCode::InternalServerError,
//NotMarkdown => serve_error (StatusCode::BadRequest, "File is not Markdown"),
NotUtf8 => StatusCode::BadRequest,
};
serve_error (code, e.to_string ())
},
MarkdownPreview (s) => serve_html (s),
})
2020-10-30 22:38:23 +00:00
}
pub fn load_templates (
asset_root: &Path
)
-> Result <Handlebars <'static>, handlebars::TemplateFileError>
{
2020-10-31 20:46:38 +00:00
let mut handlebars = Handlebars::new ();
handlebars.set_strict_mode (true);
let asset_root = asset_root.join ("handlebars/server");
2020-11-29 19:05:28 +00:00
for (k, v) in &[
2020-10-31 20:46:38 +00:00
("file_server_dir", "file_server_dir.html"),
("file_server_root", "file_server_root.html"),
2020-11-29 19:05:28 +00:00
] {
handlebars.register_template_file (k, asset_root.join (v))?;
}
Ok (handlebars)
}
/// Formats a byte count for humans, e.g. `"1023 B"`, `"2 KiB"`, `"1 MiB"`.
///
/// Counts below 1 KiB are shown exactly. Larger counts are rounded to the
/// nearest whole KiB, MiB or GiB (halves round up), using the smallest unit
/// in which the rounded value stays below 1024. GiB is the largest unit.
/// Works for every `u64`, including values close to `u64::MAX`.
fn pretty_print_bytes (b: u64) -> String {
    const KIB: u64 = 1024;
    const MIB: u64 = 1024 * KIB;
    const GIB: u64 = 1024 * MIB;

    // Adding half a unit before dividing rounds to nearest. The additions
    // saturate so that huge inputs can't overflow; a saturated sum is
    // always past the KiB and MiB thresholds, so it falls through to GiB.
    if b < KIB {
        format! ("{} B", b)
    }
    else if b.saturating_add (KIB / 2) < MIB {
        format! ("{} KiB", (b + KIB / 2) / KIB)
    }
    else if b.saturating_add (MIB / 2) < GIB {
        format! ("{} MiB", (b + MIB / 2) / MIB)
    }
    else {
        format! ("{} GiB", b.saturating_add (GIB / 2) / GIB)
    }
}
#[cfg (test)]
mod tests;