http-types/src/mime/mod.rs

273 lines
7.8 KiB
Rust

//! IANA Media Types.
//!
//! [Read more](https://developer.mozilla.org/en-US/docs/Web/HTTP/Basics_of_HTTP/MIME_types).
mod constants;
mod parse;
pub use constants::*;
use std::borrow::Cow;
use std::fmt::{self, Debug, Display};
use std::option;
use std::str::FromStr;
use crate::headers::{HeaderValue, ToHeaderValues};
use infer::Infer;
/// An IANA media type.
///
/// ```
/// use http_types::mime::Mime;
/// use std::str::FromStr;
///
/// let mime = Mime::from_str("text/html;charset=utf-8").unwrap();
/// assert_eq!(mime.essence(), "text/html");
/// assert_eq!(mime.param("charset").unwrap(), "utf-8");
/// ```
// NOTE: we cannot statically initialize Strings with values yet, so we keep dedicated static
// fields for the static strings.
#[derive(Clone, PartialEq, Eq, Debug)]
pub struct Mime {
pub(crate) essence: Cow<'static, str>,
pub(crate) basetype: Cow<'static, str>,
pub(crate) subtype: Cow<'static, str>,
// NOTE(yosh): this is a hack because we can't populate vecs in const yet.
// This enables us to encode media types as utf-8 at compilation.
pub(crate) is_utf8: bool,
pub(crate) params: Vec<(ParamName, ParamValue)>,
}
impl Mime {
/// Sniff the mime type from a byte slice.
pub fn sniff(bytes: &[u8]) -> crate::Result<Self> {
let info = Infer::new();
let mime = match info.get(bytes) {
Some(info) => info.mime_type(),
None => crate::bail!("Could not sniff the mime type"),
};
Mime::from_str(mime)
}
/// Guess the mime type from a file extension
pub fn from_extension(extension: impl AsRef<str>) -> Option<Self> {
match extension.as_ref() {
"7z" => Some(SEVENZIP),
"atom" => Some(ATOM),
"avi" => Some(AVI),
"bin" | "exe" | "dll" | "iso" | "img" => Some(BYTE_STREAM),
"bmp" => Some(BMP),
"css" => Some(CSS),
"html" => Some(HTML),
"ico" => Some(ICO),
"js" | "mjs" | "jsonp" => Some(JAVASCRIPT),
"json" => Some(JSON),
"m4a" => Some(M4A),
"mid" | "midi" | "kar" => Some(MIDI),
"mp3" => Some(MP3),
"mp4" => Some(MP4),
"mpeg" | "mpg" => Some(MPEG),
"ogg" => Some(OGG),
"otf" => Some(OTF),
"rss" => Some(RSS),
"svg" | "svgz" => Some(SVG),
"ttf" => Some(TTF),
"txt" => Some(PLAIN),
"wasm" => Some(WASM),
"webm" => Some(WEBM),
"webp" => Some(WEBP),
"woff" => Some(WOFF),
"woff2" => Some(WOFF2),
"xml" => Some(XML),
"zip" => Some(ZIP),
_ => None,
}
}
/// Access the Mime's `type` value.
///
/// According to the spec this method should be named `type`, but that's a reserved keyword in
/// Rust so hence prefix with `base` instead.
pub fn basetype(&self) -> &str {
&self.basetype
}
/// Access the Mime's `subtype` value.
pub fn subtype(&self) -> &str {
&self.subtype
}
/// Access the Mime's `essence` value.
pub fn essence(&self) -> &str {
&self.essence
}
/// Get a reference to a param.
pub fn param(&self, name: impl Into<ParamName>) -> Option<&ParamValue> {
let name: ParamName = name.into();
if name.as_str() == "charset" && self.is_utf8 {
return Some(&ParamValue(Cow::Borrowed("utf-8")));
}
self.params.iter().find(|(k, _)| k == &name).map(|(_, v)| v)
}
/// Remove a param from the set. Returns the `ParamValue` if it was contained within the set.
pub fn remove_param(&mut self, name: impl Into<ParamName>) -> Option<ParamValue> {
let name: ParamName = name.into();
if name.as_str() == "charset" && self.is_utf8 {
self.is_utf8 = false;
return Some(ParamValue(Cow::Borrowed("utf-8")));
}
self.params
.iter()
.position(|(k, _)| k == &name)
.map(|pos| self.params.remove(pos).1)
}
/// Check if this mime is a subtype of another mime.
///
/// # Examples
///
/// ```
/// // All mime types are subsets of */*
/// use http_types::mime::Mime;
/// use std::str::FromStr;
///
/// assert!(Mime::from_str("text/css").unwrap().subset_eq(&Mime::from_str("*/*").unwrap()));
///
/// // A mime type is subset of itself
/// assert!(Mime::from_str("text/css").unwrap().subset_eq(&Mime::from_str("text/css").unwrap()));
///
/// // A mime type which is otherwise a subset with extra parameters is a subset of a mime type without those parameters
/// assert!(Mime::from_str("text/css;encoding=utf-8").unwrap().subset_eq(&Mime::from_str("text/css").unwrap()));
///
/// // A mime type more general than another mime type is not a subset
/// assert!(!Mime::from_str("*/css;encoding=utf-8").unwrap().subset_eq(&Mime::from_str("text/css").unwrap()));
/// ```
pub fn subset_eq(&self, other: &Mime) -> bool {
if other.basetype() != "*" && self.basetype() != other.basetype() {
return false;
}
if other.subtype() != "*" && self.subtype() != other.subtype() {
return false;
}
for (name, value) in other.params.iter() {
if !self
.param(name.clone())
.map(|v| v == value)
.unwrap_or(false)
{
return false;
}
}
true
}
}
impl Display for Mime {
fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result {
parse::format(self, f)
}
}
// impl Debug for Mime {
// fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result {
// Debug::fmt(&self.essence, f)
// }
// }
impl FromStr for Mime {
type Err = crate::Error;
/// Create a new `Mime`.
///
/// Follows the [WHATWG MIME parsing algorithm](https://mimesniff.spec.whatwg.org/#parsing-a-mime-type).
fn from_str(s: &str) -> Result<Self, Self::Err> {
parse::parse(s)
}
}
impl<'a> From<&'a str> for Mime {
fn from(value: &'a str) -> Self {
Self::from_str(value).unwrap()
}
}
impl ToHeaderValues for Mime {
type Iter = option::IntoIter<HeaderValue>;
fn to_header_values(&self) -> crate::Result<Self::Iter> {
let mime = self.clone();
let header: HeaderValue = mime.into();
// A HeaderValue will always convert into itself.
Ok(header.to_header_values().unwrap())
}
}
/// A parameter name.
#[derive(Debug, Clone, PartialEq, Eq, Hash)]
pub struct ParamName(Cow<'static, str>);
impl ParamName {
/// Get the name as a `&str`
pub fn as_str(&self) -> &str {
&self.0
}
}
impl Display for ParamName {
fn fmt(&self, f: &mut fmt::Formatter) -> fmt::Result {
Display::fmt(&self.0, f)
}
}
impl FromStr for ParamName {
type Err = crate::Error;
/// Create a new `HeaderName`.
///
/// This checks it's valid ASCII, and lowercases it.
fn from_str(s: &str) -> Result<Self, Self::Err> {
crate::ensure!(s.is_ascii(), "String slice should be valid ASCII");
Ok(ParamName(Cow::Owned(s.to_ascii_lowercase())))
}
}
impl<'a> From<&'a str> for ParamName {
fn from(value: &'a str) -> Self {
Self::from_str(value).unwrap()
}
}
/// A parameter value.
#[derive(Debug, Clone, PartialEq, Eq, Hash)]
pub struct ParamValue(Cow<'static, str>);
impl ParamValue {
/// Get the value as a `&str`
pub fn as_str(&self) -> &str {
&self.0
}
}
impl Display for ParamValue {
fn fmt(&self, f: &mut fmt::Formatter) -> fmt::Result {
Display::fmt(&self.0, f)
}
}
impl<'a> PartialEq<&'a str> for ParamValue {
fn eq(&self, other: &&'a str) -> bool {
&self.0 == other
}
}
impl PartialEq<str> for ParamValue {
fn eq(&self, other: &str) -> bool {
self.0 == other
}
}