use crate::error::{Error, ErrorKind};
use std::fmt;
use std::str::{from_utf8, FromStr};
#[derive(Debug, Clone, PartialEq, Eq)]
pub(crate) struct HeaderLine(Vec<u8>);
impl From<String> for HeaderLine {
fn from(s: String) -> Self {
HeaderLine(s.into_bytes())
}
}
impl From<Vec<u8>> for HeaderLine {
fn from(b: Vec<u8>) -> Self {
HeaderLine(b)
}
}
impl HeaderLine {
pub fn into_string_lossy(self) -> String {
String::from_utf8(self.0)
.unwrap_or_else(|e| String::from_utf8_lossy(&e.into_bytes()).to_string())
}
pub fn is_empty(&self) -> bool {
self.0.is_empty()
}
fn as_bytes(&self) -> &[u8] {
&self.0
}
pub fn into_header(self) -> Result<Header, Error> {
let mut index = 0;
for c in self.as_bytes() {
if *c == b':' {
break;
}
if !is_tchar(c) {
return Err(Error::new(
ErrorKind::BadHeader,
Some(format!("Invalid char ({:0x?}) while looking for ':'", *c)),
));
}
index += 1;
}
Ok(Header { line: self, index })
}
}
impl fmt::Display for HeaderLine {
fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result {
write!(f, "{}", String::from_utf8_lossy(&self.0))
}
}
#[derive(Clone, PartialEq, Eq)]
pub(crate) struct Header {
line: HeaderLine,
index: usize,
}
impl fmt::Debug for Header {
fn fmt(&self, f: &mut fmt::Formatter) -> fmt::Result {
write!(f, "{}", self.line)
}
}
impl Header {
pub fn new(name: &str, value: &str) -> Self {
let line = format!("{}: {}", name, value).into();
let index = name.len();
Header { line, index }
}
pub fn name(&self) -> &str {
let bytes = &self.line.as_bytes()[0..self.index];
from_utf8(bytes).expect("Legal chars in header name")
}
pub fn value(&self) -> Option<&str> {
let bytes = &self.line.as_bytes()[self.index + 1..];
from_utf8(bytes)
.map(|s| s.trim())
.ok()
.filter(|s| s.as_bytes().iter().all(is_field_vchar_or_obs_fold))
}
#[allow(unused)]
pub fn value_raw(&self) -> &[u8] {
let mut bytes = &self.line.as_bytes()[self.index + 1..];
if !bytes.is_empty() {
while !bytes.is_empty() && bytes[0].is_ascii_whitespace() {
bytes = &bytes[1..];
}
while !bytes.is_empty() && bytes[bytes.len() - 1].is_ascii_whitespace() {
bytes = &bytes[..(bytes.len() - 1)];
}
}
bytes
}
pub fn is_name(&self, other: &str) -> bool {
self.name().eq_ignore_ascii_case(other)
}
pub(crate) fn validate(&self) -> Result<(), Error> {
let bytes = self.line.as_bytes();
let name_raw = &bytes[0..self.index];
let value_raw = &bytes[self.index + 1..];
if !valid_name(name_raw) || !valid_value(value_raw) {
Err(ErrorKind::BadHeader.msg(format!("invalid header '{}'", self.line)))
} else {
Ok(())
}
}
}
pub(crate) fn get_header<'h>(headers: &'h [Header], name: &str) -> Option<&'h str> {
headers
.iter()
.find(|h| h.is_name(name))
.and_then(|h| h.value())
}
#[allow(unused)]
pub(crate) fn get_header_raw<'h>(headers: &'h [Header], name: &str) -> Option<&'h [u8]> {
headers
.iter()
.find(|h| h.is_name(name))
.map(|h| h.value_raw())
}
pub(crate) fn get_all_headers<'h>(headers: &'h [Header], name: &str) -> Vec<&'h str> {
headers
.iter()
.filter(|h| h.is_name(name))
.filter_map(|h| h.value())
.collect()
}
pub(crate) fn has_header(headers: &[Header], name: &str) -> bool {
get_header(headers, name).is_some()
}
pub(crate) fn add_header(headers: &mut Vec<Header>, header: Header) {
let name = header.name();
if !name.starts_with("x-") && !name.starts_with("X-") {
headers.retain(|h| h.name() != name);
}
headers.push(header);
}
fn valid_name(name: &[u8]) -> bool {
!name.is_empty() && name.iter().all(is_tchar)
}
#[inline]
pub(crate) fn is_tchar(b: &u8) -> bool {
match b {
b'!' | b'#' | b'$' | b'%' | b'&' => true,
b'\'' | b'*' | b'+' | b'-' | b'.' => true,
b'^' | b'_' | b'`' | b'|' | b'~' => true,
b if b.is_ascii_alphanumeric() => true,
_ => false,
}
}
fn valid_value(value: &[u8]) -> bool {
value.iter().all(is_field_vchar_or_obs_fold)
}
#[inline]
fn is_field_vchar_or_obs_fold(b: &u8) -> bool {
match b {
b' ' | b'\t' => true,
0x21..=0x7E => true,
_ => false,
}
}
impl FromStr for Header {
type Err = Error;
fn from_str(s: &str) -> Result<Self, Self::Err> {
let line: HeaderLine = s.to_string().into();
let header = line.into_header()?;
header.validate()?;
Ok(header)
}
}
#[cfg(test)]
mod tests {
use super::*;
#[test]
fn test_valid_name() {
assert!(valid_name(b"example"));
assert!(valid_name(b"Content-Type"));
assert!(valid_name(b"h-123456789"));
assert!(!valid_name(b"Content-Type:"));
assert!(!valid_name(b"Content-Type "));
assert!(!valid_name(b" some-header"));
assert!(!valid_name(b"\"invalid\""));
assert!(!valid_name(b"G\xf6del"));
}
#[test]
fn test_valid_value() {
assert!(valid_value(b"example"));
assert!(valid_value(b"foo bar"));
assert!(valid_value(b" foobar "));
assert!(valid_value(b" foo\tbar "));
assert!(valid_value(b" foo~"));
assert!(valid_value(b" !bar"));
assert!(valid_value(b" "));
assert!(!valid_value(b" \nfoo"));
assert!(!valid_value(b"foo\x7F"));
}
#[test]
fn test_parse_invalid_name() {
let cases = vec![
"Content-Type :",
" Content-Type: foo",
"Content-Type foo",
"\"some-header\": foo",
"Gödel: Escher, Bach",
"Foo: \n",
"Foo: \nbar",
"Foo: \x7F bar",
];
for c in cases {
let result = c.parse::<Header>();
assert!(
matches!(result, Err(ref e) if e.kind() == ErrorKind::BadHeader),
"'{}'.parse(): expected BadHeader, got {:?}",
c,
result
);
}
}
#[test]
#[cfg(feature = "charset")]
fn test_parse_non_utf8_value() {
let (cow, _, _) = encoding_rs::WINDOWS_1252.encode("x-geo-stuff: älvsjö ");
let bytes = cow.to_vec();
let line: HeaderLine = bytes.into();
let header = line.into_header().unwrap();
assert_eq!(header.name(), "x-geo-stuff");
assert_eq!(header.value(), None);
assert_eq!(header.value_raw(), [228, 108, 118, 115, 106, 246]);
}
#[test]
fn empty_value() {
let h = "foo:".parse::<Header>().unwrap();
assert_eq!(h.value(), Some(""));
}
#[test]
fn value_with_whitespace() {
let h = "foo: bar ".parse::<Header>().unwrap();
assert_eq!(h.value(), Some("bar"));
}
#[test]
fn name_and_value() {
let header: Header = "X-Forwarded-For: 127.0.0.1".parse().unwrap();
assert_eq!("X-Forwarded-For", header.name());
assert_eq!(header.value(), Some("127.0.0.1"));
assert!(header.is_name("X-Forwarded-For"));
assert!(header.is_name("x-forwarded-for"));
assert!(header.is_name("X-FORWARDED-FOR"));
}
#[test]
fn test_iso8859_utf8_mixup() {
let b = "header: \0xc2\0xa5".to_string().into_bytes();
let l: HeaderLine = b.into();
let h = l.into_header().unwrap();
assert_eq!(h.value(), None);
}
}