// urlencoding/dec.rs
use std::borrow::Cow;
use std::string::FromUtf8Error;
/// Converts a single ASCII hexadecimal digit into its numeric value.
///
/// Accepts `0-9`, `a-f` and `A-F`; any other byte yields `None`.
#[inline]
pub(crate) fn from_hex_digit(digit: u8) -> Option<u8> {
    let value = match digit {
        b'0'..=b'9' => digit - b'0',
        b'a'..=b'f' => digit - b'a' + 10,
        b'A'..=b'F' => digit - b'A' + 10,
        _ => return None,
    };
    Some(value)
}
/// Decodes a percent-encoded string, interpreting the decoded bytes as UTF-8.
///
/// The result borrows `data` when nothing had to be decoded. If you need a
/// `String`, call `.into_owned()` (not `.to_owned()`).
///
/// An unencoded `+` is kept literally; it is _not_ turned into a space.
///
/// # Errors
///
/// Returns `FromUtf8Error` when the decoded bytes are not valid UTF-8.
pub fn decode(data: &str) -> Result<Cow<str>, FromUtf8Error> {
    let text = match decode_binary(data.as_bytes()) {
        // Bytes were rewritten, so they must be re-validated as UTF-8.
        Cow::Owned(bytes) => Cow::Owned(String::from_utf8(bytes)?),
        // Nothing changed: the input `&str` is returned as-is.
        Cow::Borrowed(_) => Cow::Borrowed(data),
    };
    Ok(text)
}
/// Decodes a percent-encoded byte string as binary data, in any encoding.
///
/// Every `%XX` sequence, where `XX` are two hexadecimal digits (either case),
/// is replaced by the byte with that value. All other bytes are copied
/// unchanged.
///
/// An unencoded `+` is preserved literally, and _not_ changed to a space.
///
/// Malformed escapes are not an error; they are passed through literally:
/// a `%` that is not followed by two hex digits stays a `%`, and decoding
/// resumes with the bytes after it.
///
/// # Returns
///
/// `Cow::Borrowed(data)` when the input contains no `%` at all (no allocation
/// is performed in that case), otherwise `Cow::Owned` with the decoded bytes.
pub fn decode_binary(mut data: &[u8]) -> Cow<[u8]> {
    // Fast path: without any '%' there is nothing to decode, so return the
    // input before allocating an output buffer.
    let first_escape = match data.iter().position(|&c| c == b'%') {
        Some(idx) => idx,
        None => return Cow::Borrowed(data),
    };

    // Decoding never emits more bytes than it consumes, so the input length
    // is an upper bound for the output and the buffer never has to grow.
    let mut decoded: Vec<u8> = Vec::with_capacity(data.len());
    let mut out = NeverRealloc(&mut decoded);

    // Copy the literal prefix found by the scan above; `data` now starts at
    // the first '%'.
    out.extend_from_slice(&data[..first_escape]);
    data = &data[first_escape..];

    loop {
        let mut parts = data.splitn(2, |&c| c == b'%');

        // First the literal run up to the next '%' (possibly empty).
        let literal = parts
            .next()
            .expect("splitn always yields at least one slice");
        out.extend_from_slice(literal);

        // No further '%': everything has been copied.
        let rest = match parts.next() {
            Some(rest) => rest,
            None => break,
        };

        // Then decode one %XX.
        match rest.get(0..2) {
            Some(&[first, second]) => match (from_hex_digit(first), from_hex_digit(second)) {
                (Some(high), Some(low)) => {
                    out.push((high << 4) | low);
                    data = &rest[2..];
                }
                (Some(_), None) => {
                    // Second digit is invalid: keep "%X" literally and
                    // rescan from the offending byte (it may itself be '%').
                    out.extend_from_slice(&[b'%', first]);
                    data = &rest[1..];
                }
                (None, _) => {
                    // First digit is invalid: keep the '%' and rescan from
                    // the byte that followed it.
                    out.push(b'%');
                    data = rest;
                }
            },
            _ => {
                // Fewer than two bytes follow the '%': too short to be an
                // escape, so emit the tail verbatim and stop.
                out.push(b'%');
                out.extend_from_slice(rest);
                break;
            }
        }
    }

    Cow::Owned(decoded)
}
/// Append-only wrapper around a `Vec` that never grows it beyond its current
/// capacity.
///
/// Writes that do not fit into the spare capacity are silently skipped.
/// The capacity is expected to always be sufficient; the checks exist only so
/// that the reallocation code path can be removed from the generated code.
struct NeverRealloc<'a, T>(pub &'a mut Vec<T>);

impl<T> NeverRealloc<'_, T> {
    /// Appends `val` when at least one spare slot is available; otherwise
    /// `val` is dropped and the vector is left untouched.
    #[inline]
    pub fn push(&mut self, val: T) {
        let vec = &mut *self.0;
        if vec.len() == vec.capacity() {
            // Full: pushing would reallocate, so skip the write.
            return;
        }
        vec.push(val);
    }

    /// Appends all of `val` when it fits entirely into the spare capacity;
    /// otherwise nothing is appended.
    #[inline]
    pub fn extend_from_slice(&mut self, val: &[T])
    where
        T: Clone,
    {
        let spare = self.0.capacity() - self.0.len();
        if val.len() <= spare {
            self.0.extend_from_slice(val);
        }
    }
}