1
0
mirror of https://github.com/actix/actix-extras.git synced 2024-11-28 09:42:40 +01:00
actix-extras/src/recognizer.rs

310 lines
9.2 KiB
Rust
Raw Normal View History

2017-10-17 04:21:24 +02:00
use std::rc::Rc;
use std::collections::HashMap;
use regex::{Regex, RegexSet, Captures};
#[doc(hidden)]
pub struct RouteRecognizer<T> {
prefix: usize,
patterns: RegexSet,
routes: Vec<(Pattern, T)>,
}
2017-10-24 04:28:23 +02:00
impl<T> Default for RouteRecognizer<T> {
fn default() -> Self {
RouteRecognizer {
prefix: 0,
patterns: RegexSet::new([""].iter()).unwrap(),
routes: Vec::new(),
}
}
}
2017-10-17 04:21:24 +02:00
impl<T> RouteRecognizer<T> {
2017-10-24 04:28:23 +02:00
2017-11-27 02:30:35 +01:00
pub fn new<P: Into<String>, U>(prefix: P, routes: U) -> Self
where U: IntoIterator<Item=(String, T)>
{
2017-10-17 04:21:24 +02:00
let mut paths = Vec::new();
let mut handlers = Vec::new();
for item in routes {
let pat = parse(&item.0);
handlers.push((Pattern::new(&pat), item.1));
paths.push(pat);
};
let regset = RegexSet::new(&paths);
RouteRecognizer {
2017-11-27 02:30:35 +01:00
prefix: prefix.into().len() - 1,
2017-10-17 04:21:24 +02:00
patterns: regset.unwrap(),
routes: handlers,
}
}
2017-10-24 04:28:23 +02:00
pub fn set_routes(&mut self, routes: Vec<(&str, T)>) {
let mut paths = Vec::new();
let mut handlers = Vec::new();
for item in routes {
let pat = parse(item.0);
handlers.push((Pattern::new(&pat), item.1));
paths.push(pat);
};
self.patterns = RegexSet::new(&paths).unwrap();
self.routes = handlers;
}
2017-11-27 02:30:35 +01:00
pub fn set_prefix<P: Into<String>>(&mut self, prefix: P) {
let p = prefix.into();
2017-10-28 04:26:53 +02:00
if p.ends_with('/') {
self.prefix = p.len() - 1;
} else {
self.prefix = p.len();
}
2017-10-24 04:28:23 +02:00
}
2017-10-17 04:21:24 +02:00
pub fn recognize(&self, path: &str) -> Option<(Option<Params>, &T)> {
2017-10-28 04:26:53 +02:00
let p = &path[self.prefix..];
if p.is_empty() {
if let Some(idx) = self.patterns.matches("/").into_iter().next() {
let (ref pattern, ref route) = self.routes[idx];
return Some((pattern.match_info(&path[self.prefix..]), route))
}
} else if let Some(idx) = self.patterns.matches(p).into_iter().next() {
2017-10-17 04:21:24 +02:00
let (ref pattern, ref route) = self.routes[idx];
2017-10-28 04:26:53 +02:00
return Some((pattern.match_info(&path[self.prefix..]), route))
2017-10-17 04:21:24 +02:00
}
2017-10-28 04:26:53 +02:00
None
2017-10-17 04:21:24 +02:00
}
}
struct Pattern {
re: Regex,
names: Rc<HashMap<String, usize>>,
}
impl Pattern {
fn new(pattern: &str) -> Self {
let re = Regex::new(pattern).unwrap();
let names = re.capture_names()
.enumerate()
.filter_map(|(i, name)| name.map(|name| (name.to_owned(), i)))
.collect();
Pattern {
re,
names: Rc::new(names),
}
}
fn match_info(&self, text: &str) -> Option<Params> {
let captures = match self.re.captures(text) {
Some(captures) => captures,
None => return None,
};
2017-11-27 02:30:35 +01:00
Some(Params::new(Rc::clone(&self.names), text, &captures))
2017-10-17 04:21:24 +02:00
}
}
pub(crate) fn check_pattern(path: &str) {
if let Err(err) = Regex::new(&parse(path)) {
panic!("Wrong path pattern: \"{}\" {}", path, err);
}
}
fn parse(pattern: &str) -> String {
const DEFAULT_PATTERN: &str = "[^/]+";
2017-10-17 04:21:24 +02:00
2017-12-01 00:48:09 +01:00
let mut hard_stop = false;
2017-10-17 04:21:24 +02:00
let mut re = String::from("^/");
let mut in_param = false;
let mut in_param_pattern = false;
let mut param_name = String::new();
let mut param_pattern = String::from(DEFAULT_PATTERN);
for (index, ch) in pattern.chars().enumerate() {
// All routes must have a leading slash so its optional to have one
if index == 0 && ch == '/' {
continue;
}
2017-12-01 00:48:09 +01:00
if hard_stop {
2017-12-01 04:01:25 +01:00
panic!("Tail '*' section has to be last lection of pattern");
2017-12-01 00:48:09 +01:00
}
2017-10-17 04:21:24 +02:00
if in_param {
// In parameter segment: `{....}`
if ch == '}' {
2017-12-01 00:48:09 +01:00
if param_pattern == "*" {
hard_stop = true;
re.push_str(
&format!(r"(?P<{}>[%/[:word:][:punct:][:space:]]+)", &param_name));
} else {
re.push_str(&format!(r"(?P<{}>{})", &param_name, &param_pattern));
}
2017-10-17 04:21:24 +02:00
param_name.clear();
param_pattern = String::from(DEFAULT_PATTERN);
in_param_pattern = false;
in_param = false;
} else if ch == ':' {
// The parameter name has been determined; custom pattern land
in_param_pattern = true;
param_pattern.clear();
} else if in_param_pattern {
// Ignore leading whitespace for pattern
if !(ch == ' ' && param_pattern.is_empty()) {
param_pattern.push(ch);
}
} else {
param_name.push(ch);
}
} else if ch == '{' {
in_param = true;
} else {
re.push(ch);
}
}
re.push('$');
re
}
2017-10-17 05:13:47 +02:00
/// Route match information
///
/// If resource path contains variable patterns, `Params` stores this variables.
2017-10-17 04:21:24 +02:00
#[derive(Debug)]
pub struct Params {
text: String,
matches: Vec<Option<(usize, usize)>>,
names: Rc<HashMap<String, usize>>,
}
impl Params {
2017-10-19 08:43:50 +02:00
pub(crate) fn new(names: Rc<HashMap<String, usize>>,
text: &str,
2017-11-27 02:30:35 +01:00
captures: &Captures) -> Self
2017-10-17 04:21:24 +02:00
{
Params {
names,
text: text.into(),
matches: captures
.iter()
.map(|capture| capture.map(|m| (m.start(), m.end())))
.collect(),
}
}
pub(crate) fn empty() -> Self
{
Params {
text: String::new(),
names: Rc::new(HashMap::new()),
matches: Vec::new(),
}
}
2017-10-19 08:43:50 +02:00
pub fn is_empty(&self) -> bool {
self.names.is_empty()
}
2017-10-17 04:21:24 +02:00
fn by_idx(&self, index: usize) -> Option<&str> {
self.matches
.get(index + 1)
.and_then(|m| m.map(|(start, end)| &self.text[start..end]))
}
2017-10-17 05:13:47 +02:00
/// Get matched parameter by name
2017-10-17 04:21:24 +02:00
pub fn get(&self, key: &str) -> Option<&str> {
self.names.get(key).and_then(|&i| self.by_idx(i - 1))
}
}
2017-12-01 00:48:09 +01:00
#[cfg(test)]
mod tests {
use regex::Regex;
use super::*;
fn assert_parse(pattern: &str, expected_re: &str) -> Regex {
let re_str = parse(pattern);
assert_eq!(&*re_str, expected_re);
Regex::new(&re_str).unwrap()
}
#[test]
fn test_parse_static() {
let re = assert_parse("/", r"^/$");
assert!(re.is_match("/"));
assert!(!re.is_match("/a"));
let re = assert_parse("/name", r"^/name$");
assert!(re.is_match("/name"));
assert!(!re.is_match("/name1"));
assert!(!re.is_match("/name/"));
assert!(!re.is_match("/name~"));
let re = assert_parse("/name/", r"^/name/$");
assert!(re.is_match("/name/"));
assert!(!re.is_match("/name"));
assert!(!re.is_match("/name/gs"));
let re = assert_parse("/user/profile", r"^/user/profile$");
assert!(re.is_match("/user/profile"));
assert!(!re.is_match("/user/profile/profile"));
}
#[test]
fn test_parse_param() {
let re = assert_parse("/user/{id}", r"^/user/(?P<id>[^/]+)$");
assert!(re.is_match("/user/profile"));
assert!(re.is_match("/user/2345"));
assert!(!re.is_match("/user/2345/"));
assert!(!re.is_match("/user/2345/sdg"));
let captures = re.captures("/user/profile").unwrap();
assert_eq!(captures.get(1).unwrap().as_str(), "profile");
assert_eq!(captures.name("id").unwrap().as_str(), "profile");
let captures = re.captures("/user/1245125").unwrap();
assert_eq!(captures.get(1).unwrap().as_str(), "1245125");
assert_eq!(captures.name("id").unwrap().as_str(), "1245125");
let re = assert_parse(
"/v{version}/resource/{id}",
r"^/v(?P<version>[^/]+)/resource/(?P<id>[^/]+)$",
);
assert!(re.is_match("/v1/resource/320120"));
assert!(!re.is_match("/v/resource/1"));
assert!(!re.is_match("/resource"));
let captures = re.captures("/v151/resource/adahg32").unwrap();
assert_eq!(captures.get(1).unwrap().as_str(), "151");
assert_eq!(captures.name("version").unwrap().as_str(), "151");
assert_eq!(captures.name("id").unwrap().as_str(), "adahg32");
}
#[test]
fn test_tail_param() {
let re = assert_parse("/user/{tail:*}",
r"^/user/(?P<tail>[%/[:word:][:punct:][:space:]]+)$");
assert!(re.is_match("/user/profile"));
assert!(re.is_match("/user/2345"));
assert!(re.is_match("/user/2345/"));
assert!(re.is_match("/user/2345/sdg"));
assert!(re.is_match("/user/2345/sd-_g/"));
assert!(re.is_match("/user/2345/sdg/asddsasd/index.html"));
let re = assert_parse("/user/v{tail:*}",
r"^/user/v(?P<tail>[%/[:word:][:punct:][:space:]]+)$");
assert!(!re.is_match("/user/2345/"));
assert!(re.is_match("/user/vprofile"));
assert!(re.is_match("/user/v_2345"));
assert!(re.is_match("/user/v2345/sdg"));
assert!(re.is_match("/user/v2345/sd-_g/test.html"));
assert!(re.is_match("/user/v/sdg/asddsasd/index.html"));
}
}