1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
#![recursion_limit = "100"]
#[macro_use]
extern crate lazy_static;
extern crate regex;
pub mod dataset;
pub mod parser;
pub mod woothee;
use parser::{Parser, WootheeResult};
/// Reports whether the user-agent string `agent` is recognised as a crawler.
///
/// An empty string and the single-character string `"-"` are answered with
/// `false` immediately, without constructing a parser.
/// (Presumably `"-"` is the placeholder some access logs write for a missing
/// user agent; confirm against callers.)
///
/// Every other input is handed to [`Parser::try_crawler`] and that call's
/// boolean result is returned unchanged.
pub fn is_crawler(agent: &str) -> bool {
    match agent {
        "" | "-" => false,
        _ => {
            let detector = Parser::new();
            // `try_crawler` requires a result to write into; only its boolean
            // return value is used here and the scratch value is dropped.
            let mut scratch = WootheeResult::new();
            detector.try_crawler(agent, &mut scratch)
        }
    }
}
#[cfg(test)]
mod tests {
    use super::{is_crawler, Parser, WootheeResult};

    /// Parses `agent` with a temporary `Parser` and returns the result.
    ///
    /// The parser is dropped before this function returns, so the returned
    /// `WootheeResult` outlives the parser that produced it.
    /// Panics with "fail parse()" if `parse` does not yield a result.
    fn get_woothee_result(agent: &str) -> WootheeResult {
        Parser::new().parse(agent).expect("fail parse()")
    }

    /// A result obtained through `get_woothee_result` stays usable after the
    /// parser that created it is gone.
    #[test]
    fn test_parser_lifetime() {
        let agent = "Mozilla/5.0 (Macintosh; Intel Mac OS X 10.7; rv:21.0) Gecko/20100101 Firefox/21.0";
        let result = get_woothee_result(agent);
        assert_eq!(result.name, "Firefox");
        assert_eq!(result.version, "21.0");
    }

    /// One browser agent and one crawler agent, as a basic sanity check.
    #[test]
    fn test_is_crawler_smoke() {
        assert!(!is_crawler(
            "Mozilla/4.0 (compatible; MSIE 8.0; Windows NT 6.1; Trident/4.0)"
        ));
        assert!(is_crawler(
            "Mozilla/5.0 (compatible; Yahoo! Slurp; \
             http://help.yahoo.com/help/us/ysearch/slurp)"
        ));
    }

    /// Covers the early-return guard in `is_crawler`: an empty agent and the
    /// "-" agent must both be reported as non-crawlers.
    #[test]
    fn test_is_crawler_placeholder_agents() {
        assert!(!is_crawler(""));
        assert!(!is_crawler("-"));
    }
}