Set of test cases for the Woothee project. Project Woothee is a set of multi-language user-agent string parsers.
Project Woothee is a set of multi-language user-agent string parsers., (*1)
You can try it on the demo site: http://woothee.github.io/, (*2)
We need exactly the same logic across two or more programming languages, for use in various frameworks, middleware, and environments., (*3)
The most important data in this project is a single set of return values and a set of test cases, which are used to check that the implementations in the different languages produce equal results., (*4)
Implementations:, (*5)
Version numbers are used as follows: * vX.Y.Z * X and Y are the major/minor numbers that control the specs of the dataset/testsets * Z is the patch number for release control of each language implementation * Z is also used for bug-fix control of the testsets (the versions of each language implementation should be bumped up too), (*6)
in Java: (use java/woothee.jar), (*7)
// import is.tagomor.woothee.Classifier; // import is.tagomor.woothee.DataSet; Map r = Classifier.parse("user agent string"); r.get("name") // => name of browser (or string like name of user-agent) r.get("category") // => "pc", "smartphone", "mobilephone", "appliance", "crawler", "misc", "unknown" r.get("os") // => os from user-agent, or carrier name of mobile phones r.get("version"); // => version of browser, or terminal type name of mobile phones r.get("os_version"); // => "NT 6.3" (for Windows), "10.8.3" (for OSX), "8.0.1" (for iOS), ....
in Hive: (copy woothee.jar into your CLASSPATH, and create function), (*8)
-- add jar to classpath add jar woothee.jar; -- create function CREATE TEMPORARY FUNCTION parse_agent as 'is.tagomor.woothee.hive.ParseAgent'; -- count visits of bots SELECT parsed_agent['name'] AS botname, COUNT(*) AS cnt FROM ( SELECT parse_agent(user_agent) AS parsed_agent FROM table_name WHERE date='today' ) x WHERE parsed_agent['category'] = 'crawler' GROUP BY parsed_agent['name'] ORDER BY cnt DESC LIMIT 1000;
in Perl: (cpanm Woothee), (*9)
use Woothee; Woothee::parse("Mozilla/4.0 (compatible; MSIE 8.0; Windows NT 6.1; Trident/4.0)"); # => {'name'=>"Internet Explorer", 'category'=>"pc", 'os'=>"Windows 7", 'version'=>"8.0", 'vendor'=>"Microsoft", 'os_version'=>"NT 6.1"}
in Ruby: (gem install woothee), (*10)
require 'woothee' Woothee.parse("Mozilla/4.0 (compatible; MSIE 8.0; Windows NT 6.1; Trident/4.0)") # => {:name=>"Internet Explorer", :category=>:pc, :os=>"Windows 7", :version=>"8.0", :vendor=>"Microsoft", :os_version=>"NT 6.1"}
in Python:, (*11)
import woothee woothee.parse("Mozilla/4.0 (compatible; MSIE 8.0; Windows NT 6.1; Trident/4.0)") # => {'name': 'Internet Explorer', 'category': 'pc', 'os': 'Windows 7', 'version': '8.0', 'vendor': 'Microsoft'}
in JavaScript (HTML, copy from release/woothee.js), (*12)
<script src="./your/own/path/woothee.js"></script> <script> woothee.parse('Mozilla/4.0 (compatible; MSIE 8.0; Windows NT 6.1; Trident/4.0)') // => {name: 'Internet Explorer', category: 'pc', os: 'Windows 7', version: '8.0', vendor: 'Microsoft', os_version: 'NT 6.1'} </script>
in Node.js (npm install woothee), (*13)
var woothee = require('woothee'); woothee.parse('Mozilla/4.0 (compatible; MSIE 8.0; Windows NT 6.1; Trident/4.0)') // => {name: 'Internet Explorer', category: 'pc', os: 'Windows 7', version: '8.0', vendor: 'Microsoft', os_version: 'NT 6.1'}
in PHP (composer require woothee/woothee:*), (*14)
<?php include __DIR__ . '/vendor/autoload.php'; $classifier = new \Woothee\Classifier; $classifier->parse('Mozilla/4.0 (compatible; MSIE 8.0; Windows NT 6.1; Trident/4.0)'); // => ['name' => 'Internet Explorer', 'category' => 'pc', 'os' => 'Windows 7', 'version' => '8.0', 'vendor' => 'Microsoft']
in Rust:, (*15)
extern crate woothee; use woothee::parser::Parser; fn main() { let parser = Parser::new(); let result = parser.parse("Mozilla/4.0 (compatible; MSIE 8.0; Windows NT 6.1; Trident/4.0)"); println!("{:?}", result); } // => Some(WootheeResult { name: "Internet Explorer", category: "pc", os: "Windows 7", os_version: "NT 6.1", browser_type: "UNKNOWN", version: "8.0", vendor: "Microsoft" })
Copyright 2012- TAGOMORI Satoshi (tagomoris), (*16)
Licensed under the Apache License, Version 2.0 (the "License"); you may not use this file except in compliance with the License. You may obtain a copy of the License at, (*17)
http://www.apache.org/licenses/LICENSE-2.0, (*18)
Unless required by applicable law or agreed to in writing, software distributed under the License is distributed on an "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. See the License for the specific language governing permissions and limitations under the License., (*19)