@@ -35,7 +35,7 @@ vignette via `vignette("adaR")`.
3535 webtracking data
3636- [domainator](https://github.com/schochastics/domainator): classify
3737 domains
38- - [adaR](https://github.com/schochastics/adaR): parse urls
38+ - [adaR](https://github.com/gesistsa/adaR): parse urls
3939
4040## Installation
4141
6161``` r
6262library(adaR )
6363ada_url_parse(" https://user_1:password_1@example.org:8080/dir/../api?q=1#frag" )
64- # > href
65- # > 1 https://user_1:password_1@example.org:8080/api?q=1#frag
66- # > protocol username password host
67- # > 1 https: user_1 password_1 example.org:8080
68- # > hostname port pathname search hash
69- # > 1 example.org 8080 /api ?q=1 #frag
64+ # > href protocol username
65+ # > 1 https://user_1:password_1@example.org:8080/api?q=1#frag https: user_1
66+ # > password host hostname port pathname search hash
67+ # > 1 password_1 example.org:8080 example.org 8080 /api ?q=1 #frag
7068```
7169
7270``` cpp
@@ -100,10 +98,8 @@ ada_url_parse("https://www.google.com/maps/place/Pennsylvania+Station/@40.751984
10098 5!3m4!1s0x89c259ae15b2adcb:0x7955420634fd7eba!8m2!3d40.750568!4d-73.993519" )
10199# > href
102100# > 1 https://www.google.com/maps/place/Pennsylvania+Station/@40.7519848,-74.0015045,14.7z/data=!4m 5!3m4!1s0x89c259ae15b2adcb:0x7955420634fd7eba!8m2!3d40.750568!4d-73.993519
103- # > protocol username password host
104- # > 1 https: www.google.com
105- # > hostname port
106- # > 1 www.google.com
101+ # > protocol username password host hostname port
102+ # > 1 https: www.google.com www.google.com
107103# > pathname
108104# > 1 /maps/place/Pennsylvania+Station/@40.7519848,-74.0015045,14.7z/data=!4m 5!3m4!1s0x89c259ae15b2adcb:0x7955420634fd7eba!8m2!3d40.750568!4d-73.993519
109105# > search hash
@@ -123,10 +119,10 @@ bench::mark(
123119 iterations = 1 , check = FALSE
124120)
125121# > # A tibble: 2 × 6
126- # > expression min median `itr/sec` mem_alloc `gc/sec`
127- # > <bch:expr> <bch:tm> <bch:t > <dbl> <bch:byt> <dbl>
128- # > 1 ada 458µs 458µs 2183 . 2.49KB 0
129- # > 2 urltools 421µs 421µs 2374 . 2.49KB 0
122+ # > expression min median `itr/sec` mem_alloc `gc/sec`
123+ # > <bch:expr> <bch:tm> <bch:tm > <dbl> <bch:byt> <dbl>
124+ # > 1 ada 227µs 227µs 4405 . 2.49KB 0
125+ # > 2 urltools 229µs 229µs 4373 . 2.49KB 0
130126```
131127
132128For further benchmark results, see `benchmark.md` in `data_raw`.
@@ -151,8 +147,7 @@ urls <- c(
151147 " https://thisisnotpart.butthisispartoftheps.kawasaki.jp"
152148)
153149public_suffix(urls )
154- # > [1] "co.uk"
155- # > [2] "gov.uk"
150+ # > [1] "co.uk" "gov.uk"
156151# > [3] "butthisispartoftheps.kawasaki.jp"
157152```
158153
0 commit comments