File: urlparse.ml

package info (click to toggle)
zeroinstall-injector 2.18-2.2
  • links: PTS, VCS
  • area: main
  • in suites: forky, sid
  • size: 3,500 kB
  • sloc: ml: 26,524; xml: 2,700; ansic: 319; sh: 236; makefile: 133; python: 105
file content (65 lines) | stat: -rw-r--r-- 2,182 bytes parent folder | download | duplicates (5)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
(* Copyright (C) 2013, Thomas Leonard
 * See the README file for details, or visit http://0install.net.
 *)

let rec norm_url_path base rel =
  match base, rel with
  | base, [] -> base
  | base, "" :: rel -> norm_url_path base rel
  | base, "." :: rel -> norm_url_path base rel
  | _ :: base, ".." :: rel -> norm_url_path base rel
  | base, next :: rel -> norm_url_path (next :: base) rel

let re_url = Str.regexp "\\([a-zA-Z]+://[^/]*\\)\\(/.*\\)?"

let split_path url =
  if Str.string_match re_url url 0 then (
    let netloc = Str.matched_group 1 url in
    let path =
      try Str.matched_group 2 url
      with Not_found -> "/" in
    (netloc, path)
  ) else (
    Safe_exn.failf "Invalid base URL '%s'" url
  )

(* foo?bar -> ("foo", "?bar") *)
let split_query path =
  try
    let i = String.index path '?' in
    (String.sub path 0 i, XString.tail path i)
  with Not_found -> (path, "")

let join_url base rel =
  if List.exists (XString.starts_with rel) ["http://"; "https://"; "ftp://"] then (
    (* rel is absolute *)
    rel     
  ) else if XString.starts_with rel "//" then (
    (* https://example.com + //dl.example.com/foo -> https://dl.example.com/foo *)
    let i = String.index base ':' in
    String.sub base 0 (i + 1) ^ rel
  ) else (
    let base_netloc, base_path = split_path base in
    if XString.starts_with rel "/" then (
      (* http://example.com/* + /foo -> http://example.com/foo *)
      base_netloc ^ rel
    ) else (
      (* Split off query strings (?...) *)
      let base_path, _base_query = split_query base_path in
      let rel_path, rel_query = split_query rel in

      (* Base dir/path.xml -> dir *)
      let last_base_slash = String.rindex base_path '/' in
      let base_path =
        if last_base_slash < 2 then ""
        else String.sub base_path 1 (last_base_slash - 1) in

      (* Join paths *)
      let base_parts = Str.split_delim XString.re_slash base_path in 
      let rel_parts = Str.split_delim XString.re_slash rel_path in 
      let norm_path = rel_parts |> norm_url_path (List.rev base_parts) in

      (* Reattach query *)
      base_netloc ^ "/" ^ String.concat "/" (List.rev norm_path) ^ rel_query
    )
  )