File: parser.ml

package info (click to toggle)
yojson 2.2.2-1
  • links: PTS, VCS
  • area: main
  • in suites: forky, sid, trixie
  • size: 2,216 kB
  • sloc: ml: 3,890; makefile: 28
file content (105 lines) | stat: -rw-r--r-- 3,742 bytes parent folder | download | duplicates (2)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
open Let_syntax.Result

let parser_error pos error =
  let location = Errors.string_of_position pos in
  let msg = Printf.sprintf "%s: %s" location error in
  Error msg

let rec parse_list acc = function
  | [] -> Error "Unexpected end of input"
  | [ (Lexer.EOF, pos) ] -> parser_error pos "Unexpected end of input"
  | (Lexer.CLOSE_BRACKET, _) :: xs -> Ok (acc, xs)
  | xs -> (
      let* v, xs = parse xs in
      match xs with
      | [] -> Error "Unexpected end of input"
      | [ (Lexer.EOF, pos) ] -> parser_error pos "Unexpected end of input"
      | (Lexer.CLOSE_BRACKET, _) :: xs | (COMMA, _) :: (CLOSE_BRACKET, _) :: xs
        ->
          Ok (v :: acc, xs)
      | (COMMA, _) :: xs -> parse_list (v :: acc) xs
      | (x, pos) :: _ ->
          let s =
            Format.asprintf "Unexpected list token: %a" Lexer.pp_token x
          in
          parser_error pos s)

and parse_assoc acc = function
  | [] -> Error "Unexpected end of input"
  | [ (Lexer.EOF, pos) ] -> parser_error pos "Unexpected end of input"
  | (CLOSE_BRACE, _) :: xs -> Ok (acc, xs)
  | (STRING k, _) :: xs | (IDENTIFIER_NAME k, _) :: xs -> (
      match xs with
      | [] -> Error "Unexpected end of input"
      | [ (Lexer.EOF, pos) ] -> parser_error pos "Unexpected end of input"
      | (Lexer.COLON, _) :: xs -> (
          let* v, xs = parse xs in
          let item = (k, v) in
          match xs with
          | [] -> Error "Unexpected end of input"
          | [ (Lexer.EOF, pos) ] -> parser_error pos "Unexpected end of input"
          | (CLOSE_BRACE, _) :: xs | (COMMA, _) :: (CLOSE_BRACE, _) :: xs ->
              Ok (item :: acc, xs)
          | (COMMA, _) :: xs -> parse_assoc (item :: acc) xs
          | (x, pos) :: _ ->
              let s =
                Format.asprintf "Unexpected assoc list token: %a" Lexer.pp_token
                  x
              in
              parser_error pos s)
      | (x, pos) :: _ ->
          let s =
            Format.asprintf "Expected %a but found %a" Lexer.pp_token
              Lexer.COLON Lexer.pp_token x
          in
          parser_error pos s)
  | (x, pos) :: _ ->
      let s =
        Format.asprintf "Expected string or identifier but found %a"
          Lexer.pp_token x
      in
      parser_error pos s

and parse = function
  | [] -> Error "Unexpected end of input"
  | [ (Lexer.EOF, pos) ] -> parser_error pos "Unexpected end of input"
  | (token, pos) :: xs -> (
      match token with
      | TRUE -> Ok (Ast.Bool true, xs)
      | FALSE -> Ok (Bool false, xs)
      | NULL -> Ok (Null, xs)
      | INT v -> Ok (IntLit v, xs)
      | FLOAT v -> Ok (FloatLit v, xs)
      | INT_OR_FLOAT v -> Ok (FloatLit v, xs)
      | STRING s -> Ok (StringLit s, xs)
      | OPEN_BRACKET ->
          let+ l, xs = parse_list [] xs in
          (Ast.List (List.rev l), xs)
      | OPEN_BRACE ->
          let+ a, xs = parse_assoc [] xs in
          (Ast.Assoc (List.rev a), xs)
      | x ->
          let s = Format.asprintf "Unexpected token: %a" Lexer.pp_token x in
          parser_error pos s)

let parse_from_lexbuf ?(fname = "") ?(lnum = 1) lexbuffer =
  Sedlexing.set_filename lexbuffer fname;
  let pos =
    { Lexing.pos_fname = fname; pos_lnum = lnum; pos_bol = 0; pos_cnum = 0 }
  in
  Sedlexing.set_position lexbuffer pos;
  let* tokens = Lexer.lex [] lexbuffer in
  let+ ast, _unparsed = parse tokens in
  ast

let parse_from_string ?fname ?lnum input =
  parse_from_lexbuf (Sedlexing.Utf8.from_string input) ?fname ?lnum

let parse_from_channel ?fname ?lnum ic =
  parse_from_lexbuf (Sedlexing.Utf8.from_channel ic) ?fname ?lnum

let parse_from_file ?fname ?lnum filename =
  let ic = open_in filename in
  let out = parse_from_channel ?fname ?lnum ic in
  close_in ic;
  out