aboutsummaryrefslogtreecommitdiff
path: root/go/src/reader/reader.go
blob: 55cea591fb25d7beba04037be57cb6edeb9af3e3 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
package reader

import (
    "errors"
    "regexp"
    "strconv"
    //"fmt"
)

import (
    "types"
)

// Reader is the token cursor that the read_* functions in this file consume.
// Callers treat a nil result from either method as "no more tokens".
type Reader interface {
    // peek returns the current token without consuming it.
    peek() *string
    // next returns the current token and moves past it.
    next() *string
}

// TokenReader walks a fixed slice of tokens from front to back.
type TokenReader struct {
    tokens   []string // full token sequence being read
    position int      // index of the token that next/peek will hand out
}

// next hands out a pointer to a copy of the current token and moves the
// cursor forward by one. It returns nil when no tokens remain.
func (tr *TokenReader) next() *string {
    if tr.position < len(tr.tokens) {
        current := tr.tokens[tr.position]
        tr.position++
        return &current
    }
    return nil
}

// peek hands out a pointer to the current token's slot in the underlying
// slice without moving the cursor. It returns nil when no tokens remain.
func (tr *TokenReader) peek() *string {
    if idx := tr.position; idx < len(tr.tokens) {
        return &tr.tokens[idx]
    }
    return nil
}



// tokenPattern matches one token, skipping any leading whitespace and commas.
// Capture group 1 is the token itself: the two-character "~@", a single
// special character, a double-quoted string (backslash escapes allowed), a
// ";" comment running to the end of the line, or a run of ordinary characters.
// It is compiled once at package scope rather than on every tokenize call.
var tokenPattern = regexp.MustCompile(`[\s,]*(~@|[\[\]{}()'~^@]|"(?:\\.|[^\\"])*"|;.*|[^\s\[\]{}('",;)]*)`)

// tokenize splits str into the tokens understood by the reader.
//
// Empty matches and ";" comments are dropped, so the result contains only
// tokens that should be parsed. The returned slice is never nil.
func tokenize(str string) []string {
    matches := tokenPattern.FindAllStringSubmatch(str, -1)
    results := make([]string, 0, len(matches))
    for _, group := range matches {
        token := group[1]
        // Only comment tokens can start with ';': a ';' inside a string
        // literal belongs to a token that starts with '"'.
        if token == "" || token[0] == ';' {
            continue
        }
        results = append(results, token)
    }
    return results
}

// integerPattern recognizes an optionally negative decimal integer token.
// It is compiled once at package scope instead of on every read_atom call.
var integerPattern = regexp.MustCompile(`^-?[0-9]+$`)

// read_atom consumes one token from rdr and converts it to a scalar value.
//
// The result is, in order of precedence:
//   - an int for tokens matching -?[0-9]+,
//   - a string (surrounding quotes stripped, escapes left as written) for
//     tokens that start with a double quote,
//   - nil, true or false for the corresponding literal tokens,
//   - a types.Symbol wrapping the token text otherwise.
//
// An error is returned when rdr is exhausted, when the token is empty or is
// a lone double quote, or when strconv.Atoi rejects an integer token.
func read_atom(rdr Reader) (types.MalType, error) {
    token := rdr.next()
    if token == nil {
        return nil, errors.New("read_atom underflow")
    }
    text := *token

    switch {
    case text == "":
        // Guards the text[0] access below. tokenize never yields an empty
        // token, but another Reader implementation might.
        return nil, errors.New("read_atom: empty token")
    case integerPattern.MatchString(text):
        i, e := strconv.Atoi(text)
        if e != nil {
            return nil, errors.New("number parse error")
        }
        return i, nil
    case text[0] == '"':
        if len(text) < 2 {
            // A lone quote has no closing delimiter to strip.
            return nil, errors.New("expected '\"', got EOF")
        }
        // TODO: unquote newline and quotes
        return text[1 : len(text)-1], nil
    case text == "nil":
        return nil, nil
    case text == "true":
        return true, nil
    case text == "false":
        return false, nil
    default:
        return types.Symbol{text}, nil
    }
}

// read_list reads a delimited sequence of forms from rdr.
//
// The next token must equal start. Forms are then read with read_form until
// a token equal to end is seen, and that closing token is consumed. On
// success the elements are returned wrapped in a types.List.
//
// An error is returned if rdr is exhausted before start or end is found, if
// the first token is not start, or if reading any element fails.
func read_list(rdr Reader, start string, end string) (types.MalType, error) {
    token := rdr.next()
    if token == nil {
        return nil, errors.New("read_list underflow")
    }
    if *token != start {
        return nil, errors.New("expected '" + start + "'")
    }

    ast_list := []types.MalType{}
    for {
        token = rdr.peek()
        if token == nil {
            return nil, errors.New("expected '" + end + "', got EOF")
        }
        if *token == end {
            break
        }
        form, e := read_form(rdr)
        if e != nil {
            return nil, e
        }
        ast_list = append(ast_list, form)
    }
    // Consume the closing delimiter that the loop only peeked at.
    rdr.next()
    return types.List{ast_list}, nil
}

// read_vector reads a "[" ... "]" delimited sequence from rdr via read_list
// and repackages the resulting elements as a types.Vector.
// Any error from read_list is returned unchanged.
func read_vector(rdr Reader) (types.MalType, error) {
    parsed, err := read_list(rdr, "[", "]")
    if err != nil {
        return nil, err
    }
    elements := parsed.(types.List).Val
    return types.Vector{elements}, nil
}

// read_hash_map reads a "{" ... "}" delimited sequence from rdr via read_list
// and builds a map from it, treating the elements as alternating key/value
// pairs.
//
// Keys must be Go strings (as produced by read_atom for quoted tokens).
// An error is returned if read_list fails, if the number of elements is odd,
// or if any key is not a string.
func read_hash_map(rdr Reader) (types.MalType, error) {
    mal_lst, e := read_list(rdr, "{", "}")
    // Check the error before touching mal_lst: on failure read_list returns
    // a nil value, and the type assertion below would panic on it.
    if e != nil {
        return nil, e
    }
    lst := mal_lst.(types.List).Val
    if len(lst)%2 == 1 {
        return nil, errors.New("Odd number of hash map arguments")
    }

    m := make(map[string]types.MalType, len(lst)/2)
    for i := 0; i < len(lst); i += 2 {
        key, ok := lst[i].(string)
        if !ok {
            return nil, errors.New("expected hash-map key string")
        }
        m[key] = lst[i+1]
    }
    return m, nil
}

// read_form parses the next complete form from rdr.
//
// It peeks at the upcoming token to decide how to proceed: an opening
// "(", "[" or "{" dispatches to read_list, read_vector or read_hash_map,
// a stray closing delimiter is reported as an error, and anything else is
// handed to read_atom. An error is also returned when rdr has no tokens left.
func read_form(rdr Reader) (types.MalType, error) {
    token := rdr.peek()
    if token == nil {
        return nil, errors.New("read_form underflow")
    }

    // Every arm returns, so no statement is needed after the switch.
    switch *token {
    // list
    case ")":
        return nil, errors.New("unexpected ')'")
    case "(":
        return read_list(rdr, "(", ")")

    // vector
    case "]":
        return nil, errors.New("unexpected ']'")
    case "[":
        return read_vector(rdr)

    // hash-map
    case "}":
        return nil, errors.New("unexpected '}'")
    case "{":
        return read_hash_map(rdr)

    default:
        return read_atom(rdr)
    }
}

// Read_str tokenizes str and parses the first form found in it.
// Input that yields no tokens produces the error "<empty line>"; otherwise
// the result (or error) of read_form on a fresh TokenReader is returned.
func Read_str(str string) (types.MalType, error) {
    tokens := tokenize(str)
    if len(tokens) > 0 {
        return read_form(&TokenReader{tokens: tokens, position: 0})
    }
    return nil, errors.New("<empty line>")
}