aboutsummaryrefslogtreecommitdiff
path: root/src/runMain/kotlin/Lexical.kt
blob: dbf2bad7f28a29e023704869c5caf3a6fc220d51 (plain) (blame)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
import TokenType.*
import exceptions.*

class Lexical {
    /**
     * Analyzes the given [source] and returns the tokens divided into an array of statements
     * TODO: Add line number to token (abstract to class?)
     */
    fun analyze(source: String): MutableList<MutableList<Pair<String, TokenType>>> {
        var buffer = ""
        var skipStatementEnd = false
        var statementEnd: Boolean
        val statements = mutableListOf<MutableList<Pair<String, TokenType>>>()
        val currentStatement = mutableListOf<Pair<String, TokenType>>()
        for (i in source.indices) {
            buffer += source[i]
            if (source[i] == '"') skipStatementEnd = !skipStatementEnd
            statementEnd = source[i] == ';' && !skipStatementEnd
            val tokenType = getTokenType(buffer, if (source.length > i + 1) source[i + 1] else ' ')
            if (tokenType != Skip && !statementEnd) {
                currentStatement.add(buffer to tokenType)
                buffer = ""
            } else if (statementEnd) {
                statements.add(currentStatement.toMutableList())
                currentStatement.clear()
                buffer = ""
            }
        }
        return statements
    }

    /**
     * Matches the tokens to a [TokenType]
     */
    private fun getTokenType(token: String, next: Char): TokenType {
        return when {
            token + next in keyword -> Skip
            token in keyword -> Keyword

            token + next in comparison -> Skip
            token in assignment -> Assignment

            token + next in assignment -> Skip
            token in arithmetic -> Arithmetic

            token + next in comparison -> Skip
            token in comparison -> Comparison

            token + next in comparison -> Skip
            token in logical -> Logical

            (token + next).matches(Regex("[a-zA-Z]*")) -> Skip
            token.matches(Regex("[a-zA-Z]*")) -> Identifier

            (token + next).matches(Regex("[0-9]*")) -> Skip
            token.matches(Regex("[0-9]*")) -> Constant

            token in emptiness && token.length > 1 -> throw UnknownType(token)
            token in emptiness -> Empty

            token in punctuation -> Punctuation

            token in brackets -> Bracket

            token in classifier -> Classifier

            else -> Skip
        }
    }

    private val keyword = listOf("print") // TODO: DataType matching
    private val assignment = listOf("=", "+=", "-=", "*=", "/*")
    private val arithmetic = listOf("+", "-", "*", "/", "%")
    private val comparison = listOf("==", "!=", "<", "<=", ">", ">=")
    private val logical = listOf("&&", "||", "!")
    private val punctuation = listOf(",", ":", ".", ";")
    private val brackets = listOf("(", ")", "[", "]", "{", "}") // TODO: Use brackets for functions
    private val classifier = listOf("\"", "'")
    private val emptiness = listOf(" ", "\t")
}