Added string support to the tokenizer, added comments to the code.

This commit is contained in:
Marvin Blum
2015-10-09 11:29:52 +02:00
parent 25d691eb66
commit e88a6b48a8
6 changed files with 71 additions and 17 deletions

.gitignore vendored Normal file

@@ -0,0 +1,2 @@
+/bin/
+/pkg/
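The ignored /bin/ and /pkg/ directories are the build output folders of a classic GOPATH-style Go workspace (compiled binaries and package objects), so they are kept out of version control.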

in/test.asl Normal file

@@ -0,0 +1,3 @@
+var _x = "This is a string!";
+var _y = "";
+var _z = "\"mask\"";
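These three lines exercise the new string support in the tokenizer: an ordinary string, an empty string, and a string containing escaped quotes. With the mask handling added below, the last line should come out as the tokens var, _z, =, "\"mask\"" and ; (assuming "=" and ";" are in the delimiter list and "var" is a keyword), instead of being split apart at the inner quotes.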

@@ -6,6 +6,8 @@ import (
 const TAB = " "
+// Parses the tokens, validates the code to a certain degree
+// and writes the SQF code to the desired location.
 func Parse(token []Token) string {
 	initParser(token)

@@ -5,6 +5,7 @@ var tokenIndex int
 var out string
 var offset int
+// Initializes the parser.
 func initParser(token []Token) {
 	if len(token) == 0 {
 		panic("No tokens provided")
@@ -16,10 +17,14 @@ func initParser(token []Token) {
 	offset = 0
 }
+// Returns true if the current token matches the expected one.
+// Unlike "expect", it does not panic and it first checks that a token is available.
 func accept(token string) bool {
 	return tokenIndex < len(tokens) && tokenEqual(token, get())
 }
+// Strict version of "accept".
+// Panics if the current token does not match the expected one.
 func expect(token string) {
 	if !tokenEqual(token, get()) {
 		panic("Parse error, expected '" + token + "' but was '" + get().token + "'")
@@ -28,10 +33,12 @@ func expect(token string) {
 	next()
 }
+// Advances the token counter so that the next token is examined.
 func next() {
 	tokenIndex++
 }
+// Returns the current token or panics if no more tokens are available.
 func get() Token {
 	if tokenIndex >= len(tokens) {
 		panic("No more tokens")
@@ -40,14 +47,17 @@ func get() Token {
 	return tokens[tokenIndex]
 }
+// Returns true if the end of the input code was reached.
 func end() bool {
 	return tokenIndex == len(tokens)
 }
+// Checks whether the given string matches the token's text.
 func tokenEqual(a string, b Token) bool {
 	return a == b.token
 }
+// Appends the given string to the current SQF output.
 func appendOut(str string) {
 	out += str
 }

@@ -42,34 +42,65 @@ var keywords = []string{
 var whitespace = []byte{' ', '\n', '\t'}
+// Tokenizes the given byte array into syntax tokens,
+// which can be parsed later.
 func Tokenize(code []byte) []Token {
 	code = removeComments(code)
 	tokens := make([]Token, 0)
-	token := ""
-	fmt.Println(string(code))
+	token, mask, isstring := "", false, false
+	fmt.Println("CODE:\n"+string(code)) // TODO: remove
 	for i := range code {
 		c := code[i]
-		if byteArrayContains(delimiter, c) {
-			if token != "" {
-				tokens = append(tokens, Token{token})
-			}
-			tokens = append(tokens, Token{string(c)})
-			token = ""
-		} else if stringArrayContains(keywords, strings.ToLower(token)) {
-			tokens = append(tokens, Token{token})
-			token = ""
-		} else if !byteArrayContains(whitespace, c) {
-			token += string(c)
-		}
+		// string masks (backslash)
+		if c == '\\' && !mask {
+			token += "\\"
+			mask = true
+			continue
+		}
+		// string
+		if c == '"' && !mask {
+			token += "\""
+			isstring = !isstring
+			continue
+		}
+		if isstring {
+			token += string(c)
+		} else {
+			// delimiter, keyword or variable/expression
+			if byteArrayContains(delimiter, c) {
+				if token != "" {
+					tokens = append(tokens, Token{token})
+				}
+				tokens = append(tokens, Token{string(c)})
+				token = ""
+			} else if stringArrayContains(keywords, strings.ToLower(token)) {
+				tokens = append(tokens, Token{token})
+				token = ""
+			} else if !byteArrayContains(whitespace, c) {
+				token += string(c)
+			}
+		}
+		mask = false
 	}
+	fmt.Println("TOKENS:") // TODO: remove
+	for t := range tokens {
+		fmt.Println(tokens[t].token)
+	}
 	return tokens
 }
+// Removes all comments from the input byte array.
+// Comments are single-line comments starting with // (two slashes)
+// and multi-line comments delimited by /* ... */ (slash-star, star-slash).
 func removeComments(code []byte) []byte {
 	newcode := make([]byte, len(code))
 	j := 0
@@ -92,6 +123,8 @@ func removeComments(code []byte) []byte {
 	return newcode[:j]
 }
+// Returns the next character in code after index i.
+// If no character is left, '0' will be returned.
 func nextChar(code []byte, i int) byte {
 	i++
@@ -102,6 +135,7 @@ func nextChar(code []byte, i int) byte {
 	return '0'
 }
+// Used to skip a line when a single-line comment was found.
 func skipSingleLineComment(code []byte, i int) int {
 	for i < len(code) && code[i] != '\n' {
 		i++
@@ -110,6 +144,7 @@ func skipSingleLineComment(code []byte, i int) int {
 	return i
 }
+// Used to skip a block of characters when a multi-line comment was found.
 func skipMultiLineComment(code []byte, i int) int {
 	for i < len(code) && !(code[i] == '*' && nextChar(code, i) == '/') {
 		i++
@@ -118,6 +153,7 @@ func skipMultiLineComment(code []byte, i int) int {
 	return i + 1
 }
+// Checks whether a byte slice contains the given byte.
 func byteArrayContains(haystack []byte, needle byte) bool {
 	for i := range haystack {
 		if haystack[i] == needle {
@@ -128,6 +164,7 @@ func byteArrayContains(haystack []byte, needle byte) bool {
 	return false
 }
+// Checks whether a string slice contains the given string.
 func stringArrayContains(haystack []string, needle string) bool {
 	for i := range haystack {
 		if haystack[i] == needle {
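A minimal sketch of the expected tokenizer behaviour (a hypothetical test, not part of this commit; it assumes "=" and ";" are delimiters, "var" is a keyword, and it lives in the same package so it can read the unexported token field):

package asl

import "testing"

func TestTokenizeString(t *testing.T) {
	tokens := Tokenize([]byte(`var _x = "This is a string!";`))
	want := []string{"var", "_x", "=", `"This is a string!"`, ";"}
	if len(tokens) != len(want) {
		t.Fatalf("got %d tokens, want %d", len(tokens), len(want))
	}
	for i := range want {
		if tokens[i].token != want[i] {
			t.Errorf("token %d: got %q, want %q", i, tokens[i].token, want[i])
		}
	}
}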

@@ -8,9 +8,9 @@ import (
 func main() {
 	// read test file
-	code, _ := ioutil.ReadFile("in/simple.asl")
+	code, _ := ioutil.ReadFile("in/test.asl")
 	token := asl.Tokenize(code)
 	out := asl.Parse(token)
-	fmt.Println(out)
+	fmt.Println("OUTPUT:\n"+out) // TODO: remove
 }