13 changed files with 251 additions and 395 deletions
--- a/.gitignore
+++ b/.gitignore
@ -1 +1,2 @@
-kg/kg
+re
+
--- a/8
+++ b/8
@ -5,13 +5,9 @@ fmt:
 	go fmt ./...
 vet: fmt
 	go vet ./...
-buildLibUnopt: vet
-	go build -gcflags="all=-N -l" ./...
-unopt: buildLibUnopt
-	go build -C kg/ -gcflags="all=-N -l" -o kg ./...
 buildLib: vet
-	go build ./...
+	go build -gcflags="all=-N -l" ./...
 buildCmd: buildLib
-	go build -C kg/ -o kg ./...
+	go build -C cmd/ -gcflags="all=-N -l" -o re ./...
 test: buildCmd
 	go test -v ./...
--- a/README.md
+++ b/README.md
@ -2,8 +2,8 @@

 Kleingrep is a regular expression engine, providing a library and command-line tool written in Go.

-It aims to provide a more featureful engine, compared to the one in Go's
-[regexp](https://pkg.go.dev/regexp), while retaining some semblance of efficiency.
+It aims to provide a more featureful engine, compared to the one in
+[Go's standard library](https://pkg.go.dev/regexp), while retaining some semblance of efficiency.

 The engine does __not__ use backtracking, relying on the NFA-based method described in
 [Russ Cox's articles](https://swtch.com/~rsc/regexp). As such, it is immune to catastrophic backtracking.
@ -15,7 +15,3 @@ It also includes features not present in regexp, such as lookarounds and backref
 The syntax is, for the most part, a superset of Go's regexp. A full overview of the syntax can be found [here](https://pkg.go.dev/gitea.twomorecents.org/Rockingcool/kleingrep/regex#hdr-Syntax).

 __For more information, see https://pkg.go.dev/gitea.twomorecents.org/Rockingcool/kleingrep/regex__.
-
-### How it works
-
-I've written about the inner workings of the engine [on my blog](https://twomorecents.org/writing-regex-engine/index.html).
--- a/cmd/helpers.go
+++ b/cmd/helpers.go
@ -1,11 +1,6 @@
 package main

-import (
-	"bufio"
-	"os"
-	"slices"
-	"strings"
-)
+import "slices"

 type character interface {
 	int | rune
@ -30,23 +25,3 @@ func genRange[T character](start, end T) []T {
 	}
 	return toRet
 }
-
-// Returns whether or not the given file contains a NULL character
-func fileContainsNullChar(filename string) (bool, error) {
-	file, err := os.Open(filename)
-	if err != nil {
-		return true, err
-	}
-	defer file.Close()
-	scanner := bufio.NewScanner(file)
-	for scanner.Scan() {
-		line := scanner.Text()
-		if strings.Contains(line, "\000") {
-			return true, nil
-		}
-	}
-	if err := scanner.Err(); err != nil {
-		return true, err
-	}
-	return false, nil
-}
--- a/cmd/main.go
+++ b/cmd/main.go
@ -0,0 +1,227 @@
+package main
+
+import (
+	"bufio"
+	"flag"
+	"fmt"
+	"io"
+	"os"
+
+	"github.com/fatih/color"
+
+	reg "gitea.twomorecents.org/Rockingcool/kleingrep/regex"
+)
+
+func main() {
+	// Flags for the regex Compile function
+	flagsToCompile := make([]reg.ReFlag, 0)
+
+	invertFlag := flag.Bool("v", false, "Invert match.")
+	// This flag has two 'modes':
+	// 1. Without '-v': Prints only matches. Prints a newline after every match.
+	// 2. With '-v': Substitutes all matches with empty string.
+	onlyFlag := flag.Bool("o", false, "Print only colored content. Overrides -l.")
+	lineFlag := flag.Bool("l", false, "Only print lines with a match (or with no matches, if -v is enabled). Similar to grep's default.")
+	multiLineFlag := flag.Bool("t", false, "Multi-line mode. Treats newline just like any character.")
+	printMatchesFlag := flag.Bool("p", false, "Prints start and end index of each match. Can only be used with '-t' for multi-line mode.")
+	caseInsensitiveFlag := flag.Bool("i", false, "Case-insensitive. Disregard the case of all characters.")
+	matchNum := flag.Int("m", 0, "Print the match with the given index. Eg. -m 3 prints the third match.")
+	substituteText := flag.String("s", "", "Substitute the contents of each match with the given string. Overrides -o and -v")
+	flag.Parse()
+
+	// These flags have to be passed to the Compile function
+	if *multiLineFlag {
+		flagsToCompile = append(flagsToCompile, reg.RE_MULTILINE, reg.RE_SINGLE_LINE)
+	}
+	if *caseInsensitiveFlag {
+		flagsToCompile = append(flagsToCompile, reg.RE_CASE_INSENSITIVE)
+	}
+
+	// -l and -o are mutually exclusive: -o overrides -l
+	if *onlyFlag {
+		*lineFlag = false
+	}
+	// Check if substitute and matchNum flags have been enabled
+	substituteFlagEnabled := false
+	matchNumFlagEnabled := false
+	flag.Visit(func(f *flag.Flag) {
+		if f.Name == "s" {
+			substituteFlagEnabled = true
+		}
+		if f.Name == "m" {
+			matchNumFlagEnabled = true
+		}
+	})
+
+	// Validate matchNumFlag - must be positive integer
+	if matchNumFlagEnabled && *matchNum < 1 {
+		panic("Invalid match number to print.")
+	}
+
+	// Process:
+	// 1. Convert regex into postfix notation (Shunting-Yard algorithm)
+	// 		a. Add explicit concatenation operators to facilitate this
+	// 2. Build NFA from postfix representation (Thompson's algorithm)
+	// 3. Run the string against the NFA
+
+	if len(flag.Args()) != 1 { // flag.Args() also strips out program name
+		fmt.Println("ERROR: Missing cmdline args")
+		os.Exit(22)
+	}
+	var re string
+	re = flag.Args()[0]
+	var test_str string
+	var err error
+	var linesRead bool // Whether or not we have read the lines in the file
+	lineNum := 0       // Current line number
+	// Create reader for stdin and writer for stdout
+	reader := bufio.NewReader(os.Stdin)
+	out := bufio.NewWriter(os.Stdout)
+
+	regComp, err := reg.Compile(re, flagsToCompile...)
+	if err != nil {
+		fmt.Println(err)
+		return
+	}
+	for true {
+		if linesRead {
+			break
+		}
+		if !(*multiLineFlag) {
+			// Read every string from stdin until we encounter an error. If the error isn't EOF, panic.
+			test_str, err = reader.ReadString('\n')
+			lineNum++
+			if err != nil {
+				if err == io.EOF {
+					linesRead = true
+				} else {
+					panic(err)
+				}
+			}
+			if len(test_str) > 0 && test_str[len(test_str)-1] == '\n' {
+				test_str = test_str[:len(test_str)-1]
+			}
+		} else {
+			// Multi-line mode - read every line of input into a temp. string.
+			// test_str will contain all lines of input (including newline characters)
+			// as one string.
+			var temp string
+			for temp, err = reader.ReadString('\n'); err == nil; temp, err = reader.ReadString('\n') {
+				test_str += temp
+			}
+			// Assuming err != nil
+			if err == io.EOF {
+				if len(temp) > 0 {
+					test_str += temp // Add the last line (if it is non-empty)
+				}
+				linesRead = true
+			} else {
+				panic(err)
+			}
+		}
+		matchIndices := make([]reg.Match, 0)
+		if matchNumFlagEnabled {
+			tmp, err := regComp.FindNthMatch(test_str, *matchNum)
+			if err == nil {
+				matchIndices = append(matchIndices, tmp)
+			}
+		} else {
+			matchIndices = regComp.FindAllSubmatch(test_str)
+		}
+
+		test_str_runes := []rune(test_str) // Converting to runes preserves unicode characters
+
+		if *printMatchesFlag {
+			// If we are in single-line mode, print the number of the line on
+			// which the matches occur.
+			if len(matchIndices) > 0 {
+				if !(*multiLineFlag) {
+					fmt.Fprintf(out, "Line %d:\n", lineNum)
+				}
+				for _, m := range matchIndices {
+					fmt.Fprintf(out, "%s\n", m.String())
+				}
+				err := out.Flush()
+				if err != nil {
+					panic(err)
+				}
+			}
+			continue
+		}
+		// Decompose the array of matchIndex structs into a flat unique array of ints - if matchIndex is {4,7}, flat array will contain 4,5,6
+		// This should make checking O(1) instead of O(n)
+		indicesToPrint := new_uniq_arr[int]()
+		for _, idx := range matchIndices {
+			indicesToPrint.add(genRange(idx[0].StartIdx, idx[0].EndIdx)...)
+		}
+		// If we are inverting, then we should print the indices which _didn't_ match
+		// in color.
+		if *invertFlag {
+			oldIndices := indicesToPrint.values()
+			indicesToPrint = new_uniq_arr[int]()
+			// Explanation:
+			// Find all numbers from 0 to len(test_str_runes) that are NOT in oldIndices.
+			// These are the values we want to print, now that we have inverted the match.
+			// Re-initialize indicesToPrint and add all of these values to it.
+			indicesToPrint.add(setDifference(genRange(0, len(test_str_runes)), oldIndices)...)
+
+		}
+		// If lineFlag is enabled, we should only print something if:
+		// 		a. We are not inverting, and have at least one match on the current line
+		// 		OR
+		// 		b. We are inverting, and have no matches at all on the current line.
+		// This checks for the inverse, and continues if it is true.
+		if *lineFlag {
+			if !(*invertFlag) && len(matchIndices) == 0 || *invertFlag && len(matchIndices) > 0 {
+				continue
+			}
+		}
+
+		// If we are substituting, we need a different behavior, as follows:
+		// For every character in the test string:
+		// 		1. Check if the index is the start of any matchIndex
+		// 		2. If so, print the substitute text, and set our index to
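+		//			the corresponding end index. NOTE(review): assigning to a range loop variable does not affect later iterations in Go, so the remaining characters of the match still appear to be printed - confirm and fix.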
+		// 		3. If not, just print the character.
+		if substituteFlagEnabled {
+			for i := range test_str_runes {
+				inMatchIndex := false
+				for _, m := range matchIndices {
+					if i == m[0].StartIdx {
+						fmt.Fprintf(out, "%s", *substituteText)
+						i = m[0].EndIdx
+						inMatchIndex = true
+						break
+					}
+				}
+				if !inMatchIndex {
+					fmt.Fprintf(out, "%c", test_str_runes[i])
+				}
+			}
+		} else {
+			for i, c := range test_str_runes {
+				if indicesToPrint.contains(i) {
+					color.New(color.FgRed).Fprintf(out, "%c", c)
+					// Newline after every match - only if -o is enabled and -v is disabled.
+					if *onlyFlag && !(*invertFlag) {
+						for _, idx := range matchIndices {
+							if i+1 == idx[0].EndIdx { // End index is one more than last index of match
+								fmt.Fprintf(out, "\n")
+								break
+							}
+						}
+					}
+				} else {
+					if !(*onlyFlag) {
+						fmt.Fprintf(out, "%c", c)
+					}
+				}
+			}
+		}
+		err = out.Flush()
+		if err != nil {
+			panic(err)
+		}
+		fmt.Println()
+	}
+}
--- a/cmd/unique_array.go
+++ b/cmd/unique_array.go
@ -36,7 +36,3 @@ func (s uniq_arr[T]) values() []T {
 	}
 	return toRet
 }
-
-func (s uniq_arr[T]) len() int {
-	return len(s.backingMap)
-}
--- a/kg/main.go
+++ b/kg/main.go
@ -1,317 +0,0 @@
-package main
-
-import (
-	"bufio"
-	"flag"
-	"fmt"
-	"io"
-	"io/fs"
-	"os"
-	"path/filepath"
-	"slices"
-
-	"github.com/fatih/color"
-
-	reg "gitea.twomorecents.org/Rockingcool/kleingrep/regex"
-)
-
-func main() {
-	// Flags for the regex Compile function
-	flagsToCompile := make([]reg.ReFlag, 0)
-
-	invertFlag := flag.Bool("v", false, "Invert match.")
-	// This flag has two 'modes':
-	// 1. Without '-v': Prints only matches. Prints a newline after every match.
-	// 2. With '-v': Substitutes all matches with empty string.
-	onlyFlag := flag.Bool("o", false, "Print only colored content. Overrides -l.")
-	lineFlag := flag.Bool("l", false, "Only print lines with a match (or with no matches, if -v is enabled). Similar to grep's default.")
-	multiLineFlag := flag.Bool("t", false, "Multi-line mode. Treats newline just like any character.")
-	printMatchesFlag := flag.Bool("p", false, "Prints start and end index of each match. Can only be used with '-t' for multi-line mode.")
-	caseInsensitiveFlag := flag.Bool("i", false, "Case-insensitive. Disregard the case of all characters.")
-	recursiveFlag := flag.Bool("r", false, "Recursively search all files in the given directory.")
-	lineNumFlag := flag.Bool("n", false, "For each line with a match, print the line number. Implies -l.")
-	matchNum := flag.Int("m", 0, "Print the match with the given index. Eg. -m 3 prints the third match.")
-	substituteText := flag.String("s", "", "Substitute the contents of each match with the given string. Overrides -o and -v")
-	flag.Parse()
-
-	// These flags have to be passed to the Compile function
-	if *multiLineFlag {
-		flagsToCompile = append(flagsToCompile, reg.RE_MULTILINE, reg.RE_SINGLE_LINE)
-	}
-	if *caseInsensitiveFlag {
-		flagsToCompile = append(flagsToCompile, reg.RE_CASE_INSENSITIVE)
-	}
-
-	// -l and -o are mutually exclusive: -o overrides -l
-	if *onlyFlag {
-		*lineFlag = false
-	}
-	// Check if substitute and matchNum flags have been enabled
-	substituteFlagEnabled := false
-	matchNumFlagEnabled := false
-	flag.Visit(func(f *flag.Flag) {
-		if f.Name == "s" {
-			substituteFlagEnabled = true
-		}
-		if f.Name == "m" {
-			matchNumFlagEnabled = true
-		}
-	})
-
-	// Validate matchNumFlag - must be positive integer
-	if matchNumFlagEnabled && *matchNum < 1 {
-		panic("Invalid match number to print.")
-	}
-
-	// Enable lineFlag if lineNumFlag is enabled
-	if *lineNumFlag {
-		*lineFlag = true
-	}
-
-	// Process:
-	// 1. Convert regex into postfix notation (Shunting-Yard algorithm)
-	// 		a. Add explicit concatenation operators to facilitate this
-	// 2. Build NFA from postfix representation (Thompson's algorithm)
-	// 3. Run the string against the NFA
-
-	if len(flag.Args()) < 1 { // flag.Args() also strips out program name
-		fmt.Printf("%s: ERROR: Missing cmdline args\n", os.Args[0])
-		os.Exit(22)
-	}
-	if *recursiveFlag && len(flag.Args()) < 2 { // File/Directory must be provided with '-r'
-		fmt.Printf("%s: ERROR: Missing cmdline args\n", os.Args[0])
-		os.Exit(22)
-	}
-	var re string
-	re = flag.Args()[0]
-	var inputFiles []*os.File
-	if len(flag.Args()) == 1 || flag.Args()[1] == "-" { // Either no file argument, or file argument is "-"
-		if !slices.Contains(inputFiles, os.Stdin) {
-			inputFiles = append(inputFiles, os.Stdin) // os.Stdin cannot be entered more than once into the file list
-		}
-	} else {
-		inputFilenames := flag.Args()[1:]
-		for _, inputFilename := range inputFilenames {
-			inputFile, err := os.Open(inputFilename)
-			defer inputFile.Close()
-			if err != nil {
-				fmt.Printf("%s: %s: No such file or directory\n", os.Args[0], inputFilename)
-			} else {
-				fileStat, err := inputFile.Stat()
-				if err != nil {
-					fmt.Printf("%v\n", err)
-					os.Exit(2)
-				} else {
-					if fileStat.Mode().IsDir() {
-						if *recursiveFlag {
-							// Walk the directory and open every file in it. Add each file to the filelist.
-							filepath.WalkDir(inputFilename, func(filename string, d fs.DirEntry, err error) error {
-								if err != nil {
-									return err
-								}
-								if !d.IsDir() {
-									f, err := os.Open(filename)
-									if err != nil {
-										return err
-									}
-									inputFiles = append(inputFiles, f)
-								}
-								return nil
-							})
-						} else {
-							fmt.Printf("%s: %s: Is a directory\n", os.Args[0], inputFilename)
-						}
-					} else {
-						var nullCharPresent bool
-						if nullCharPresent, err = fileContainsNullChar(inputFilename); nullCharPresent {
-							if err != nil {
-								fmt.Printf("%v\n", err)
-								os.Exit(1)
-							} else {
-								fmt.Printf("%s: %s: Is a binary file\n", os.Args[0], inputFilename)
-							}
-						} else {
-							inputFiles = append(inputFiles, inputFile)
-						}
-					}
-				}
-			}
-		}
-	}
-	if len(inputFiles) == 0 { // No valid files given
-		os.Exit(2)
-	}
-
-	var test_str string
-	var err error
-	var linesRead bool // Whether or not we have read the lines in the file
-	lineNum := 0       // Current line number
-	// Create writer for stdout
-	out := bufio.NewWriter(os.Stdout)
-	// Compile regex
-	regComp, err := reg.Compile(re, flagsToCompile...)
-	if err != nil {
-		fmt.Println(err)
-		return
-	}
-
-	for _, inputFile := range inputFiles {
-		lineNum = 0
-		reader := bufio.NewReader(inputFile)
-		linesRead = false
-		for true {
-			if linesRead {
-				break
-			}
-			if !(*multiLineFlag) {
-				// Read every string from stdin until we encounter an error. If the error isn't EOF, panic.
-				test_str, err = reader.ReadString('\n')
-				lineNum++
-				if err != nil {
-					if err == io.EOF {
-						linesRead = true
-					} else {
-						panic(err)
-					}
-				}
-				if len(test_str) > 0 && test_str[len(test_str)-1] == '\n' {
-					test_str = test_str[:len(test_str)-1]
-				}
-			} else {
-				// Multi-line mode - read every line of input into a temp. string.
-				// test_str will contain all lines of input (including newline characters)
-				// as one string.
-				var temp string
-				for temp, err = reader.ReadString('\n'); err == nil; temp, err = reader.ReadString('\n') {
-					test_str += temp
-				}
-				// Assuming err != nil
-				if err == io.EOF {
-					if len(temp) > 0 {
-						test_str += temp // Add the last line (if it is non-empty)
-					}
-					linesRead = true
-				} else {
-					panic(err)
-				}
-			}
-			matchIndices := make([]reg.Match, 0)
-			if matchNumFlagEnabled {
-				tmp, err := regComp.FindNthMatch(test_str, *matchNum)
-				if err == nil {
-					matchIndices = append(matchIndices, tmp)
-				}
-			} else {
-				matchIndices = regComp.FindAllSubmatch(test_str)
-			}
-
-			test_str_runes := []rune(test_str) // Converting to runes preserves unicode characters
-
-			if *printMatchesFlag {
-				// if we are in single line mode, print the line on which
-				// the matches occur
-				if len(matchIndices) > 0 {
-					if !(*multiLineFlag) {
-						fmt.Fprintf(out, "Line %d:\n", lineNum)
-					}
-					for _, m := range matchIndices {
-						fmt.Fprintf(out, "%s\n", m.String())
-					}
-					err := out.Flush()
-					if err != nil {
-						panic(err)
-					}
-				}
-				continue
-			}
-			// Decompose the array of matchIndex structs into a flat unique array of ints - if matchIndex is {4,7}, flat array will contain 4,5,6
-			// This should make checking O(1) instead of O(n)
-			indicesToPrint := new_uniq_arr[int]()
-			for _, idx := range matchIndices {
-				indicesToPrint.add(genRange(idx[0].StartIdx, idx[0].EndIdx)...)
-			}
-			// If we are inverting, then we should print the indices which _didn't_ match
-			// in color.
-			if *invertFlag {
-				oldIndices := indicesToPrint.values()
-				indicesToPrint = new_uniq_arr[int]()
-				// Explanation:
-				// Find all numbers from 0 to len(test_str_runes) that are NOT in oldIndices.
-				// These are the values we want to print, now that we have inverted the match.
-				// Re-initialize indicesToPrint and add all of these values to it.
-				indicesToPrint.add(setDifference(genRange(0, len(test_str_runes)), oldIndices)...)
-
-			}
-			// If lineFlag is enabled, we should only print something if:
-			// 		a. We are not inverting, and have at least one match on the current line
-			// 		OR
-			// 		b. We are inverting, and have no matches at all on the current line.
-			// This checks for the inverse, and continues if it is true.
-			if *lineFlag {
-				if !(*invertFlag) && len(matchIndices) == 0 || *invertFlag && len(matchIndices) > 0 {
-					continue
-				} else {
-					if *recursiveFlag || len(flag.Args()) > 2 { // If we have 2 args, then we're only searching 1 file. We should only print the filename if there's more than 1 file.
-						color.New(color.FgMagenta).Fprintf(out, "%s:", inputFile.Name()) // Print filename
-					}
-					if *lineNumFlag {
-						color.New(color.FgGreen).Fprintf(out, "%d:", lineNum) // Print filename
-					}
-				}
-			}
-
-			// If we are substituting, we need a different behavior, as follows:
-			// For every character in the test string:
-			// 		1. Check if the index is the start of any matchIndex
-			// 		2. If so, print the substitute text, and set our index to
-			//			the corresponding end index.
-			// 		3. If not, just print the character.
-			if substituteFlagEnabled {
-				for i := range test_str_runes {
-					inMatchIndex := false
-					for _, m := range matchIndices {
-						if i == m[0].StartIdx {
-							fmt.Fprintf(out, "%s", *substituteText)
-							i = m[0].EndIdx
-							inMatchIndex = true
-							break
-						}
-					}
-					if !inMatchIndex {
-						fmt.Fprintf(out, "%c", test_str_runes[i])
-					}
-				}
-			} else {
-				for i, c := range test_str_runes {
-					if indicesToPrint.contains(i) {
-						color.New(color.FgRed, color.Bold).Fprintf(out, "%c", c)
-						// Newline after every match - only if -o is enabled and -v is disabled.
-						if *onlyFlag && !(*invertFlag) {
-							for matchIdxNum, idx := range matchIndices {
-								if matchIdxNum < len(matchIndices)-1 { // Only print a newline afte printing a match, if there are multiple matches on the line, and we aren't on the last one. This is because the newline that gets added at the end will take care of that.
-									if i+1 == idx[0].EndIdx { // End index is one more than last index of match
-										fmt.Fprintf(out, "\n")
-										break
-									}
-								}
-							}
-						}
-					} else {
-						if !(*onlyFlag) {
-							fmt.Fprintf(out, "%c", c)
-						}
-					}
-				}
-			}
-			err = out.Flush()
-			if err != nil {
-				panic(err)
-			}
-			// If the last character in the string wasn't a newline, AND we either have don't -o set or we do (and we've matched something), then print a newline
-			if (len(test_str_runes) > 0 && test_str_runes[len(test_str_runes)-1] != '\n') &&
-				(!*onlyFlag || indicesToPrint.len() > 0) {
-				fmt.Println()
-			}
-		}
-	}
-}
--- a/regex/compile.go
+++ b/regex/compile.go
@ -47,7 +47,6 @@ func (re *Reg) UnmarshalText(text []byte) error {
 	return err
 }

-// Longest makes future searches prefer the longest branch of an alternation, as opposed to the leftmost branch.
 func (re *Reg) Longest() {
 	re.preferLongest = true
 }
@ -411,10 +410,10 @@ func shuntingYard(re string, flags ...ReFlag) ([]postfixNode, error) {
 				if i >= len(re_runes) {
 					return nil, fmt.Errorf("unclosed lookaround")
 				}
-				if (re_runes[i] == '(' && re_runes[i-1] != '\\') || re_runes[i] == nonCapLparenRune {
+				if re_runes[i] == '(' || re_runes[i] == nonCapLparenRune {
 					numOpenParens++
 				}
-				if re_runes[i] == ')' && re_runes[i-1] != '\\' {
+				if re_runes[i] == ')' {
 					numOpenParens--
 					if numOpenParens == 0 {
 						break
@ -499,7 +498,7 @@ func shuntingYard(re string, flags ...ReFlag) ([]postfixNode, error) {
 				}
 			} else if re_postfix[i] == 'p' || re_postfix[i] == 'P' {
 				charClassInverted := (re_postfix[i] == 'P')
-				var charsInClass []rune
+				charsInClass := []rune{}
 				i++
 				if isUnicodeCharClassLetter(re_postfix[i]) {
 					var err error
@ -590,10 +589,10 @@ func shuntingYard(re string, flags ...ReFlag) ([]postfixNode, error) {
 				if i >= len(re_postfix) {
 					return nil, fmt.Errorf("unclosed lookaround")
 				}
-				if (re_postfix[i] == '(' && re_postfix[i-1] != '\\') || re_postfix[i] == nonCapLparenRune {
+				if re_postfix[i] == '(' || re_postfix[i] == nonCapLparenRune {
 					numOpenParens++
 				}
-				if re_postfix[i] == ')' && re_postfix[i-1] != '\\' {
+				if re_postfix[i] == ')' {
 					numOpenParens--
 					if numOpenParens == 0 {
 						break
@ -714,7 +713,7 @@ func shuntingYard(re string, flags ...ReFlag) ([]postfixNode, error) {
 						}
 					} else if re_postfix[i] == 'p' || re_postfix[i] == 'P' {
 						charClassInverted := (re_postfix[i] == 'P')
-						var charsInList []rune
+						charsInList := []rune{}
 						i++
 						if isUnicodeCharClassLetter(re_postfix[i]) {
 							var err error
--- a/regex/doc.go
+++ b/regex/doc.go
@ -161,7 +161,6 @@ The following features from [regexp] are (currently) NOT supported:
 2. Negated POSIX classes
 3. Embedded flags (flags are instead passed as arguments to [Compile])
 4. Literal text with \Q ... \E
- 5. Finite repetition with no start (defaulting at 0)

 The following features are not available in [regexp], but are supported in my engine:
 1. Lookarounds
--- a/regex/nfa.go
+++ b/regex/nfa.go
@ -45,11 +45,11 @@ type nfaState struct {
 	groupBegin                 bool       // Whether or not the node starts a capturing group
 	groupEnd                   bool       // Whether or not the node ends a capturing group
 	groupNum                   int        // Which capturing group the node starts / ends
-	isBackreference            bool       // Whether or not current node is backreference
-	referredGroup              int        // If current node is a backreference, the node that it points to
 	// The following properties depend on the current match - I should think about resetting them for every match.
-	threadGroups  []Group // Assuming that a state is part of a 'thread' in the matching process, this array stores the indices of capturing groups in the current thread. As matches are found for this state, its groups will be copied over.
-	threadBackref int     // If current node is a backreference, how many characters to look forward into the referred group
+	threadGroups    []Group // Assuming that a state is part of a 'thread' in the matching process, this array stores the indices of capturing groups in the current thread. As matches are found for this state, its groups will be copied over.
+	isBackreference bool    // Whether or not current node is backreference
+	referredGroup   int     // If current node is a backreference, the node that it points to
+	threadBackref   int     // If current node is a backreference, how many characters to look forward into the referred group
 }

 // Clones the NFA starting from the given state.
@ -86,8 +86,6 @@ func cloneStateHelper(stateToClone *nfaState, cloneMap map[*nfaState]*nfaState)
 		groupEnd:        stateToClone.groupEnd,
 		groupBegin:      stateToClone.groupBegin,
 		groupNum:        stateToClone.groupNum,
-		isBackreference: stateToClone.isBackreference,
-		referredGroup:   stateToClone.referredGroup,
 	}
 	cloneMap[stateToClone] = clone
 	for i, s := range stateToClone.output {
--- a/regex/postfixNode.go
+++ b/regex/postfixNode.go
@ -131,9 +131,13 @@ func newEscapedNode(c rune, inCharClass bool) (postfixNode, error) {
 	case 'v': // Vertical tab
 		toReturn.nodetype = characterNode
 		toReturn.contents = append(toReturn.contents, rune(11))
-	case '-': // Literal hyphen
-		toReturn.nodetype = characterNode
-		toReturn.contents = append(toReturn.contents, '-')
+	case '-': // Literal hyphen - only in character class
+		if inCharClass {
+			toReturn.nodetype = characterNode
+			toReturn.contents = append(toReturn.contents, '-')
+		} else {
+			return postfixNode{}, fmt.Errorf("invalid escape character")
+		}
 	default: // None of the above - append it as a regular character
 		if isNormalChar(c) { // Normal characters cannot be escaped
 			return postfixNode{}, fmt.Errorf("invalid escape character")
--- a/regex/re_test.go
+++ b/regex/re_test.go
@ -117,7 +117,6 @@ var reTests = []struct {
 	{`\d{3,4}`, nil, "ababab555", []Group{{6, 9}}},
 	{`\bpaint\b`, nil, "paints", []Group{}},
 	{`\b\w{5}\b`, nil, "paint", []Group{{0, 5}}},
-	{`\w{}`, nil, "test", nil},
 	{`[^\w]`, nil, "abcdef1230[]qq';;'", []Group{{10, 11}, {11, 12}, {14, 15}, {15, 16}, {16, 17}, {17, 18}}},
 	{`[^\W]`, nil, "abcdef1230[]qq';;'", []Group{{0, 1}, {1, 2}, {2, 3}, {3, 4}, {4, 5}, {5, 6}, {6, 7}, {7, 8}, {8, 9}, {9, 10}, {12, 13}, {13, 14}}},
 	{`[\[\]]`, nil, "a[b[l]]", []Group{{1, 2}, {3, 4}, {5, 6}, {6, 7}}},
@ -546,22 +545,6 @@ var reTests = []struct {
 	{`\pN+`, nil, `123abc456def`, []Group{{0, 3}, {6, 9}}},
 	{`\PN+`, nil, `123abc456def`, []Group{{3, 6}, {9, 12}}},
 	{`[\p{Greek}\p{Cyrillic}]`, nil, `ΣωШД`, []Group{{0, 1}, {1, 2}, {2, 3}, {3, 4}}},
-
-	{`(?<=\().*?(?=\))`, nil, `(abc)`, []Group{{1, 4}}},
-
-	{`((a|b)\2)`, nil, `aa`, []Group{{0, 2}}},
-	{`((a|b)\2)`, nil, `bb`, []Group{{0, 2}}},
-	{`((a|b)\2)`, nil, `ab`, []Group{}},
-	{`((a|b)\2)`, nil, `ba`, []Group{}},
-
-	{`((a|b)\2){3}`, nil, `aaaaaa`, []Group{{0, 6}}},
-	{`((a|b)\2){3}`, nil, `bbbbbb`, []Group{{0, 6}}},
-	{`((a|b)\2){3}`, nil, `bbaaaa`, []Group{{0, 6}}},
-	{`((a|b)\2){3}`, nil, `aabbaa`, []Group{{0, 6}}},
-	{`((a|b)\2){3}`, nil, `aaaabb`, []Group{{0, 6}}},
-	{`((a|b)\2){3}`, nil, `bbaabb`, []Group{{0, 6}}},
-	{`((a|b)\2){3}`, nil, `baabab`, []Group{}},
-	{`((a|b)\2){3}`, nil, `bbabab`, []Group{}},
 }

 var groupTests = []struct {
--- a/regex/todo.txt
+++ b/regex/todo.txt
@ -4,5 +4,4 @@
 Ideas for flags:
    -m <num> : Print <num>th match (-m 1 = first match, -m 2 = second match)
    -g <num> : Print the <num>th group
-    -r : Specify a directory instead of a file, reads recursively
 4. Refactor code for flags - make each flag's code a function, which modifies the result of findAllMatches