feat: scanning string with sql tokenizer
This commit is contained in:
parent
6fe01c4821
commit
518316c4f7
5
go.mod
Normal file
5
go.mod
Normal file
@ -0,0 +1,5 @@
|
|||||||
|
module query-inter
|
||||||
|
|
||||||
|
go 1.23.7
|
||||||
|
|
||||||
|
require github.com/DataDog/go-sqllexer v0.1.3
|
10
go.sum
Normal file
10
go.sum
Normal file
@ -0,0 +1,10 @@
|
|||||||
|
github.com/DataDog/go-sqllexer v0.1.3 h1:Kl2T6QVndMEZqQSY8rkoltYP+LVNaA54N+EwAMc9N5w=
|
||||||
|
github.com/DataDog/go-sqllexer v0.1.3/go.mod h1:KwkYhpFEVIq+BfobkTC1vfqm4gTi65skV/DpDBXtexc=
|
||||||
|
github.com/davecgh/go-spew v1.1.1 h1:vj9j/u1bqnvCEfJOwUhtlOARqs3+rkHYY13jYWTU97c=
|
||||||
|
github.com/davecgh/go-spew v1.1.1/go.mod h1:J7Y8YcW2NihsgmVo/mv3lAwl/skON4iLHjSsI+c5H38=
|
||||||
|
github.com/pmezard/go-difflib v1.0.0 h1:4DBwDE0NGyQoBHbLQYPwSUPoCMWR5BEzIk/f1lZbAQM=
|
||||||
|
github.com/pmezard/go-difflib v1.0.0/go.mod h1:iKH77koFhYxTK1pcRnkKkqfTogsbg7gZNVY4sRDYZ/4=
|
||||||
|
github.com/stretchr/testify v1.8.4 h1:CcVxjf3Q8PM0mHUKJCdn+eZZtm5yQwehR5yeSVQQcUk=
|
||||||
|
github.com/stretchr/testify v1.8.4/go.mod h1:sz/lmYIOXD/1dqDmKjjqLyZ2RngseejIcXlSw2iwfAo=
|
||||||
|
gopkg.in/yaml.v3 v3.0.1 h1:fxVm/GzAzEWqLHuvctI91KS9hhNmmWOoWu0XTYJS7CA=
|
||||||
|
gopkg.in/yaml.v3 v3.0.1/go.mod h1:K4uyk7z7BCEPqu6E+C64Yfv1cQ7kz7rIZviUmN+EgEM=
|
83
main.go
Normal file
83
main.go
Normal file
@ -0,0 +1,83 @@
|
|||||||
|
package main
|
||||||
|
|
||||||
|
import (
|
||||||
|
"fmt"
|
||||||
|
"github.com/DataDog/go-sqllexer"
|
||||||
|
)
|
||||||
|
|
||||||
|
type TokenGroupType int
|
||||||
|
|
||||||
|
const (
|
||||||
|
TOKEN_OTHER TokenGroupType = iota
|
||||||
|
TOKEN_ACT // SELECT, CREATE, etc
|
||||||
|
TOKEN_FILTER // WHERE, AND, etc
|
||||||
|
TOKEN_RELATE // joins
|
||||||
|
TOKEN_DEFINE // column data types, etc
|
||||||
|
TOKEN_CONTROL // sorting, etc
|
||||||
|
)
|
||||||
|
|
||||||
|
var tokenGroupMap = map[sqllexer.TokenType]TokenGroupType{
|
||||||
|
sqllexer.ERROR: TOKEN_OTHER,
|
||||||
|
sqllexer.EOF: TOKEN_OTHER,
|
||||||
|
sqllexer.SPACE: TOKEN_OTHER,
|
||||||
|
sqllexer.STRING: TOKEN_DEFINE,
|
||||||
|
sqllexer.INCOMPLETE_STRING: TOKEN_DEFINE,
|
||||||
|
sqllexer.NUMBER: TOKEN_DEFINE,
|
||||||
|
sqllexer.IDENT: TOKEN_ACT, // for table/column names
|
||||||
|
sqllexer.QUOTED_IDENT: TOKEN_RELATE, // for joins
|
||||||
|
sqllexer.OPERATOR: TOKEN_FILTER,
|
||||||
|
sqllexer.WILDCARD: TOKEN_ACT,
|
||||||
|
sqllexer.COMMENT: TOKEN_OTHER,
|
||||||
|
sqllexer.MULTILINE_COMMENT: TOKEN_OTHER,
|
||||||
|
sqllexer.PUNCTUATION: TOKEN_OTHER,
|
||||||
|
sqllexer.DOLLAR_QUOTED_FUNCTION: TOKEN_DEFINE,
|
||||||
|
sqllexer.DOLLAR_QUOTED_STRING: TOKEN_DEFINE,
|
||||||
|
sqllexer.POSITIONAL_PARAMETER: TOKEN_FILTER,
|
||||||
|
sqllexer.BIND_PARAMETER: TOKEN_FILTER,
|
||||||
|
sqllexer.FUNCTION: TOKEN_DEFINE,
|
||||||
|
sqllexer.SYSTEM_VARIABLE: TOKEN_DEFINE,
|
||||||
|
sqllexer.UNKNOWN: TOKEN_OTHER,
|
||||||
|
sqllexer.COMMAND: TOKEN_ACT,
|
||||||
|
sqllexer.KEYWORD: TOKEN_ACT,
|
||||||
|
sqllexer.JSON_OP: TOKEN_DEFINE,
|
||||||
|
sqllexer.BOOLEAN: TOKEN_DEFINE,
|
||||||
|
sqllexer.NULL: TOKEN_DEFINE,
|
||||||
|
sqllexer.PROC_INDICATOR: TOKEN_OTHER,
|
||||||
|
sqllexer.CTE_INDICATOR: TOKEN_OTHER,
|
||||||
|
sqllexer.ALIAS_INDICATOR: TOKEN_OTHER,
|
||||||
|
}
|
||||||
|
|
||||||
|
func GetTokenGroupType(tokenType sqllexer.TokenType) (TokenGroupType, bool, bool) {
|
||||||
|
group, exists := tokenGroupMap[tokenType]
|
||||||
|
isStart := false
|
||||||
|
isEnd := false
|
||||||
|
|
||||||
|
if !exists {
|
||||||
|
group = TOKEN_OTHER
|
||||||
|
}
|
||||||
|
|
||||||
|
if group == TOKEN_ACT {
|
||||||
|
isStart = true
|
||||||
|
}
|
||||||
|
|
||||||
|
if tokenType == sqllexer.EOF ||
|
||||||
|
(group == TOKEN_OTHER && tokenType == sqllexer.PUNCTUATION) {
|
||||||
|
isEnd = true
|
||||||
|
}
|
||||||
|
|
||||||
|
return group, isStart, isEnd
|
||||||
|
}
|
||||||
|
|
||||||
|
func main() {
|
||||||
|
query := "SELECT * FROM users \n WHERE id = something AND SELECT;"
|
||||||
|
lexer := sqllexer.New(query)
|
||||||
|
for {
|
||||||
|
token := lexer.Scan()
|
||||||
|
tokenGroup, isStart, isEnd := GetTokenGroupType(token.Type)
|
||||||
|
fmt.Println(token.Value, token.Type, tokenGroup, isStart, isEnd)
|
||||||
|
|
||||||
|
if token.Type == sqllexer.EOF {
|
||||||
|
break
|
||||||
|
}
|
||||||
|
}
|
||||||
|
}
|
Loading…
x
Reference in New Issue
Block a user