From f068a053e1cfffc85816c163c11333bcefb9870f Mon Sep 17 00:00:00 2001 From: Muhammad Luthfi Fahlevi Date: Fri, 9 Aug 2024 15:00:00 +0700 Subject: [PATCH] refactor: make interface for query expr and implement to postgresql and elasticsearch --- core/asset/asset.go | 4 +- core/asset/discovery.go | 2 +- core/asset/service.go | 34 +- .../elasticsearch/discovery_repository.go | 38 +- internal/store/postgres/asset_repository.go | 83 +++- internal/workermanager/discovery_worker.go | 18 +- internal/workermanager/in_situ_worker.go | 7 + pkg/generic_helper/generic_helper.go | 2 +- pkg/query_expr/es_expr.go | 219 ++++++++++ .../equals-or-not-in-condition.json | 0 .../es_test_data}/in-condition.json | 0 .../es_test_data}/lt-condition.json | 0 pkg/query_expr/query_expr.go | 71 ++++ pkg/query_expr/sql_expr.go | 130 ++++++ pkg/translator/query_expr_translator.go | 380 ------------------ pkg/translator/query_expr_translator_test.go | 125 ------ 16 files changed, 550 insertions(+), 563 deletions(-) create mode 100644 pkg/query_expr/es_expr.go rename pkg/{translator/test-json => query_expr/es_test_data}/equals-or-not-in-condition.json (100%) rename pkg/{translator/test-json => query_expr/es_test_data}/in-condition.json (100%) rename pkg/{translator/test-json => query_expr/es_test_data}/lt-condition.json (100%) create mode 100644 pkg/query_expr/query_expr.go create mode 100644 pkg/query_expr/sql_expr.go delete mode 100644 pkg/translator/query_expr_translator.go delete mode 100644 pkg/translator/query_expr_translator_test.go diff --git a/core/asset/asset.go b/core/asset/asset.go index 6fddaf23..794f336a 100644 --- a/core/asset/asset.go +++ b/core/asset/asset.go @@ -12,7 +12,7 @@ import ( type Repository interface { GetAll(context.Context, Filter) ([]Asset, error) GetCount(context.Context, Filter) (int, error) - GetCountByQuery(context.Context, string) (int, error) + GetCountByQueryExpr(context.Context, string, bool) (int, error) GetByID(ctx context.Context, id string) (Asset, error) GetByURN(ctx context.Context, urn string) (Asset, error) GetVersionHistory(ctx context.Context, flt Filter, id string) ([]Asset, error) @@ -22,7 +22,7 @@ type Repository interface { Upsert(ctx context.Context, ast *Asset) (string, error) DeleteByID(ctx context.Context, id string) error DeleteByURN(ctx context.Context, urn string) error - DeleteByQuery(ctx context.Context, whereCondition string) ([]string, error) + DeleteByQueryExpr(ctx context.Context, queryExpr string) ([]string, error) AddProbe(ctx context.Context, assetURN string, probe *Probe) error GetProbes(ctx context.Context, assetURN string) ([]Probe, error) GetProbesWithFilter(ctx context.Context, flt ProbesFilter) (map[string][]Probe, error) diff --git a/core/asset/discovery.go b/core/asset/discovery.go index 4825a241..c7cbeef2 100644 --- a/core/asset/discovery.go +++ b/core/asset/discovery.go @@ -9,7 +9,7 @@ type DiscoveryRepository interface { Upsert(context.Context, Asset) error DeleteByID(ctx context.Context, assetID string) error DeleteByURN(ctx context.Context, assetURN string) error - DeleteByQuery(ctx context.Context, filterQuery string) error + DeleteByQueryExpr(ctx context.Context, filterQuery string) error Search(ctx context.Context, cfg SearchConfig) (results []SearchResult, err error) Suggest(ctx context.Context, cfg SearchConfig) (suggestions []string, err error) GroupAssets(ctx context.Context, cfg GroupConfig) (results []GroupResult, err error) diff --git a/core/asset/service.go b/core/asset/service.go index 2d22b92c..aee14979 100644 --- a/core/asset/service.go +++ b/core/asset/service.go @@ -4,8 +4,6 @@ import ( "context" "fmt" "github.com/google/uuid" - "github.com/goto/compass/pkg/generic_helper" - "github.com/goto/compass/pkg/translator" "go.opentelemetry.io/otel" "go.opentelemetry.io/otel/attribute" "go.opentelemetry.io/otel/metric" @@ -26,7 +24,7 @@ type Service struct { type Worker interface { EnqueueIndexAssetJob(ctx context.Context, ast Asset) error EnqueueDeleteAssetJob(ctx context.Context, urn string) error - EnqueueDeleteAssetsByQueryJob(ctx context.Context, filterQuery string) error + EnqueueDeleteAssetsByQueryExprJob(ctx context.Context, queryExpr string) error EnqueueSyncAssetJob(ctx context.Context, service string) error Close() error } @@ -129,26 +127,7 @@ func (s *Service) DeleteAsset(ctx context.Context, id string) (err error) { } func (s *Service) DeleteAssets(ctx context.Context, queryExpr string, dryRun bool) (affectedRows uint32, err error) { - queryExprTranslator := &translator.QueryExprTranslator{ - QueryExpr: queryExpr, - } - - // Check existence of required identifiers - identifiers := queryExprTranslator.GetIdentifiers() - mustExist := generic_helper.Contains(identifiers, "refreshed_at") && - generic_helper.Contains(identifiers, "type") && - generic_helper.Contains(identifiers, "service") - if !mustExist { - return 0, fmt.Errorf( - "must exists these identifiers: refreshed_at, type. Current identifiers: %v", identifiers) - } - - sqlWhereCondition, err := queryExprTranslator.ConvertToSQL() - if err != nil { - return 0, err - } - - total, err := s.assetRepository.GetCountByQuery(ctx, sqlWhereCondition) + total, err := s.assetRepository.GetCountByQueryExpr(ctx, queryExpr, true) if err != nil { return 0, err } @@ -157,18 +136,13 @@ func (s *Service) DeleteAssets(ctx context.Context, queryExpr string, dryRun boo return uint32(total), nil } - esFilterQuery, err := queryExprTranslator.ConvertToEsQuery() - if err != nil { - return 0, err - } - go func() { - urns, err := s.assetRepository.DeleteByQuery(ctx, sqlWhereCondition) + urns, err := s.assetRepository.DeleteByQueryExpr(ctx, queryExpr) if err != nil { return } - if err := s.worker.EnqueueDeleteAssetsByQueryJob(ctx, esFilterQuery); err != nil { + if err := s.worker.EnqueueDeleteAssetsByQueryExprJob(ctx, queryExpr); err != nil { return } diff --git a/internal/store/elasticsearch/discovery_repository.go b/internal/store/elasticsearch/discovery_repository.go index 68a57d85..09357c13 100644 --- a/internal/store/elasticsearch/discovery_repository.go +++ b/internal/store/elasticsearch/discovery_repository.go @@ -6,6 +6,8 @@ import ( "encoding/json" "errors" "fmt" + generichelper "github.com/goto/compass/pkg/generic_helper" + queryexpr "github.com/goto/compass/pkg/query_expr" "io" "net/url" "strings" @@ -24,6 +26,26 @@ type DiscoveryRepository struct { columnSearchExclusionList []string } +type DeleteAssetESExpr struct { + queryexpr.ESExpr +} + +func (d *DeleteAssetESExpr) Validate() error { + identifiers, err := queryexpr.GetIdentifiers(d.QueryExpr) + if err != nil { + return err + } + + mustExist := generichelper.Contains(identifiers, "refreshed_at") && + generichelper.Contains(identifiers, "type") && + generichelper.Contains(identifiers, "service") + if !mustExist { + return fmt.Errorf("must exists these identifiers: refreshed_at, type. Current identifiers: %v", identifiers) + } + + return nil +} + func NewDiscoveryRepository(cli *Client, logger log.Logger, requestTimeout time.Duration, colSearchExclusionList []string) *DiscoveryRepository { return &DiscoveryRepository{ cli: cli, @@ -144,12 +166,22 @@ func (repo *DiscoveryRepository) DeleteByURN(ctx context.Context, assetURN strin return repo.deleteWithQuery(ctx, "DeleteByURN", fmt.Sprintf(`{"query":{"term":{"urn.keyword": %q}}}`, assetURN)) } -func (repo *DiscoveryRepository) DeleteByQuery(ctx context.Context, filterQuery string) error { - if filterQuery == "" { +func (repo *DiscoveryRepository) DeleteByQueryExpr(ctx context.Context, queryExpr string) error { + if queryExpr == "" { return asset.ErrEmptyQuery } - return repo.deleteWithQuery(ctx, "DeleteByQuery", filterQuery) + deleteAssetESExpr := &DeleteAssetESExpr{ + queryexpr.ESExpr{ + QueryExpr: queryExpr, + }, + } + esQuery, err := queryexpr.ValidateAndGetQueryFromExpr(deleteAssetESExpr) + if err != nil { + return err + } + + return repo.deleteWithQuery(ctx, "DeleteByQueryExpr", esQuery) } func (repo *DiscoveryRepository) deleteWithQuery(ctx context.Context, discoveryOp, qry string) (err error) { diff --git a/internal/store/postgres/asset_repository.go b/internal/store/postgres/asset_repository.go index ed42261b..4c815d85 100644 --- a/internal/store/postgres/asset_repository.go +++ b/internal/store/postgres/asset_repository.go @@ -6,6 +6,8 @@ import ( "encoding/json" "errors" "fmt" + generichelper "github.com/goto/compass/pkg/generic_helper" + queryexpr "github.com/goto/compass/pkg/query_expr" "log" "strings" "time" @@ -17,9 +19,7 @@ import ( "github.com/r3labs/diff/v2" ) -const ( - batchSize = 1000 -) +const batchSize = 1000 // AssetRepository is a type that manages user operation to the primary database type AssetRepository struct { @@ -29,6 +29,26 @@ type AssetRepository struct { defaultUserProvider string } +type DeleteAssetSQLExpr struct { + queryexpr.SQLExpr +} + +func (d *DeleteAssetSQLExpr) Validate() error { + identifiers, err := queryexpr.GetIdentifiers(d.QueryExpr) + if err != nil { + return err + } + + mustExist := generichelper.Contains(identifiers, "refreshed_at") && + generichelper.Contains(identifiers, "type") && + generichelper.Contains(identifiers, "service") + if !mustExist { + return fmt.Errorf("must exists these identifiers: refreshed_at, type. Current identifiers: %v", identifiers) + } + + return nil +} + // GetAll retrieves list of assets with filters func (r *AssetRepository) GetAll(ctx context.Context, flt asset.Filter) ([]asset.Asset, error) { builder := r.getAssetSQL().Offset(uint64(flt.Offset)) @@ -117,8 +137,41 @@ func (r *AssetRepository) GetCount(ctx context.Context, flt asset.Filter) (int, return total, nil } -// GetCountByQuery retrieves number of assets for every type based on query -func (r *AssetRepository) GetCountByQuery(ctx context.Context, sqlQuery string) (int, error) { +// GetCountByQueryExpr retrieves number of assets for every type based on query expr +func (r *AssetRepository) GetCountByQueryExpr(ctx context.Context, queryExpr string, isDeleteExpr bool) (int, error) { + var sqlQuery string + if isDeleteExpr { + deleteExpr := &DeleteAssetSQLExpr{ + queryexpr.SQLExpr{ + QueryExpr: queryExpr, + }, + } + query, err := queryexpr.ValidateAndGetQueryFromExpr(deleteExpr) + if err != nil { + return 0, err + } + sqlQuery = query + } else { + sqlExpr := &queryexpr.SQLExpr{ + QueryExpr: queryExpr, + } + query, err := queryexpr.ValidateAndGetQueryFromExpr(sqlExpr) + if err != nil { + return 0, err + } + sqlQuery = query + } + + total, err := r.getCountByQuery(ctx, sqlQuery) + if err != nil { + return 0, err + } + + return total, err +} + +// GetCountByQueryExpr retrieves number of assets for every type based on query expr +func (r *AssetRepository) getCountByQuery(ctx context.Context, sqlQuery string) (int, error) { builder := sq.Select("count(1)"). From("assets"). Where(sqlQuery) @@ -371,13 +424,23 @@ func (r *AssetRepository) DeleteByURN(ctx context.Context, urn string) error { return nil } -func (r *AssetRepository) DeleteByQuery(ctx context.Context, whereCondition string) ([]string, error) { +func (r *AssetRepository) DeleteByQueryExpr(ctx context.Context, queryExpr string) ([]string, error) { var allURNs []string err := r.client.RunWithinTx(ctx, func(tx *sqlx.Tx) error { + deleteExpr := &DeleteAssetSQLExpr{ + queryexpr.SQLExpr{ + QueryExpr: queryExpr, + }, + } + query, err := queryexpr.ValidateAndGetQueryFromExpr(deleteExpr) + if err != nil { + return err + } + var lastID string for { // Fetch a batch of rows to delete using the last ID as a marker - urns, nextLastID, err := r.getAllURNsWithBatch(ctx, whereCondition, lastID) + urns, nextLastID, err := r.getAllURNsWithBatch(ctx, query, lastID) if err != nil { log.Printf("Failed to get batch to delete: %v", err) return err @@ -647,11 +710,7 @@ func (r *AssetRepository) update(ctx context.Context, assetID string, newAsset, onlyRefreshed := len(clog) == 1 && clog[0].Path[0] == "RefreshedAt" if onlyRefreshed { return r.client.RunWithinTx(ctx, func(tx *sqlx.Tx) error { - if err := r.updateAsset(ctx, tx, assetID, newAsset); err != nil { - return err - } - - return nil + return r.updateAsset(ctx, tx, assetID, newAsset) }) } diff --git a/internal/workermanager/discovery_worker.go b/internal/workermanager/discovery_worker.go index 6a2c70a9..23abac36 100644 --- a/internal/workermanager/discovery_worker.go +++ b/internal/workermanager/discovery_worker.go @@ -15,7 +15,7 @@ import ( type DiscoveryRepository interface { Upsert(context.Context, asset.Asset) error DeleteByURN(ctx context.Context, assetURN string) error - DeleteByQuery(ctx context.Context, filterQuery string) error + DeleteByQueryExpr(ctx context.Context, queryExpr string) error SyncAssets(ctx context.Context, indexName string) (cleanupFn func() error, err error) } @@ -159,13 +159,13 @@ func (m *Manager) DeleteAsset(ctx context.Context, job worker.JobSpec) error { return nil } -func (m *Manager) EnqueueDeleteAssetsByQueryJob(ctx context.Context, filterQuery string) error { +func (m *Manager) EnqueueDeleteAssetsByQueryExprJob(ctx context.Context, queryExpr string) error { err := m.worker.Enqueue(ctx, worker.JobSpec{ Type: jobDeleteAssetsByQuery, - Payload: ([]byte)(filterQuery), + Payload: ([]byte)(queryExpr), }) if err != nil { - return fmt.Errorf("enqueue delete asset job: %w: urn '%s'", err, filterQuery) + return fmt.Errorf("enqueue delete asset job: %w: query expr '%s'", err, queryExpr) } return nil @@ -173,7 +173,7 @@ func (m *Manager) EnqueueDeleteAssetsByQueryJob(ctx context.Context, filterQuery func (m *Manager) deleteAssetsByQueryHandler() worker.JobHandler { return worker.JobHandler{ - Handle: m.DeleteAssetsByQuery, + Handle: m.DeleteAssetsByQueryExpr, JobOpts: worker.JobOptions{ MaxAttempts: 3, Timeout: m.indexTimeout, @@ -182,11 +182,11 @@ func (m *Manager) deleteAssetsByQueryHandler() worker.JobHandler { } } -func (m *Manager) DeleteAssetsByQuery(ctx context.Context, job worker.JobSpec) error { - filterQuery := (string)(job.Payload) - if err := m.discoveryRepo.DeleteByQuery(ctx, filterQuery); err != nil { +func (m *Manager) DeleteAssetsByQueryExpr(ctx context.Context, job worker.JobSpec) error { + queryExpr := (string)(job.Payload) + if err := m.discoveryRepo.DeleteByQueryExpr(ctx, queryExpr); err != nil { return &worker.RetryableError{ - Cause: fmt.Errorf("delete asset from discovery repo: %w: query '%s'", err, filterQuery), + Cause: fmt.Errorf("delete asset from discovery repo: %w: query expr '%s'", err, queryExpr), } } return nil diff --git a/internal/workermanager/in_situ_worker.go b/internal/workermanager/in_situ_worker.go index 0bb28e33..dfdca828 100644 --- a/internal/workermanager/in_situ_worker.go +++ b/internal/workermanager/in_situ_worker.go @@ -40,6 +40,13 @@ func (m *InSituWorker) EnqueueDeleteAssetJob(ctx context.Context, urn string) er return nil } +func (m *InSituWorker) EnqueueDeleteAssetsByQueryExprJob(ctx context.Context, queryExpr string) error { + if err := m.discoveryRepo.DeleteByQueryExpr(ctx, queryExpr); err != nil { + return fmt.Errorf("delete asset from discovery repo: %w: query expr '%s'", err, queryExpr) + } + return nil +} + func (m *InSituWorker) EnqueueSyncAssetJob(ctx context.Context, service string) error { const batchSize = 1000 diff --git a/pkg/generic_helper/generic_helper.go b/pkg/generic_helper/generic_helper.go index 559f2c45..178f1114 100644 --- a/pkg/generic_helper/generic_helper.go +++ b/pkg/generic_helper/generic_helper.go @@ -1,4 +1,4 @@ -package generic_helper +package generichelper // Contains checks if a target item exists in an array of any type. func Contains[T comparable](arr []T, target T) bool { diff --git a/pkg/query_expr/es_expr.go b/pkg/query_expr/es_expr.go new file mode 100644 index 00000000..cab7d9a6 --- /dev/null +++ b/pkg/query_expr/es_expr.go @@ -0,0 +1,219 @@ +package queryexpr + +import ( + "encoding/json" + "fmt" + "github.com/expr-lang/expr/ast" +) + +type ESExpr struct { + QueryExpr string + ESQuery map[string]interface{} +} + +// ToQuery default +func (e *ESExpr) ToQuery() (string, error) { + queryExprParsed, err := GetTreeNodeFromQueryExpr(e.QueryExpr) + if err != nil { + return "", err + } + + esQueryInterface := e.translateToEsQuery(queryExprParsed) + esQuery, ok := esQueryInterface.(map[string]interface{}) + if !ok { + return "", fmt.Errorf("failed to generate Elasticsearch query") + } + e.ESQuery = map[string]interface{}{"query": esQuery} + + // Convert to JSON + queryJSON, err := json.Marshal(e.ESQuery) + if err != nil { + return "", err + } + + return string(queryJSON), nil +} + +// Validate default: no validation +func (*ESExpr) Validate() error { + return nil +} + +// translateToEsQuery The idea came from ast.Walk. Currently, the development focus implement for the node type that most likely used in our needs. +// TODO: implement translator for node type that still not covered right now. +func (e *ESExpr) translateToEsQuery(node *ast.Node) interface{} { + if *node == nil { + return nil + } + switch n := (*node).(type) { + case *ast.BinaryNode: + return e.translateBinaryNodeToEsQuery(n) + case *ast.NilNode: + return nil + case *ast.IdentifierNode: + return n.Value + case *ast.IntegerNode: + return n.Value + case *ast.FloatNode: + return n.Value + case *ast.BoolNode: + return n.Value + case *ast.StringNode: + return n.Value + case *ast.UnaryNode: + return e.translateUnaryNodeToEsQuery(n) + case *ast.ArrayNode: + return e.translateArrayNodeToEsQuery(n) + case *ast.ConstantNode: + return n.Value + case *ast.BuiltinNode: + result, err := GetQueryExprResult(n.String()) + if err != nil { + return nil + } + return result + case *ast.ConditionalNode: + result, err := GetQueryExprResult(n.String()) + if err != nil { + return nil + } + if nodeV, ok := result.(ast.Node); ok { + return e.translateToEsQuery(&nodeV) + } + } + + return nil +} + +func (e *ESExpr) translateBinaryNodeToEsQuery(n *ast.BinaryNode) map[string]interface{} { + left := e.translateToEsQuery(&n.Left) + right := e.translateToEsQuery(&n.Right) + + switch n.Operator { + case "&&": + return e.boolQuery("must", left, right) + case "||": + return e.boolQuery("should", left, right) + case "==": + return e.termQuery(left.(string), right) + case "!=": + return e.mustNotQuery(left.(string), right) + case "<", "<=", ">", ">=": + return e.rangeQuery(left.(string), e.operatorToEsQuery(n.Operator), right) + case "in": + return e.termsQuery(left.(string), right) + default: + return nil + } +} + +func (e *ESExpr) translateUnaryNodeToEsQuery(n *ast.UnaryNode) interface{} { + switch n.Operator { + case "not": + if binaryNode, ok := n.Node.(*ast.BinaryNode); ok && binaryNode.Operator == "in" { + left := e.translateToEsQuery(&binaryNode.Left) + right := e.translateToEsQuery(&binaryNode.Right) + return e.mustNotTermsQuery(left.(string), right) + } + return nil + case "!": + nodeValue := e.translateToEsQuery(&n.Node) + switch value := nodeValue.(type) { + case bool: + return !value + default: + return map[string]interface{}{ + "bool": map[string]interface{}{ + "must_not": []interface{}{nodeValue}, + }, + } + } + default: + return nil + } +} + +func (e *ESExpr) translateArrayNodeToEsQuery(n *ast.ArrayNode) []interface{} { + values := make([]interface{}, len(n.Nodes)) + for i, node := range n.Nodes { + values[i] = e.translateToEsQuery(&node) + } + return values +} + +func (*ESExpr) operatorToEsQuery(operator string) string { + switch operator { + case ">": + return "gt" + case ">=": + return "gte" + case "<": + return "lt" + case "<=": + return "lte" + } + + return operator +} + +func (*ESExpr) boolQuery(condition string, left, right interface{}) map[string]interface{} { + return map[string]interface{}{ + "bool": map[string]interface{}{ + condition: []interface{}{left, right}, + }, + } +} + +func (*ESExpr) termQuery(field string, value interface{}) map[string]interface{} { + return map[string]interface{}{ + "term": map[string]interface{}{ + field: value, + }, + } +} + +func (*ESExpr) mustNotQuery(field string, value interface{}) map[string]interface{} { + return map[string]interface{}{ + "bool": map[string]interface{}{ + "must_not": []interface{}{ + map[string]interface{}{ + "term": map[string]interface{}{ + field: value, + }, + }, + }, + }, + } +} + +func (*ESExpr) rangeQuery(field, operator string, value interface{}) map[string]interface{} { + return map[string]interface{}{ + "range": map[string]interface{}{ + field: map[string]interface{}{ + operator: value, + }, + }, + } +} + +func (*ESExpr) termsQuery(field string, values interface{}) map[string]interface{} { + return map[string]interface{}{ + "terms": map[string]interface{}{ + field: values, + }, + } +} + +func (*ESExpr) mustNotTermsQuery(field string, values interface{}) map[string]interface{} { + return map[string]interface{}{ + "bool": map[string]interface{}{ + "must_not": []interface{}{ + map[string]interface{}{ + "terms": map[string]interface{}{ + field: values, + }, + }, + }, + }, + } +} diff --git a/pkg/translator/test-json/equals-or-not-in-condition.json b/pkg/query_expr/es_test_data/equals-or-not-in-condition.json similarity index 100% rename from pkg/translator/test-json/equals-or-not-in-condition.json rename to pkg/query_expr/es_test_data/equals-or-not-in-condition.json diff --git a/pkg/translator/test-json/in-condition.json b/pkg/query_expr/es_test_data/in-condition.json similarity index 100% rename from pkg/translator/test-json/in-condition.json rename to pkg/query_expr/es_test_data/in-condition.json diff --git a/pkg/translator/test-json/lt-condition.json b/pkg/query_expr/es_test_data/lt-condition.json similarity index 100% rename from pkg/translator/test-json/lt-condition.json rename to pkg/query_expr/es_test_data/lt-condition.json diff --git a/pkg/query_expr/query_expr.go b/pkg/query_expr/query_expr.go new file mode 100644 index 00000000..cf85d2de --- /dev/null +++ b/pkg/query_expr/query_expr.go @@ -0,0 +1,71 @@ +package queryexpr + +import ( + "fmt" + "github.com/expr-lang/expr" + "github.com/expr-lang/expr/ast" + "github.com/expr-lang/expr/parser" +) + +type ExprStr interface { + ToQuery() (string, error) + Validate() error +} + +type QueryExpr struct { + Identifiers []string +} + +type ExprParam map[string]interface{} + +func ValidateAndGetQueryFromExpr(exprStr ExprStr) (string, error) { + if err := exprStr.Validate(); err != nil { + return "", err + } + sqlQuery, err := exprStr.ToQuery() + if err != nil { + return "", err + } + + return sqlQuery, nil +} + +func (s *QueryExpr) Visit(node *ast.Node) { + if n, ok := (*node).(*ast.IdentifierNode); ok { + s.Identifiers = append(s.Identifiers, n.Value) + } +} + +func GetIdentifiers(queryExpr string) ([]string, error) { + queryExprParsed, err := GetTreeNodeFromQueryExpr(queryExpr) + if err != nil { + return nil, err + } + queryExprVisitor := &QueryExpr{} + ast.Walk(queryExprParsed, queryExprVisitor) + return queryExprVisitor.Identifiers, nil +} + +func GetTreeNodeFromQueryExpr(queryExpr string) (*ast.Node, error) { + parsed, err := parser.Parse(queryExpr) + if err != nil { + return nil, fmt.Errorf("error parsing expression: %w", err) + } + + return &parsed.Node, nil +} + +func GetQueryExprResult(fn string) (any, error) { + env := make(ExprParam) + compile, err := expr.Compile(fn) + if err != nil { + return nil, fmt.Errorf("failed to compile function '%s': %w", fn, err) + } + + result, err := expr.Run(compile, env) + if err != nil { + return nil, fmt.Errorf("failed to evaluate function '%s': %w", fn, err) + } + + return result, nil +} diff --git a/pkg/query_expr/sql_expr.go b/pkg/query_expr/sql_expr.go new file mode 100644 index 00000000..3f2ac6fa --- /dev/null +++ b/pkg/query_expr/sql_expr.go @@ -0,0 +1,130 @@ +package queryexpr + +import ( + "fmt" + "github.com/expr-lang/expr/ast" + "strconv" + "strings" +) + +type SQLExpr struct { + QueryExpr string + SQLQuery strings.Builder +} + +// ToQuery default +func (s *SQLExpr) ToQuery() (string, error) { + queryExprParsed, err := GetTreeNodeFromQueryExpr(s.QueryExpr) + if err != nil { + return "", err + } + s.ConvertToSQL(queryExprParsed) + return s.SQLQuery.String(), nil +} + +// Validate default: no validation +func (*SQLExpr) Validate() error { + return nil +} + +// ConvertToSQL The idea came from ast.Walk. Currently, the development focus implement for the node type that most likely used in our needs. +// TODO: implement translator for node type that still not covered right now. +func (s *SQLExpr) ConvertToSQL(node *ast.Node) { + if *node == nil { + return + } + switch n := (*node).(type) { + case *ast.BinaryNode: + s.SQLQuery.WriteString("(") + s.ConvertToSQL(&n.Left) + + // write operator + operator := s.operatorToSQL(n) + s.SQLQuery.WriteString(fmt.Sprintf(" %s ", strings.ToUpper(operator))) + + s.ConvertToSQL(&n.Right) + s.SQLQuery.WriteString(")") + case *ast.NilNode: + s.SQLQuery.WriteString("NULL") + case *ast.IdentifierNode: + s.SQLQuery.WriteString(n.Value) + case *ast.IntegerNode: + s.SQLQuery.WriteString(strconv.FormatInt(int64(n.Value), 10)) + case *ast.FloatNode: + s.SQLQuery.WriteString(strconv.FormatFloat(n.Value, 'f', -1, 64)) + case *ast.BoolNode: + s.SQLQuery.WriteString(strconv.FormatBool(n.Value)) + case *ast.StringNode: + s.SQLQuery.WriteString(fmt.Sprintf("'%s'", n.Value)) + case *ast.ConstantNode: + s.SQLQuery.WriteString(fmt.Sprintf("%s", n.Value)) + case *ast.UnaryNode: + s.patchUnaryNode(n) + s.ConvertToSQL(&n.Node) + case *ast.BuiltinNode: + result, err := GetQueryExprResult(n.String()) + if err != nil { + return + } + s.SQLQuery.WriteString(fmt.Sprintf("%s", result)) + case *ast.ArrayNode: + s.SQLQuery.WriteString("(") + for i := range n.Nodes { + s.ConvertToSQL(&n.Nodes[i]) + if i != len(n.Nodes)-1 { + s.SQLQuery.WriteString(", ") + } + } + s.SQLQuery.WriteString(")") + case *ast.ConditionalNode: + result, err := GetQueryExprResult(n.String()) + if err != nil { + return + } + if nodeV, ok := result.(ast.Node); ok { + s.ConvertToSQL(&nodeV) + } + } +} + +func (*SQLExpr) patchUnaryNode(n *ast.UnaryNode) { + switch n.Operator { + case "not": + binaryNode, ok := (n.Node).(*ast.BinaryNode) + if ok && binaryNode.Operator == "in" { + ast.Patch(&n.Node, &ast.BinaryNode{ + Operator: "not in", + Left: binaryNode.Left, + Right: binaryNode.Right, + }) + } + case "!": + switch nodeV := n.Node.(type) { + case *ast.BoolNode: + ast.Patch(&n.Node, &ast.BoolNode{ + Value: !nodeV.Value, + }) + // TODO: adjust other types if needed + } + } +} + +func (*SQLExpr) operatorToSQL(bn *ast.BinaryNode) string { + switch { + case bn.Operator == "&&": + return "AND" + case bn.Operator == "||": + return "OR" + case bn.Operator == "!=": + if _, ok := bn.Right.(*ast.NilNode); ok { + return "IS NOT" + } + case bn.Operator == "==": + if _, ok := bn.Right.(*ast.NilNode); ok { + return "IS" + } + return "=" + } + + return bn.Operator +} diff --git a/pkg/translator/query_expr_translator.go b/pkg/translator/query_expr_translator.go deleted file mode 100644 index 2e06392d..00000000 --- a/pkg/translator/query_expr_translator.go +++ /dev/null @@ -1,380 +0,0 @@ -package translator - -import ( - "encoding/json" - "errors" - "fmt" - "github.com/expr-lang/expr" - "github.com/expr-lang/expr/ast" - "github.com/expr-lang/expr/parser" - "log" - "strconv" - "strings" -) - -type ExprParam map[string]interface{} - -type QueryExprTranslator struct { - QueryExpr string - SqlQuery strings.Builder - EsQuery map[string]interface{} - Identifiers []string -} - -func (q *QueryExprTranslator) Visit(node *ast.Node) { - if n, ok := (*node).(*ast.IdentifierNode); ok { - q.Identifiers = append(q.Identifiers, n.Value) - } -} - -func (q *QueryExprTranslator) GetIdentifiers() []string { - ast.Walk(q.getTreeNodeFromQueryExpr(), q) - return q.Identifiers -} - -func (q *QueryExprTranslator) getTreeNodeFromQueryExpr() *ast.Node { - parsed, err := parser.Parse(q.QueryExpr) - if err != nil { - log.Fatalf("Error parsing expression: %v", err) - } - - return &parsed.Node -} - -func (q *QueryExprTranslator) ConvertToSQL() (string, error) { - q.SqlQuery = strings.Builder{} - q.translateToSQL(q.getTreeNodeFromQueryExpr(), q) - return q.SqlQuery.String(), nil -} - -// translateToSQL The idea came from ast.Walk. Currently, the development focus implement for the node type that most likely used in our needs. -// TODO: implement translator for node type that still not covered right now. -func (q *QueryExprTranslator) translateToSQL(node *ast.Node, translator *QueryExprTranslator) { - if *node == nil { - return - } - switch n := (*node).(type) { - case *ast.BinaryNode: - translator.SqlQuery.WriteString("(") - q.translateToSQL(&n.Left, translator) - - // write operator - operator := q.operatorToSQL(n) - translator.SqlQuery.WriteString(fmt.Sprintf(" %s ", strings.ToUpper(operator))) - - q.translateToSQL(&n.Right, translator) - translator.SqlQuery.WriteString(")") - case *ast.NilNode: - translator.SqlQuery.WriteString(fmt.Sprintf("%s", "NULL")) - case *ast.IdentifierNode: - translator.SqlQuery.WriteString(n.Value) - case *ast.IntegerNode: - translator.SqlQuery.WriteString(strconv.FormatInt(int64(n.Value), 10)) - case *ast.FloatNode: - translator.SqlQuery.WriteString(strconv.FormatFloat(n.Value, 'f', -1, 64)) - case *ast.BoolNode: - translator.SqlQuery.WriteString(strconv.FormatBool(n.Value)) - case *ast.StringNode: - translator.SqlQuery.WriteString(fmt.Sprintf("'%s'", n.Value)) - case *ast.ConstantNode: - translator.SqlQuery.WriteString(fmt.Sprintf("%s", n.Value)) - case *ast.UnaryNode: - switch n.Operator { - case "not": - binaryNode, ok := (n.Node).(*ast.BinaryNode) - if ok && binaryNode.Operator == "in" { - ast.Patch(&n.Node, &ast.BinaryNode{ - Operator: "not in", - Left: binaryNode.Left, - Right: binaryNode.Right, - }) - } - case "!": - switch nodeV := n.Node.(type) { - case *ast.BoolNode: - ast.Patch(&n.Node, &ast.BoolNode{ - Value: !nodeV.Value, - }) - // adjust other type if needed - } - } - q.translateToSQL(&n.Node, translator) - case *ast.BuiltinNode: - result, err := q.getQueryExprResult(n.String()) - if err != nil { - return - } - translator.SqlQuery.WriteString(fmt.Sprintf("%s", result)) - case *ast.ArrayNode: - translator.SqlQuery.WriteString("(") - for i := range n.Nodes { - q.translateToSQL(&n.Nodes[i], translator) - if i != len(n.Nodes)-1 { - translator.SqlQuery.WriteString(", ") - } - } - translator.SqlQuery.WriteString(")") - case *ast.ConditionalNode: - result, err := q.getQueryExprResult(n.String()) - if err != nil { - return - } - if nodeV, ok := result.(ast.Node); ok { - q.translateToSQL(&nodeV, translator) - } - case *ast.ChainNode: - case *ast.MemberNode: - case *ast.SliceNode: - case *ast.CallNode: - case *ast.ClosureNode: - case *ast.PointerNode: - case *ast.VariableDeclaratorNode: - case *ast.MapNode: - case *ast.PairNode: - default: - panic(fmt.Sprintf("undefined node type (%T)", node)) - } -} - -func (q *QueryExprTranslator) getQueryExprResult(fn string) (any, error) { - env := make(ExprParam) - compile, err := expr.Compile(fn) - if err != nil { - return nil, fmt.Errorf("failed to compile function '%s': %w", fn, err) - } - - result, err := expr.Run(compile, env) - if err != nil { - return nil, fmt.Errorf("failed to evaluate function '%s': %w", fn, err) - } - - return result, nil -} - -func (q *QueryExprTranslator) operatorToSQL(bn *ast.BinaryNode) string { - switch { - case bn.Operator == "&&": - return "AND" - case bn.Operator == "||": - return "OR" - case bn.Operator == "!=": - if _, ok := bn.Right.(*ast.NilNode); ok { - return "IS NOT" - } - case bn.Operator == "==": - if _, ok := bn.Right.(*ast.NilNode); ok { - return "IS" - } else { - return "=" - } - } - - return bn.Operator -} - -func (q *QueryExprTranslator) ConvertToEsQuery() (string, error) { - esQueryInterface := q.translateToEsQuery(q.getTreeNodeFromQueryExpr()) - esQuery, ok := esQueryInterface.(map[string]interface{}) - if !ok { - return "", errors.New("failed to generate Elasticsearch query") - } - q.EsQuery = map[string]interface{}{"query": esQuery} - - // Convert to JSON - queryJSON, err := json.Marshal(q.EsQuery) - if err != nil { - return "", err - } - - return string(queryJSON), nil -} - -// translateToEsQuery The idea came from ast.Walk. Currently, the development focus implement for the node type that most likely used in our needs. -// TODO: implement translator for node type that still not covered right now. -func (q *QueryExprTranslator) translateToEsQuery(node *ast.Node) interface{} { - if *node == nil { - return nil - } - switch n := (*node).(type) { - case *ast.BinaryNode: - return q.translateBinaryNodeToEsQuery(n) - case *ast.NilNode: - return nil - case *ast.IdentifierNode: - return n.Value - case *ast.IntegerNode: - return n.Value - case *ast.FloatNode: - return n.Value - case *ast.BoolNode: - return n.Value - case *ast.StringNode: - return n.Value - case *ast.UnaryNode: - return q.translateUnaryNodeToEsQuery(n) - case *ast.ArrayNode: - return q.translateArrayNodeToEsQuery(n) - case *ast.ConstantNode: - return n.Value - case *ast.BuiltinNode: - result, err := q.getQueryExprResult(n.String()) - if err != nil { - return nil - } - return result - case *ast.ConditionalNode: - result, err := q.getQueryExprResult(n.String()) - if err != nil { - return nil - } - if nodeV, ok := result.(ast.Node); ok { - return q.translateToEsQuery(&nodeV) - } - case *ast.ChainNode: - case *ast.MemberNode: - case *ast.SliceNode: - case *ast.CallNode: - case *ast.ClosureNode: - case *ast.PointerNode: - case *ast.VariableDeclaratorNode: - case *ast.MapNode: - case *ast.PairNode: - default: - panic(fmt.Sprintf("undefined node type (%T)", node)) - } - - return nil -} - -func (q *QueryExprTranslator) translateBinaryNodeToEsQuery(n *ast.BinaryNode) map[string]interface{} { - left := q.translateToEsQuery(&n.Left) - right := q.translateToEsQuery(&n.Right) - - switch n.Operator { - case "&&": - return q.boolQuery("must", left, right) - case "||": - return q.boolQuery("should", left, right) - case "==": - return q.termQuery(left.(string), right) - case "!=": - return q.mustNotQuery(left.(string), right) - case "<", "<=", ">", ">=": - return q.rangeQuery(left.(string), q.operatorToEsQuery(n.Operator), right) - case "in": - return q.termsQuery(left.(string), right) - default: - return nil - } -} - -func (q *QueryExprTranslator) translateUnaryNodeToEsQuery(n *ast.UnaryNode) interface{} { - switch n.Operator { - case "not": - if binaryNode, ok := n.Node.(*ast.BinaryNode); ok && binaryNode.Operator == "in" { - left := q.translateToEsQuery(&binaryNode.Left) - right := q.translateToEsQuery(&binaryNode.Right) - return q.mustNotTermsQuery(left.(string), right) - } - return nil - case "!": - nodeValue := q.translateToEsQuery(&n.Node) - switch value := nodeValue.(type) { - case bool: - return !value - default: - return map[string]interface{}{ - "bool": map[string]interface{}{ - "must_not": []interface{}{nodeValue}, - }, - } - } - default: - return nil - } -} - -func (q *QueryExprTranslator) translateArrayNodeToEsQuery(n *ast.ArrayNode) []interface{} { - values := make([]interface{}, len(n.Nodes)) - for i, node := range n.Nodes { - values[i] = q.translateToEsQuery(&node) - } - return values -} - -func (q *QueryExprTranslator) operatorToEsQuery(operator string) string { - switch operator { - case ">": - return "gt" - case ">=": - return "gte" - case "<": - return "lt" - case "<=": - return "lte" - } - - return operator -} - -func (q *QueryExprTranslator) boolQuery(condition string, left, right interface{}) map[string]interface{} { - return map[string]interface{}{ - "bool": map[string]interface{}{ - condition: []interface{}{left, right}, - }, - } -} - -func (q *QueryExprTranslator) termQuery(field string, value interface{}) map[string]interface{} { - return map[string]interface{}{ - "term": map[string]interface{}{ - field: value, - }, - } -} - -func (q *QueryExprTranslator) mustNotQuery(field string, value interface{}) map[string]interface{} { - return map[string]interface{}{ - "bool": map[string]interface{}{ - "must_not": []interface{}{ - map[string]interface{}{ - "term": map[string]interface{}{ - field: value, - }, - }, - }, - }, - } -} - -func (q *QueryExprTranslator) rangeQuery(field, operator string, value interface{}) map[string]interface{} { - return map[string]interface{}{ - "range": map[string]interface{}{ - field: map[string]interface{}{ - operator: value, - }, - }, - } -} - -func (q *QueryExprTranslator) termsQuery(field string, values interface{}) map[string]interface{} { - return map[string]interface{}{ - "terms": map[string]interface{}{ - field: values, - }, - } -} - -func (q *QueryExprTranslator) mustNotTermsQuery(field string, values interface{}) map[string]interface{} { - return map[string]interface{}{ - "bool": map[string]interface{}{ - "must_not": []interface{}{ - map[string]interface{}{ - "terms": map[string]interface{}{ - field: values, - }, - }, - }, - }, - } -} diff --git a/pkg/translator/query_expr_translator_test.go b/pkg/translator/query_expr_translator_test.go deleted file mode 100644 index 23d329ed..00000000 --- a/pkg/translator/query_expr_translator_test.go +++ /dev/null @@ -1,125 +0,0 @@ -package translator - -import ( - "encoding/json" - "fmt" - "io/ioutil" - "reflect" - "testing" -) - -func TestQueryExprTranslator_ConvertToEsQuery(t *testing.T) { - tests := []struct { - name string - queryExprTranslator *QueryExprTranslator - want string - wantErr bool - }{ - { - name: "less than condition", - queryExprTranslator: &QueryExprTranslator{ - QueryExpr: `updated_at < "2024-04-05 23:59:59"`, - }, - want: "test-json/lt-condition.json", - wantErr: false, - }, - { - name: "in condition", - queryExprTranslator: &QueryExprTranslator{ - QueryExpr: `service in ["test1","test2","test3"]`, - }, - want: "test-json/in-condition.json", - wantErr: false, - }, - { - name: "equals or not in condition", - queryExprTranslator: &QueryExprTranslator{ - QueryExpr: `name == "John" || service not in ["test1","test2","test3"]`, - }, - want: "test-json/equals-or-not-in-condition.json", - wantErr: false, - }, - } - for _, tt := range tests { - t.Run(tt.name, func(t *testing.T) { - got, err := tt.queryExprTranslator.ConvertToEsQuery() - if (err != nil) != tt.wantErr { - t.Errorf("ConvertToEsQuery() error = %v, wantErr %v", err, tt.wantErr) - return - } - if !deepEqual(tt.want, tt.queryExprTranslator.EsQuery) { - t.Errorf("ConvertToEsQuery() got = %v, want equal to json in file: %v", got, tt.want) - } - }) - } -} - -func TestQueryExprTranslator_ConvertToSQL(t *testing.T) { - tests := []struct { - name string - queryExprTranslator *QueryExprTranslator - want string - wantErr bool - }{ - { - name: "less than condition", - queryExprTranslator: &QueryExprTranslator{ - QueryExpr: `updated_at < "2024-04-05 23:59:59"`, - }, - want: `(updated_at < '2024-04-05 23:59:59')`, - wantErr: false, - }, - { - name: "in condition", - queryExprTranslator: &QueryExprTranslator{ - QueryExpr: `service in ["test1","test2","test3"]`, - }, - want: `(service IN ('test1', 'test2', 'test3'))`, - wantErr: false, - }, - { - name: "equals or not in condition", - queryExprTranslator: &QueryExprTranslator{ - QueryExpr: `name == "John" || service not in ["test1","test2","test3"]`, - }, - want: `((name = 'John') OR (service NOT IN ('test1', 'test2', 'test3')))`, - wantErr: false, - }, - } - for _, tt := range tests { - t.Run(tt.name, func(t *testing.T) { - got, err := tt.queryExprTranslator.ConvertToSQL() - if (err != nil) != tt.wantErr { - t.Errorf("ConvertToSQL() error = %v, wantErr %v", err, tt.wantErr) - return - } - if got != tt.want { - t.Errorf("ConvertToSQL() got = %v, want %v", got, tt.want) - } - }) - } -} - -func deepEqual(jsonFileName string, result map[string]interface{}) bool { - // Step 1: Read the JSON file - fileContent, err := ioutil.ReadFile(jsonFileName) - if err != nil { - fmt.Println("Error reading the file:", err) - return false - } - - // Step 2: Unmarshal the file content into a Go data structure - var fileData map[string]interface{} - err = json.Unmarshal(fileContent, &fileData) - if err != nil { - fmt.Println("Error unmarshalling the file content:", err) - return false - } - - // Step 4: Compare the two Go data structures - if reflect.DeepEqual(fileData, result) { - return true - } else { - return false - } -}