From 0382b6b3bb46a91edc5961a82ad6754409c766ce Mon Sep 17 00:00:00 2001 From: Hadi <112569860+anotherhadi@users.noreply.github.com> Date: Sat, 27 Sep 2025 21:36:02 +0200 Subject: [PATCH] revert Signed-off-by: Hadi <112569860+anotherhadi@users.noreply.github.com> --- leak-utils/parquet/parquet.go | 24 +++++++----------------- 1 file changed, 7 insertions(+), 17 deletions(-) diff --git a/leak-utils/parquet/parquet.go b/leak-utils/parquet/parquet.go index 6071958..af6b7c1 100644 --- a/leak-utils/parquet/parquet.go +++ b/leak-utils/parquet/parquet.go @@ -189,26 +189,16 @@ func configureColumns(input Parquet, skipLineFormating bool) []ColumnOperation { func transformParquet(lu settings.LeakUtils, input, output Parquet, operations []ColumnOperation, deleteFirstRow, printQuery bool) error { var selectClauses []string - var columnsLength []string hasColumns := false for _, op := range operations { - escapedOriginalName := escapeColumnName(op.OriginalName) - if op.Action != "drop" { hasColumns = true - - originalSelectName := op.OriginalName if op.Action == "rename" { - originalSelectName = op.OriginalName - selectClauses = append(selectClauses, fmt.Sprintf("%s AS \"%s\"", originalSelectName, op.NewName)) + selectClauses = append(selectClauses, fmt.Sprintf("%s AS \"%s\"", op.OriginalName, op.NewName)) } else { - selectClauses = append(selectClauses, originalSelectName) + selectClauses = append(selectClauses, op.OriginalName) } - - columnsLength = append(columnsLength, fmt.Sprintf("COALESCE(LENGTH(\"%s\"),0)", escapedOriginalName)) - } else { - columnsLength = append(columnsLength, fmt.Sprintf("COALESCE(LENGTH(\"%s\"),0)", escapedOriginalName)) } } @@ -222,6 +212,10 @@ func transformParquet(lu settings.LeakUtils, input, output Parquet, operations [ compression = ", COMPRESSION '" + output.Compression + "'" } + columnsLength := []string{} + for _, col := range input.Columns { + columnsLength = append(columnsLength, "COALESCE(LENGTH(\""+col+"\"),0)") + } allowedRowSize := 30 * len(input.Columns) offset := "" if deleteFirstRow { @@ -230,7 +224,7 @@ func transformParquet(lu settings.LeakUtils, input, output Parquet, operations [ query := fmt.Sprintf(` COPY ( - SELECT %s  + SELECT %s FROM read_parquet('%s') WHERE (%s) < %d %s ) TO '%s' (FORMAT PARQUET, ROW_GROUP_SIZE 200_000 %s) @@ -288,7 +282,3 @@ func GetParquet(db *sql.DB, inputFile string) (parquet *Parquet, err error) { return } - -func escapeColumnName(name string) string { - return strings.ReplaceAll(name, "\"", "\"\"") -}