-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathiterator.go
81 lines (64 loc) · 1.63 KB
/
iterator.go
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
package main
import (
"regexp"
"strings"
)
// Mapping ties a column name to the faker type that should be applied to it.
//
// Col is compared for exact equality against the column names parsed from a
// COPY line, and Faker is copied into the Type field of the Anonymizer that is
// built for a matching column.
type Mapping struct {
	Col, Faker string
}
// Iterator holds the state needed to process a dump one line at a time.
type Iterator struct {
	// Mappings is the list of column-to-faker assignments consulted whenever a
	// new COPY line is seen.
	Mappings []Mapping

	// table is the value extracted from the most recent COPY line; the empty
	// string means no table is currently active.
	table string
	// columns holds the normalized column names parsed from the COPY line.
	columns []string
	// transformers holds one Anonymizer per entry of columns, in the same order.
	transformers []Anonymizer
}
// ProcessLine consumes one line of the dump and returns the line to emit.
//
//   - A line starting with "COPY" is handed to processTable, which records the
//     table and its columns; the line itself is returned unchanged.
//   - The COPY end-of-data marker `\.` clears the active table and is returned
//     unchanged.
//   - While a table is active, any other non-blank line is treated as a data
//     row and rewritten by processRow.
//   - Everything else (blank lines, or lines seen while no table is active)
//     clears the active table and is returned unchanged.
func (i *Iterator) ProcessLine(line string) string {
	switch {
	case strings.HasPrefix(line, "COPY"):
		i.processTable(line)
		return line
	case strings.TrimRight(line, "\r\n") == `\.`:
		// `\.` terminates the COPY data block. It is not a row, so it must not
		// be run through the transformers: doing so would let the first
		// column's faker overwrite the marker.
		i.table = ""
		return line
	case i.table != "" && strings.TrimSpace(line) != "":
		return i.processRow(line)
	default:
		i.table = ""
		return line
	}
}
// processTable updates the iterator state from a COPY line: it stores the
// table value and the column names extracted from the line, then builds one
// transformer per column from i.Mappings.
//
// NOTE(review): Gsub is defined outside this block; presumably it returns the
// text captured by the pattern's group — confirm against its definition.
func (i *Iterator) processTable(line string) {
	name := Gsub(line, "^COPY (.*?) .*$")
	columnList := Gsub(line, `^COPY (?:.*?) \((.*)\).*$`)
	parsed := getColumns(columnList)

	i.table = name
	i.columns = parsed
	i.transformers = getTransformers(parsed, i.Mappings)
}
// processRow rewrites one tab-separated data row. Each field is passed through
// the transformer at the same position, and the results are joined back with
// tabs.
//
// Fields beyond the number of known transformers are returned unchanged. This
// can happen when the row has more fields than columns were parsed from the
// COPY line; indexing i.transformers for those fields would otherwise panic
// with an index-out-of-range error.
func (i Iterator) processRow(line string) string {
	values := strings.Split(line, "\t")
	for index, value := range values {
		if index >= len(i.transformers) {
			// No transformer is known for this or any later field.
			break
		}
		// values is a fresh slice from Split, so it is safe to overwrite in place.
		values[index] = i.transformers[index].Fake(value)
	}
	return strings.Join(values, "\t")
}
// columnQuotes matches a single double-quote character. It is compiled once at
// package scope instead of once per column.
var columnQuotes = regexp.MustCompile(`"`)

// getColumns splits a comma-separated column list and normalizes every entry:
// surrounding whitespace is trimmed, all double quotes are removed, and the
// result is lowercased. The returned slice has one element per comma-separated
// entry, in input order; an empty input yields a single empty name.
func getColumns(columns string) []string {
	parts := strings.Split(columns, ",")
	names := make([]string, len(parts))
	for idx, part := range parts {
		name := strings.TrimSpace(part)
		name = columnQuotes.ReplaceAllString(name, "")
		names[idx] = strings.ToLower(name)
	}
	return names
}
// getTransformers builds one Anonymizer per column, in column order. Each
// Anonymizer's Type is the Faker of the mapping that getMapping returns for
// that column, which is the empty string when the column has no mapping.
func getTransformers(columns []string, mappings []Mapping) []Anonymizer {
	anonymizers := make([]Anonymizer, 0, len(columns))
	for _, name := range columns {
		faker := getMapping(mappings, name).Faker
		anonymizers = append(anonymizers, Anonymizer{Type: faker})
	}
	return anonymizers
}
// getMapping returns the first entry of mappings whose Col equals column
// exactly. When no entry matches, it returns a Mapping for that column with an
// empty Faker.
func getMapping(mappings []Mapping, column string) Mapping {
	for idx := range mappings {
		if candidate := mappings[idx]; candidate.Col == column {
			return candidate
		}
	}
	// No match: Faker is left at its zero value, the empty string.
	return Mapping{Col: column}
}