1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
|
package main
// Takes one file as the `src` and another as the `check` (passed via -c).
// Ensures that all entries in `check` are in `src`, returning as missing all
// entries in `check` that are missing from `src`.
// To check all that are in `src` missing in `check`, you can firstly simply
// switch around the order of parameters, or otherwise use bt-present, which
// returns either a true or false that all entries on `src` are on `check`,
// which could be used to weed out any incorrect values on `src`.
import (
bt "badtudexo"
st "saggytrousers"
xl "github.com/xuri/excelize/v2"
"os"
"fmt"
)
func usage() {
fmt.Println(
`bt-missing: check whether entries on check are missing on src.
You must pass two files: a source file (src, passed as an argument) and
a check file (check, passed with --check). This script will iterate
over all entries in the check file, and output all which are missing on
the source file.
This script has fundmentally two uses.
The first is: given a larger file, check all which are _not_ on the
smaller file. To perform this, run:
bt-missing -c large.xlsx small.xlsx
The second is: expand the output of bt-present. bt-present returns a
boolean whether all entries on the source file are present in the
check file. If bt-present returns false, you may wish to get the
entries that are missing. To do this, invoke bt-missing with the
positions of the arguments reversed:
bt-present -c check.xlsx src.xlsx
bt-missing -c src.xlsx check.xlsx
This can be a little confusing - if in doubt, just switch them around
and see whichever one looks right!
You may specify the sheet and the columns to check against as flags
here so you do not need to specify them when the script is running.
You can additionally specify an output file with -o or --output; the
output of this command will be copied into the output file.
If the specific sheets and columns are known, it can help to pass them
as flags, saving you to have to confirm them when the program is
running.
Flags:
-h, --help Display this help message.
-c, --check The file to check against; you must pass this.
-ss, --ssheet The sheet to check against (for src).
-cs, --csheet The sheet to check against (for check).
-sc, --scolumn The column to check against (for src) as a string (i.e. not an index)
-cc, --ccolumn The column to check against (for check) as a string (i.e. not an index)
-o, --output The path of an output file to store the output in.
-q, --quiet Be quiet: do not return the results to stdout.
This means this script does not show if there are any
missing unless you also pass -o.
`)
os.Exit(0)
}
func parseArgs(args []string) {
var check bool = false
for i := 0; i < len(args); i++ {
arg := args[i]
switch arg {
case "-h", "--help", "help":
usage()
case "-c", "--check", "--ck":
i++
g_ckfile = args[i]
check = true
case "-cs", "--csheet", "--check-sheet", "--ck-sheet":
i++
g_cksheet = args[i]
case "-cc", "--ccolumn", "--check-column", "--ck-column":
i++
g_ckcol = args[i]
case "-ss", "--ssheet", "--source-sheet", "--src-sheet":
i++
g_srcsheet = args[i]
case "-sc", "--scolumn", "--source-column", "--src-column":
i++
g_srccol = args[i]
case "-o", "--out", "--output":
i++
g_out = args[i]
case "-q", "--quiet": // Do not print to stdout.
quiet = true
default:
g_srcfile = arg
}
}
if !check {
fmt.Println("You need to pass --check.")
os.Exit(-1)
}
if quiet && g_out == "" {
fmt.Println("You must pass --output if you pass -quiet.")
os.Exit(-1)
}
}
// Global Variables
var g_ckfile string
var g_cksheet string
var g_ckcol string
var g_srcfile string
var g_srcsheet string
var g_srccol string
var g_out string
var quiet bool = false
func main() {
args := os.Args
parseArgs(args)
/* Open the check and source files. */
// Load check file.
ck, err := xl.OpenFile(g_ckfile)
if err != nil {
fmt.Println("Could not open check file.")
return
}
// Load src file.
src, err := xl.OpenFile(g_srcfile)
if err != nil {
fmt.Println("Could not open src file.")
return
}
/* Select the sheet and the column to operate on for the two files. */
fmt.Println("Load the check file (you may be asked questions here.)")
cksheet := st.SelectSheet(ck, g_cksheet)
ckcol := st.SelectHeader(ck, cksheet, g_ckcol, /* exact: */ false)
fmt.Println("------ ------")
fmt.Println("Load the source file now (you may be asked questions here.)")
fmt.Println("------ ------")
srcsheet := st.SelectSheet(src, g_srcsheet)
srccol := st.SelectHeader(src, srcsheet, g_srccol, /* exact: */ false)
/* Grab the columns of each files which are to be processed with. */
ckrows, err := ck.GetCols(cksheet)
if err != nil {
fmt.Printf("Could not get the rows of sheet %s of the checkfile.\n", g_cksheet)
return
}
srcrows, err := src.GetCols(srcsheet)
if err != nil {
fmt.Printf("Could not get the rows of sheet %s of the sourcefile.\n", g_srcsheet)
return
}
ckrow := ckrows[ckcol]
srcrow := srcrows[srccol]
// Output what is checked against what.
// Actually, like, do the checks.
missing := bt.Missing(ckrow, srcrow)
// Write the output to stdout and to a file if -o passed.
printOutput(missing, g_out, cksheet, srcsheet, ckcol, srccol)
}
func writeBoth(quiet, write bool, file *os.File, str, errstr string) {
if !quiet { fmt.Printf(str) }
if write {
_, err := file.WriteString(str)
if err != nil {
fmt.Printf("Could not write to file %d", errstr)
}
}
}
func printOutput[T comparable](missing []bt.MissingValue[T], outputFile string,
cksheet, srcsheet string,
ckcol, srccol int) {
/* Determine whether to write to an --out file and open it if we are. */
writeFile := false
out, err := os.Create(outputFile)
if outputFile != "" && err != nil {
fmt.Println("Cannot open file to output.")
} else {
writeFile = true
}
/* The data which was checked against. */
writeBoth(quiet, writeFile, out, "--- Check File Information ---\n", "check file info")
writeBoth(quiet, writeFile, out, fmt.Sprintf("Filename: %s\n", g_ckfile), "check filename")
writeBoth(quiet, writeFile, out, fmt.Sprintf("Sheet: %s\n", cksheet), "check sheet")
writeBoth(quiet, writeFile, out, fmt.Sprintf("Column: %d\n", ckcol), "check column")
writeBoth(quiet, writeFile, out, "--- Source File Information ---\n", "source file info")
writeBoth(quiet, writeFile, out, fmt.Sprintf("Filename: %s\n", g_srcfile), "check filename")
writeBoth(quiet, writeFile, out, fmt.Sprintf("Sheet: %s\n", srcsheet), "source sheet")
writeBoth(quiet, writeFile, out, fmt.Sprintf("Column: %d\n", srccol), "source column")
/* Write all missing entries. */
for _, m := range missing {
str := fmt.Sprintf("Missing: \"%s\" at index %d.\n", m.Value, m.Index)
if !quiet { fmt.Printf(str) }
if writeFile {
_, err := out.WriteString(str)
if err != nil {
fmt.Printf("Cannot write missing entry %d to file\n", m.Index)
}
}
}
/* Write total missing entries. */
str := fmt.Sprintf("Total Missing: %d\n", len(missing))
if !quiet { fmt.Printf(str) }
if writeFile {
_, err := out.WriteString(str)
if err != nil {
fmt.Printf("Could not write total missing to file.")
}
}
}
|