From 83b4ea70c6859765e820c8da0f210daadbacfe0b Mon Sep 17 00:00:00 2001 From: George Abbott Date: Fri, 3 Nov 2023 19:35:47 +0000 Subject: Commit all --- main.go | 236 ++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++ 1 file changed, 236 insertions(+) create mode 100644 main.go (limited to 'main.go') diff --git a/main.go b/main.go new file mode 100644 index 0000000..faeaf3b --- /dev/null +++ b/main.go @@ -0,0 +1,236 @@ +package main + +// Takes one file as the `src` and another as the `check` (passed via -c). +// Ensures that all entries in `check` are in `src`, returning as missing all +// entries in `check` that are missing from `src`. +// To check all that are in `src` missing in `check`, you can firstly simply +// switch around the order of parameters, or otherwise use bt-present, which +// returns either a true or false that all entries on `src` are on `check`, +// which could be used to weed out any incorrect values on `src`. + +import ( + bt "badtudexo" + st "saggytrousers" + xl "github.com/xuri/excelize/v2" + "os" + "fmt" +) + +func usage() { + fmt.Println( +`bt-missing: check whether entries on check are missing on src. + +You must pass two files: a source file (src, passed as an argument) and +a check file (check, passed with --check). This script will iterate +over all entries in the check file, and output all which are missing on +the source file. + +This script has fundmentally two uses. + +The first is: given a larger file, check all which are _not_ on the +smaller file. To perform this, run: + bt-missing -c large.xlsx small.xlsx + +The second is: expand the output of bt-present. bt-present returns a +boolean whether all entries on the source file are present in the +check file. If bt-present returns false, you may wish to get the +entries that are missing. To do this, invoke bt-missing with the +positions of the arguments reversed: + bt-present -c check.xlsx src.xlsx + bt-missing -c src.xlsx check.xlsx +This can be a little confusing - if in doubt, just switch them around +and see whichever one looks right! + +You may specify the sheet and the columns to check against as flags +here so you do not need to specify them when the script is running. + +You can additionally specify an output file with -o or --output; the +output of this command will be copied into the output file. + +If the specific sheets and columns are known, it can help to pass them +as flags, saving you to have to confirm them when the program is +running. + +Flags: +-h, --help Display this help message. +-c, --check The file to check against; you must pass this. +-ss, --ssheet The sheet to check against (for src). +-cs, --csheet The sheet to check against (for check). +-sc, --scolumn The column to check against (for src) as a string (i.e. not an index) +-cc, --ccolumn The column to check against (for check) as a string (i.e. not an index) +-o, --output The path of an output file to store the output in. +-q, --quiet Be quiet: do not return the results to stdout. + This means this script does not show if there are any + missing unless you also pass -o. +`) + os.Exit(0) +} + +func parseArgs(args []string) { + var check bool = false + + for i := 0; i < len(args); i++ { + arg := args[i] + switch arg { + case "-h", "--help", "help": + usage() + case "-c", "--check", "--ck": + i++ + g_ckfile = args[i] + check = true + case "-cs", "--csheet", "--check-sheet", "--ck-sheet": + i++ + g_cksheet = args[i] + case "-cc", "--ccolumn", "--check-column", "--ck-column": + i++ + g_ckcol = args[i] + case "-ss", "--ssheet", "--source-sheet", "--src-sheet": + i++ + g_srcsheet = args[i] + case "-sc", "--scolumn", "--source-column", "--src-column": + i++ + g_srccol = args[i] + case "-o", "--out", "--output": + i++ + g_out = args[i] + case "-q", "--quiet": // Do not print to stdout. + quiet = true + + default: + g_srcfile = arg + } + } + + if !check { + fmt.Println("You need to pass --check.") + os.Exit(-1) + } + + if quiet && g_out == "" { + fmt.Println("You must pass --output if you pass -quiet.") + os.Exit(-1) + } +} + +// Global Variables +var g_ckfile string +var g_cksheet string +var g_ckcol string +var g_srcfile string +var g_srcsheet string +var g_srccol string +var g_out string +var quiet bool = false + +func main() { + args := os.Args + parseArgs(args) + +/* Open the check and source files. */ + // Load check file. + ck, err := xl.OpenFile(g_ckfile) + if err != nil { + fmt.Println("Could not open check file.") + return + } + // Load src file. + src, err := xl.OpenFile(g_srcfile) + if err != nil { + fmt.Println("Could not open src file.") + return + } + +/* Select the sheet and the column to operate on for the two files. */ + fmt.Println("Load the check file (you may be asked questions here.)") + cksheet := st.SelectSheet(ck, g_cksheet) + ckcol := st.SelectHeader(ck, cksheet, g_ckcol, /* exact: */ false) + + + fmt.Println("------ ------") + fmt.Println("Load the source file now (you may be asked questions here.)") + fmt.Println("------ ------") + srcsheet := st.SelectSheet(src, g_srcsheet) + srccol := st.SelectHeader(src, srcsheet, g_srccol, /* exact: */ false) + +/* Grab the columns of each files which are to be processed with. */ + ckrows, err := ck.GetCols(cksheet) + if err != nil { + fmt.Printf("Could not get the rows of sheet %s of the checkfile.\n", g_cksheet) + return + } + srcrows, err := src.GetCols(srcsheet) + if err != nil { + fmt.Printf("Could not get the rows of sheet %s of the sourcefile.\n", g_srcsheet) + return + } + ckrow := ckrows[ckcol] + srcrow := srcrows[srccol] + + // Output what is checked against what. + + + // Actually, like, do the checks. + missing := bt.Missing(ckrow, srcrow) + + // Write the output to stdout and to a file if -o passed. + printOutput(missing, g_out, cksheet, srcsheet, ckcol, srccol) +} + +func writeBoth(quiet, write bool, file *os.File, str, errstr string) { + if !quiet { fmt.Printf(str) } + if write { + _, err := file.WriteString(str) + if err != nil { + fmt.Printf("Could not write to file %d", errstr) + } + } +} + +func printOutput[T comparable](missing []bt.MissingValue[T], outputFile string, + cksheet, srcsheet string, + ckcol, srccol int) { + +/* Determine whether to write to an --out file and open it if we are. */ + writeFile := false + out, err := os.Create(outputFile) + if outputFile != "" && err != nil { + fmt.Println("Cannot open file to output.") + } else { + writeFile = true + } + +/* The data which was checked against. */ + writeBoth(quiet, writeFile, out, "--- Check File Information ---\n", "check file info") + writeBoth(quiet, writeFile, out, fmt.Sprintf("Filename: %s\n", g_ckfile), "check filename") + writeBoth(quiet, writeFile, out, fmt.Sprintf("Sheet: %s\n", cksheet), "check sheet") + writeBoth(quiet, writeFile, out, fmt.Sprintf("Column: %d\n", ckcol), "check column") + + writeBoth(quiet, writeFile, out, "--- Source File Information ---\n", "source file info") + writeBoth(quiet, writeFile, out, fmt.Sprintf("Filename: %s\n", g_srcfile), "check filename") + writeBoth(quiet, writeFile, out, fmt.Sprintf("Sheet: %s\n", srcsheet), "source sheet") + writeBoth(quiet, writeFile, out, fmt.Sprintf("Column: %d\n", srccol), "source column") + + +/* Write all missing entries. */ + for _, m := range missing { + str := fmt.Sprintf("Missing: \"%s\" at index %d.\n", m.Value, m.Index) + if !quiet { fmt.Printf(str) } + if writeFile { + _, err := out.WriteString(str) + if err != nil { + fmt.Printf("Cannot write missing entry %d to file\n", m.Index) + } + } + } + +/* Write total missing entries. */ + str := fmt.Sprintf("Total Missing: %d\n", len(missing)) + if !quiet { fmt.Printf(str) } + if writeFile { + _, err := out.WriteString(str) + if err != nil { + fmt.Printf("Could not write total missing to file.") + } + } + +} -- cgit v1.2.1