summaryrefslogtreecommitdiff
path: root/split.go
blob: bfcf47424a8a1cf8a0041dfb1b4381aca66bf45f (plain) (blame)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
package badtudexo

import (
	"fmt"
	"strings"
	"os"
	xl "git.gabbott.dev/george/excelize/v2"
	st "saggytrousers"
)

type SplitAlgorithm int 
const (
	IndivAlgorithm SplitAlgorithm = iota + 1
	GroupAlgorithm
)

const SaveDirectory string = "bt-split"

// rows [][]any must NOT include the header. 
func indivSplit(rows [][]any, header []string, index int, dir, fn string) {
	st.Log(false, "bt.indivSplit: index (%v), dir (%v), fn (%v).", index, dir, fn)
	var uniq []any
	saveDir := fmt.Sprintf("%s/%s", dir, SaveDirectory)
	st.Log(false, "bt.indivSplit: saveDir = %v\n", saveDir)
	os.Mkdir(saveDir, 0777)

	// First pass: get all the unique values. 
	for _, row := range rows {
		v := row[index]
		if !st.InSliceAny(uniq, v) {
			uniq = append(uniq, v)
		}
	}

	// Rest of the passes: for each unique value, grab them and chuck all 
	// entries matching it to a file, then save it. 
	count, total := 0, 0
	for _, v := range uniq {
		//if (n == 0) { /* change for _, ... to: for n, ... if using
		//	// Skip the first one, as it is the header.
		//	continue
		//}
		pos := 1 
		suffix := deriveSplitSuffix(v)
		filename  := st.CreateFilepath(dir, SaveDirectory, fn, suffix)
		sheetname := st.MakeValidSheetName(st.CreateFilename(fn, suffix))


		// Create the new file, and append the header to it. 
		file := xl.NewFile()
		file.SetSheetName("Sheet1", sheetname)
		st.AppendToFile(file, sheetname, header, pos)
		pos++ 

		// Now add each matching row to the file as well. 
		for _, row := range rows {
			sv := row[index]
			if sv == v {
				st.AppendToFile(file, sheetname, row, pos)
				pos++
			}
		}

		// Finally, save the file, close it, and we can do it all again 
		// for the next unique value.
		filename = fmt.Sprintf("%s.xlsx", filename) 
		if err := file.SaveAs(filename); err != nil {
			st.ErrLog(true, "Unable to save [%s]\n", filename)
		} else {
			st.Log(true, "Saved [%s]\n", filename)
			count++
		}
		total++
	}
	st.Log(true, "Saved %v of %v files successfully.\n", count, total)
}

func deriveSplitSuffix(str any) string {
	s:= fmt.Sprintf("%v", str)
	if strings.HasSuffix(s,  "UTC") {
		return s[0:10]
	}

	return s
}

// func groupSplit(rows [][]string, header []string, index int, dir, fn string) map[string]*xl.File {
// }
// 
// func groupSave(m map[string]*xl.File) { 
// }



// Takes rows, and splits on the given index. Then saves each of these splits 
// as a separate file at the specified location and with the specified name. 
// rows must NOT include the header.
func Split(rows [][]any, header []string, index int, 
                         dir, filename string, 
			 algo SplitAlgorithm) {

	switch algo {
	case IndivAlgorithm:
		st.Log(false, "badtudexo.Split: algorithm = IndivAlgorithm\n")
		indivSplit(rows, header, index, dir, filename)
	// case GroupAlgorithm:
	// 	// TODO: implement these again.
	// 	m := groupSplit(rows, header, index, dir, filename)
	// 	groupSave(m)
	default:
		st.ErrLog(true, "badtudexo.Split received an invalid algorithm.\n")
		os.Exit(-1)
	}
}