-
Notifications
You must be signed in to change notification settings - Fork 1
/
Copy pathkdtree.go
302 lines (265 loc) · 8.52 KB
/
kdtree.go
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
package img2ansi
import (
"container/heap"
"sort"
)
// ColorNode represents a node in a KD-tree that stores RGB colors. Each node
// contains a color, a left child, a right child, and the axis along which the
// colors are split.
type ColorNode struct {
Color RGB
Left, Right *ColorNode
SplitAxis int
}
// buildKDTree constructs a KD-tree from a list of RGB colors, optimized for
// ANSI color matching. This implementation is particularly effective for
// ANSI art because:
//
// - It preserves subtle shade differences crucial in limited color palettes
// like ANSI.
// - It maintains determinism, ensuring consistent output across runs, which
// is important for reproducible ANSI art generation.
// - It balances the tree effectively without over-optimizing, which works
// well with the relatively small ANSI color space.
// - It handles the discrete nature of ANSI colors well by carefully
// managing axis splitting and duplicate color values.
//
// The function takes a list of colors, the current depth, and the maximum
// depth of the tree as arguments, and returns the root node of the KD-tree.
// The resulting tree structure allows for efficient nearest-neighbor
// searches in the ANSI color space, crucial for mapping arbitrary RGB colors
// to the closest ANSI representation.
func buildKDTree(colors []RGB, depth int, maxDepth int) *ColorNode {
// Base case: stop recursion if we've reached max depth or have no colors
if len(colors) == 0 || depth >= maxDepth {
return nil
}
// Choose splitting axis based on the dimension with the largest range
// This preserves the actual distribution of colors in the dataset,
// helping to maintain subtle shade differences
axis := chooseSplitAxis(colors)
// Sort colors deterministically. This ensures consistency between
// runs while minimally altering the tree structure
sort.Slice(colors, func(i, j int) bool {
iComp := getColorComponent(colors[i], axis)
jComp := getColorComponent(colors[j], axis)
if iComp != jComp {
return iComp < jComp
}
// Tie-breakers: ensure full determinism even with equal axis values
if colors[i].R != colors[j].R {
return colors[i].R < colors[j].R
}
if colors[i].G != colors[j].G {
return colors[i].G < colors[j].G
}
return colors[i].B < colors[j].B
})
median := len(colors) / 2
// Handle duplicate values at the median
// This prevents arbitrary splitting of identical colors, which could
// cause inconsistencies
for median < len(colors)-1 && getColorComponent(colors[median], axis) ==
getColorComponent(colors[median+1], axis) {
median++
}
// Create and return the node, recursively building left and right subtrees
// Using the median as split point generally creates a balanced tree
return &ColorNode{
Color: colors[median],
Left: buildKDTree(colors[:median], depth+1, maxDepth),
Right: buildKDTree(colors[median+1:], depth+1, maxDepth),
SplitAxis: axis,
}
}
// chooseSplitAxis selects the axis with the largest color range
// This helps to preserve the color variations in the dataset
func chooseSplitAxis(colors []RGB) int {
minR, maxR := colors[0].R, colors[0].R
minG, maxG := colors[0].G, colors[0].G
minB, maxB := colors[0].B, colors[0].B
// Find the min and max values for each color component
for _, c := range colors {
minR = min(minR, c.R)
maxR = max(maxR, c.R)
minG = min(minG, c.G)
maxG = max(maxG, c.G)
minB = min(minB, c.B)
maxB = max(maxB, c.B)
}
// Calculate the range for each color component
rangeR := maxR - minR
rangeG := maxG - minG
rangeB := maxB - minB
// Return the axis with the largest range
// This ensures we split along the axis with the most color variation
if rangeR >= rangeG && rangeR >= rangeB {
return 0 // R axis
} else if rangeG >= rangeB {
return 1 // G axis
}
return 2 // B axis
}
// getColorComponent returns the color component of an RGB color along the
// specified axis. The function takes an RGB color and an axis index as input
// and returns the corresponding color component.
func getColorComponent(color RGB, axis int) uint8 {
switch axis {
case 0:
return color.R
case 1:
return color.G
default:
return color.B
}
}
// getCandidateColors finds the k-nearest neighbors of the colors in a block
// using a KD-tree. The function takes a block of colors, the depth of the
// search, and the number of neighbors to find as input, and returns a slice
// of colors sorted by distance.
func (node *ColorNode) getCandidateColors(
block [4]RGB,
depth int,
) colorDistanceSlice {
// Find initial candidates using KD-tree and sort by distance
var candidateColors colorDistanceSlice
seenColors := make(map[RGB]bool)
// Process block colors in a consistent order
sortedBlockColors := make(sortableRGB, len(block))
for i, c := range block {
sortedBlockColors[i] = c
}
sort.Sort(sortedBlockColors)
for _, color := range sortedBlockColors {
nearest := node.kNearestNeighbors(color, depth)
for _, c := range nearest {
if _, seen := seenColors[c]; !seen {
distance := color.colorDistance(c)
candidateColors = append(candidateColors,
colorWithDistance{
c,
distance,
len(candidateColors)})
seenColors[c] = true
}
}
}
return candidateColors
}
// nearestNeighbor finds the nearest neighbor of a target color in a KD-tree.
// The function takes the root node of the KD-tree, the target color, the best
// color found so far, the best distance found so far, and the depth of the
// search as input, and returns the nearest neighbor and the distance to it.
func (node *ColorNode) nearestNeighbor(
target RGB, best RGB, bestDist float64, depth int) (RGB, float64) {
if node == nil {
return best, bestDist
}
dist := node.Color.colorDistance(target)
if dist < bestDist {
best = node.Color
bestDist = dist
}
axis := depth % 3
var next, other *ColorNode
switch axis {
case 0:
if target.R < node.Color.R {
next, other = node.Left, node.Right
} else {
next, other = node.Right, node.Left
}
case 1:
if target.G < node.Color.G {
next, other = node.Left, node.Right
} else {
next, other = node.Right, node.Left
}
default:
if target.B < node.Color.B {
next, other = node.Left, node.Right
} else {
next, other = node.Right, node.Left
}
}
best, bestDist = next.nearestNeighbor(target, best, bestDist, depth+1)
// Check if we need to search the other branch
var axisDistance float64
switch axis {
case 0:
axisDistance = float64(target.R - node.Color.R)
case 1:
axisDistance = float64(target.G - node.Color.G)
default:
axisDistance = float64(target.B - node.Color.B)
}
if axisDistance*axisDistance < bestDist {
best, bestDist = other.nearestNeighbor(
target, best, bestDist, depth+1)
}
return best, bestDist
}
// ColorDistance is a helper struct to keep track of colors and their
// distances
type ColorDistance struct {
color RGB
distance float64
}
// kNearestNeighbors finds the k-nearest neighbors of a target color in a
// KD-tree. The function takes the root node of the KD-tree, the target color,
// and the number of neighbors to find as input, and returns a slice of colors
// sorted by distance.
func (node *ColorNode) kNearestNeighbors(target RGB, k int) []RGB {
allColors := node.getAllColors()
if len(allColors) <= k {
return allColors
}
pq := make(PriorityQueue, 0, k)
heap.Init(&pq)
for _, color := range allColors {
dist := color.colorDistance(target)
if pq.Len() < k {
heap.Push(&pq, ColorDistance{color, dist})
} else if dist < pq[0].distance {
heap.Pop(&pq)
heap.Push(&pq, ColorDistance{color, dist})
}
}
result := make([]RGB, k)
for i := k - 1; i >= 0; i-- {
result[i] = heap.Pop(&pq).(ColorDistance).color
}
return result
}
func (node *ColorNode) getAllColors() []RGB {
if node == nil {
return nil
}
colors := []RGB{node.Color}
colors = append(colors, node.Left.getAllColors()...)
colors = append(colors, node.Right.getAllColors()...)
return colors
}
func (node *ColorNode) Serialize() []byte {
if node == nil {
return []byte{0} // Null node
}
data := []byte{1} // Non-null node
data = append(data, node.Color.R, node.Color.G, node.Color.B)
data = append(data, byte(node.SplitAxis))
data = append(data, node.Left.Serialize()...)
data = append(data, node.Right.Serialize()...)
return data
}
func DeserializeKDTree(data []byte) (*ColorNode, []byte) {
if len(data) == 0 || data[0] == 0 {
return nil, data[1:]
}
node := &ColorNode{
Color: RGB{data[1], data[2], data[3]},
SplitAxis: int(data[4]),
}
node.Left, data = DeserializeKDTree(data[5:])
node.Right, data = DeserializeKDTree(data)
return node, data
}