-
Notifications
You must be signed in to change notification settings - Fork 1
/
Copy pathimg2ansi.go
396 lines (354 loc) · 11.7 KB
/
img2ansi.go
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
package img2ansi
import (
"fmt"
"gocv.io/x/gocv"
_ "image/png"
"math"
"time"
)
const (
// ESC is the ASCII escape character (U+001B).
// NOTE(review): presumably the prefix for emitted ANSI control sequences;
// the rendering code that would use it is not visible here — confirm.
ESC = "\u001b"
)
var (
// TargetWidth is the width ImageToANSI starts from when sizing the output.
TargetWidth = 100
// ScaleFactor divides the computed output height in ImageToANSI and is
// also forwarded to saveBlocksToPNG for the debug rendering.
ScaleFactor = 3.0
// MaxChars is the largest ANSI string length ImageToANSI will return
// before it retries with a narrower width.
MaxChars = 1048576
// NOTE(review): Quantization is not referenced in the code visible here;
// its meaning must be confirmed against its users.
Quantization = 1
// KdSearch selects the search strategy in findBestBlockRepresentation:
// 0 forces the exhaustive palette search, any other value is used (capped
// by the palette size) as the argument to the trees' getCandidateColors.
KdSearch = 0
// CacheThreshold is compared against DistinctColors; while DistinctColors
// is below it, the exhaustive search is used regardless of KdSearch.
CacheThreshold = 50.0
// blocks lists every supported block glyph together with the quadrants
// that the glyph paints with the foreground color.
blocks = []blockDef{
{' ', Quadrants{false, false, false, false}}, // Empty space
{'▘', Quadrants{true, false, false, false}}, // Quadrant upper left
{'▝', Quadrants{false, true, false, false}}, // Quadrant upper right
{'▀', Quadrants{true, true, false, false}}, // Upper half block
{'▖', Quadrants{false, false, true, false}}, // Quadrant lower left
{'▌', Quadrants{true, false, true, false}}, // Left half block
{'▞', Quadrants{false, true, true, false}}, // Quadrant diagonal upper right and lower left
{'▛', Quadrants{true, true, true, false}}, // Three quadrants: upper left, upper right, lower left
{'▗', Quadrants{false, false, false, true}}, // Quadrant lower right
{'▚', Quadrants{true, false, false, true}}, // Quadrant diagonal upper left and lower right
{'▐', Quadrants{false, true, false, true}}, // Right half block
{'▜', Quadrants{true, true, false, true}}, // Three quadrants: upper left, upper right, lower right
{'▄', Quadrants{false, false, true, true}}, // Lower half block
{'▙', Quadrants{true, false, true, true}}, // Three quadrants: upper left, lower left, lower right
{'▟', Quadrants{false, true, true, true}}, // Three quadrants: upper right, lower left, lower right
{'█', Quadrants{true, true, true, true}}, // Full block
}
// fgAnsiRev and bgAnsiRev map an ANSI code string back to its packed
// uint32 color; both are rebuilt by buildReverseMap.
fgAnsiRev = map[string]uint32{}
bgAnsiRev = map[string]uint32{}
// fgClosestColor and bgClosestColor are indexed by a color's toUint32()
// value and yield the palette color used for that input color.
// NOTE(review): they are nil until populated elsewhere — confirm where.
fgClosestColor *[]RGB
bgClosestColor *[]RGB
// lookupTable caches results of findBestBlockRepresentation; it is
// allocated in init.
lookupTable ApproximateCache
// LookupHits and LookupMisses are reset to zero in init.
// NOTE(review): presumably cache statistics maintained by the
// ApproximateCache methods — not visible here, confirm.
LookupHits int
LookupMisses int
// BeginInitTime records the time at which init ran.
BeginInitTime time.Time
// BestBlockTime accumulates the time findBestBlockRepresentation spends
// searching after a cache miss.
BestBlockTime time.Duration
// bgTree and fgTree supply candidate colors through getCandidateColors
// when the non-exhaustive search path is taken.
bgTree *ColorNode
fgTree *ColorNode
// DistinctColors is compared against CacheThreshold when choosing the
// search strategy. NOTE(review): it is assigned outside the visible code.
DistinctColors int
)
// blockDef pairs a block-drawing glyph with the description of which of its
// four quadrants are painted with the foreground color.
type blockDef struct {
	// Rune is the glyph emitted for this block shape.
	Rune rune
	// Quad marks the quadrants the glyph fills with the foreground color.
	Quad Quadrants
}
// init allocates the block lookup cache, records the package start time,
// clears the lookup counters and then runs initLab.
func init() {
	lookupTable = make(ApproximateCache)
	BeginInitTime = time.Now()
	LookupHits, LookupMisses = 0, 0
	initLab()
}
// buildReverseMap regenerates fgAnsiRev and bgAnsiRev, the tables that map
// an ANSI code string back to the packed color it stands for. Both tables
// are built completely before either package variable is replaced.
func buildReverseMap() {
	// invert returns an Iterate callback that stores code -> color in dst.
	invert := func(dst map[string]uint32) func(key, value interface{}) {
		return func(key, value interface{}) {
			color := key.(uint32)
			code := value.(string)
			dst[code] = color
		}
	}

	fgRev := make(map[string]uint32)
	fgAnsi.Iterate(invert(fgRev))

	bgRev := make(map[string]uint32)
	bgAnsi.Iterate(invert(bgRev))

	fgAnsiRev, bgAnsiRev = fgRev, bgRev
}
// BlockRune is one output character cell: the block glyph chosen for a 2x2
// group of pixels plus the two colors used to draw it.
type BlockRune struct {
	// Rune is the block character to print.
	Rune rune
	// FG is the foreground color and BG the background color of the cell.
	FG, BG RGB
}
// Quadrants describes how a block glyph colors the four cells of a 2x2
// block. A true field means the corresponding quadrant is drawn with the
// foreground color; false means it shows the background color.
type Quadrants struct {
	// Upper row, left to right.
	TopLeft, TopRight bool
	// Lower row, left to right.
	BottomLeft, BottomRight bool
}
// BrownDitherForBlocks applies a modified Floyd-Steinberg dithering
// algorithm to an image, operating on 2x2 pixel blocks rather than on single
// pixels. For every block it picks a glyph plus foreground/background colors
// via findBestBlockRepresentation, then diffuses the per-pixel difference
// between the source color and the color the glyph actually shows there.
//
// img is the image to convert; it is modified in place because the error
// diffusion writes back into it. edges is sampled at the same coordinates as
// img, and a block is treated as an edge block when any of its four edge
// samples exceeds 128.
//
// The result has one row per block row (img.Rows()/2) and one column per
// block column (img.Cols()/2); a trailing odd row or column is ignored.
func BrownDitherForBlocks(
	img gocv.Mat,
	edges gocv.Mat,
) [][]BlockRune {
	height, width := img.Rows(), img.Cols()
	blockHeight, blockWidth := height/2, width/2

	result := make([][]BlockRune, blockHeight)
	for i := range result {
		result[i] = make([]BlockRune, blockWidth)
	}

	for by := 0; by < blockHeight; by++ {
		for bx := 0; bx < blockWidth; bx++ {
			// Pixels are ordered top-left, top-right, bottom-left,
			// bottom-right, matching the order used by calculateBlockError.
			block := [4]RGB{
				rgbFromVecb(img.GetVecbAt(by*2, bx*2)),
				rgbFromVecb(img.GetVecbAt(by*2, bx*2+1)),
				rgbFromVecb(img.GetVecbAt(by*2+1, bx*2)),
				rgbFromVecb(img.GetVecbAt(by*2+1, bx*2+1)),
			}

			// The block counts as an edge if any of its pixels is an edge.
			isEdge := edges.GetUCharAt(by*2, bx*2) > 128 ||
				edges.GetUCharAt(by*2, bx*2+1) > 128 ||
				edges.GetUCharAt(by*2+1, bx*2) > 128 ||
				edges.GetUCharAt(by*2+1, bx*2+1) > 128

			bestRune, fgColor, bgColor := findBestBlockRepresentation(
				block, isEdge)

			result[by][bx] = BlockRune{
				Rune: bestRune,
				FG:   fgColor,
				BG:   bgColor,
			}

			// Which quadrants the chosen glyph paints with the foreground
			// color. This must come from the glyph table: the bits of the
			// rune's code point do not encode quadrant coverage.
			quad := getQuadrantsForRune(bestRune)
			usesFG := [4]bool{
				quad.TopLeft, quad.TopRight,
				quad.BottomLeft, quad.BottomRight,
			}

			// Diffuse, pixel by pixel, the difference between the source
			// color and the color actually rendered at that position.
			for i, blockColor := range block {
				y, x := by*2+i/2, bx*2+i%2
				targetColor := bgColor
				if usesFG[i] {
					targetColor = fgColor
				}
				colorError := blockColor.subtract(targetColor)
				distributeError(img, y, x, colorError, isEdge)
			}
		}
	}
	return result
}
// findBestBlockRepresentation chooses the glyph and the foreground and
// background colors that reproduce a 2x2 block of pixels with the lowest
// error as measured by calculateBlockError.
//
// block holds the four source pixels and isEdge tells whether the block was
// classified as an edge; both are forwarded to the cache and to the error
// function. The return values are the chosen rune, foreground color and
// background color, in that order.
//
// The result is served from lookupTable when possible. On a miss, either the
// complete fg/bg palette is searched exhaustively (KdSearch == 0, or fewer
// distinct colors than CacheThreshold) or only the candidates returned by
// the color trees are searched. The time spent searching is added to
// BestBlockTime and the winner is stored in lookupTable.
func findBestBlockRepresentation(block [4]RGB, isEdge bool) (rune, RGB, RGB) {
	// Translate every pixel through the closest-color tables; the two
	// translated blocks together form the cache key.
	var fgSnapped, bgSnapped [4]RGB
	for idx := range block {
		packed := block[idx].toUint32()
		fgSnapped[idx] = (*fgClosestColor)[packed]
		bgSnapped[idx] = (*bgClosestColor)[packed]
	}
	cacheKey := rgbsPairToUint256(fgSnapped, bgSnapped)

	if cachedRune, cachedFG, cachedBG, ok := lookupTable.getEntry(
		cacheKey, block, isEdge); ok {
		return cachedRune, cachedFG, cachedBG
	}

	searchStart := time.Now()

	var (
		winner             rune
		winnerFG, winnerBG RGB
	)
	lowest := math.MaxFloat64

	if KdSearch == 0 || DistinctColors < int(CacheThreshold) {
		// Exhaustive search: every glyph against every fg/bg pair whose
		// palette keys differ. Only a strictly smaller error replaces the
		// current winner.
		for _, def := range blocks {
			fgAnsi.Iterate(func(fgKey, _ interface{}) {
				fgCandidate := rgbFromUint32(fgKey.(uint32))
				bgAnsi.Iterate(func(bgKey, _ interface{}) {
					bgCandidate := rgbFromUint32(bgKey.(uint32))
					if fgKey == bgKey {
						return
					}
					score := calculateBlockError(
						block, def.Quad, fgCandidate, bgCandidate, isEdge)
					if score < lowest {
						lowest = score
						winner = def.Rune
						winnerFG = fgCandidate
						winnerBG = bgCandidate
					}
				})
			})
		}
	} else {
		// Candidate search: only colors proposed by the trees are tried.
		fgDepth := min(KdSearch, len(fgColors))
		bgDepth := min(KdSearch, len(bgColors))
		fgCandidates := fgTree.getCandidateColors(fgSnapped, fgDepth)
		bgCandidates := bgTree.getCandidateColors(bgSnapped, bgDepth)

		// precedes orders colors by R, then G, then B.
		precedes := func(a, b RGB) bool {
			if a.R != b.R {
				return a.R < b.R
			}
			if a.G != b.G {
				return a.G < b.G
			}
			return a.B < b.B
		}

		for _, def := range blocks {
			for _, fgEntry := range fgCandidates {
				for _, bgEntry := range bgCandidates {
					fgCandidate, bgCandidate := fgEntry.color, bgEntry.color
					if fgCandidate == bgCandidate {
						continue
					}
					score := calculateBlockError(
						block, def.Quad, fgCandidate, bgCandidate, isEdge)
					// A candidate wins on a strictly lower error, or, when
					// the errors are within epsilon of each other, on the
					// foreground color that sorts first.
					improves := score < lowest
					if !improves && math.Abs(score-lowest) < epsilon {
						improves = precedes(fgCandidate, winnerFG)
					}
					if improves {
						lowest = score
						winner = def.Rune
						winnerFG = fgCandidate
						winnerBG = bgCandidate
					}
				}
			}
		}
	}

	BestBlockTime += time.Since(searchStart)
	// Remember the outcome so later lookups for this key can skip the search.
	lookupTable.addEntry(cacheKey, winner, winnerFG, winnerBG, block, isEdge)
	return winner, winnerFG, winnerBG
}
// calculateBlockError scores how well a glyph drawn with the colors fg and
// bg reproduces a 2x2 block of pixels.
//
// block holds the pixels in the order top-left, top-right, bottom-left,
// bottom-right. quad tells which of those positions the glyph paints with fg
// (true) or bg (false). The score is the sum of colorDistance between each
// pixel and the color shown at its position, halved when isEdge is true.
func calculateBlockError(
	block [4]RGB,
	quad Quadrants,
	fg, bg RGB,
	isEdge bool,
) float64 {
	paintsFG := [4]bool{
		quad.TopLeft, quad.TopRight,
		quad.BottomLeft, quad.BottomRight,
	}

	sum := 0.0
	for idx := range block {
		shown := bg
		if paintsFG[idx] {
			shown = fg
		}
		sum += block[idx].colorDistance(shown)
	}

	if !isEdge {
		return sum
	}
	return sum * 0.5
}
// getQuadrantsForRune looks up char in the blocks table and returns the
// quadrant layout of the first entry with that rune. If char is not in the
// table the zero Quadrants value (all quadrants background) is returned.
func getQuadrantsForRune(char rune) Quadrants {
	var layout Quadrants
	for i := range blocks {
		if blocks[i].Rune != char {
			continue
		}
		layout = blocks[i].Quad
		break
	}
	return layout
}
// distributeError spreads the quantization error of the pixel at (y, x) over
// its right, lower-left, lower and lower-right neighbours using the
// Floyd-Steinberg weights 7/16, 3/16, 5/16 and 1/16.
//
// img is updated in place; neighbours that fall outside the image are
// skipped. error is the per-channel error to spread. When isEdge is true the
// spread amount is halved. Each resulting channel value is clamped to the
// range 0..255 before being written back.
func distributeError(img gocv.Mat, y, x int, error RGB, isEdge bool) {
	rows, cols := img.Rows(), img.Cols()

	damping := 1.0
	if isEdge {
		damping = 0.5 // edge pixels pass on only half of their error
	}

	clamp := func(v float64) uint8 {
		return uint8(math.Max(0, math.Min(255, v)))
	}

	neighbours := [...]struct {
		dy, dx int
		weight float64
	}{
		{0, 1, 7.0 / 16.0},
		{1, -1, 3.0 / 16.0},
		{1, 0, 5.0 / 16.0},
		{1, 1, 1.0 / 16.0},
	}

	for _, nb := range neighbours {
		ny, nx := y+nb.dy, x+nb.dx
		if ny < 0 || ny >= rows || nx < 0 || nx >= cols {
			continue
		}
		px := rgbFromVecb(img.GetVecbAt(ny, nx))
		red := clamp(float64(px.R) + float64(error.R)*nb.weight*damping)
		green := clamp(float64(px.G) + float64(error.G)*nb.weight*damping)
		blue := clamp(float64(px.B) + float64(error.B)*nb.weight*damping)
		// Channels are written at byte offsets +2 (R), +1 (G) and +0 (B)
		// within the pixel's three bytes.
		img.SetUCharAt(ny, nx*3+2, red)
		img.SetUCharAt(ny, nx*3+1, green)
		img.SetUCharAt(ny, nx*3, blue)
	}
}
// ImageToANSI converts the image stored at imagePath to ANSI art and returns
// it as a string.
//
// The image is first rendered TargetWidth wide, with the height derived from
// the image's aspect ratio divided by ScaleFactor. While the rendered string
// is longer than MaxChars the width is reduced by 2 and the conversion is
// repeated with the height recomputed by the same formula.
//
// Failures are reported through the returned string rather than an error:
// a message is returned when the image cannot be read, and another when the
// width drops below 10 without the output fitting into MaxChars.
//
// Every attempt also writes the debug images "resized.png", "dithered.png"
// and "edges.png"; failures to write them are printed and otherwise ignored.
func ImageToANSI(imagePath string) string {
	closeMat := func(m *gocv.Mat) {
		if err := m.Close(); err != nil {
			fmt.Println("Error closing image")
		}
	}

	img := gocv.IMRead(imagePath, gocv.IMReadAnyColor)
	// Deferred before the emptiness check so the Mat is released on the
	// failure path as well.
	defer closeMat(&img)
	if img.Empty() {
		return fmt.Sprintf("Could not read image from %s", imagePath)
	}

	aspectRatio := float64(img.Cols()) / float64(img.Rows())

	// attempt performs one conversion at the given size. It is a separate
	// function so the intermediate Mats are released after every attempt
	// instead of accumulating until ImageToANSI returns.
	// NOTE(review): assumes prepareForANSI returns newly allocated Mats that
	// the caller owns (i.e. never img itself) — confirm.
	attempt := func(width, height int) string {
		resized, edges := prepareForANSI(img, width, height)
		defer closeMat(&resized)
		defer closeMat(&edges)

		ditheredImg := BrownDitherForBlocks(resized, edges)

		// Write the scaled image to a file for debugging
		if err := saveToPNG(resized, "resized.png"); err != nil {
			fmt.Println(err)
		}
		// Write the dithered image to a file for debugging. Skipped when
		// there are no block rows, because indexing row 0 would panic.
		if len(ditheredImg) > 0 {
			if err := saveBlocksToPNG(ditheredImg,
				"dithered.png",
				len(ditheredImg[0])*8,
				int(float64(len(ditheredImg)*8)*ScaleFactor),
				ScaleFactor,
			); err != nil {
				fmt.Println(err)
			}
		}
		// Write the edges image to a file for debugging
		if err := saveToPNG(edges, "edges.png"); err != nil {
			fmt.Println(err)
		}

		return renderToAnsi(ditheredImg)
	}

	width := TargetWidth
	height := int(float64(width) / aspectRatio / ScaleFactor)
	for {
		ansiImage := attempt(width, height)
		if len(ansiImage) <= MaxChars {
			return ansiImage
		}
		width -= 2
		// Use the same formula as the initial sizing so retries keep the
		// configured ScaleFactor instead of a hard-coded divisor.
		height = int(float64(width) / aspectRatio / ScaleFactor)
		if width < 10 {
			return "Image too large to fit within character limit"
		}
	}
}