github.com/riscv/riscv-go@v0.0.0-20200123204226-124ebd6fcc8e/src/image/jpeg/dct_test.go (about) 1 // Copyright 2012 The Go Authors. All rights reserved. 2 // Use of this source code is governed by a BSD-style 3 // license that can be found in the LICENSE file. 4 5 package jpeg 6 7 import ( 8 "bytes" 9 "fmt" 10 "math" 11 "math/rand" 12 "testing" 13 ) 14 15 func benchmarkDCT(b *testing.B, f func(*block)) { 16 b.StopTimer() 17 blocks := make([]block, 0, b.N*len(testBlocks)) 18 for i := 0; i < b.N; i++ { 19 blocks = append(blocks, testBlocks[:]...) 20 } 21 b.StartTimer() 22 for i := range blocks { 23 f(&blocks[i]) 24 } 25 } 26 27 func BenchmarkFDCT(b *testing.B) { 28 benchmarkDCT(b, fdct) 29 } 30 31 func BenchmarkIDCT(b *testing.B) { 32 benchmarkDCT(b, idct) 33 } 34 35 func TestDCT(t *testing.T) { 36 blocks := make([]block, len(testBlocks)) 37 copy(blocks, testBlocks[:]) 38 39 // Append some randomly generated blocks of varying sparseness. 40 r := rand.New(rand.NewSource(123)) 41 for i := 0; i < 100; i++ { 42 b := block{} 43 n := r.Int() % 64 44 for j := 0; j < n; j++ { 45 b[r.Int()%len(b)] = r.Int31() % 256 46 } 47 blocks = append(blocks, b) 48 } 49 50 // Check that the FDCT and IDCT functions are inverses, after a scale and 51 // level shift. Scaling reduces the rounding errors in the conversion from 52 // floats to ints. 53 for i, b := range blocks { 54 got, want := b, b 55 for j := range got { 56 got[j] = (got[j] - 128) * 8 57 } 58 slowFDCT(&got) 59 slowIDCT(&got) 60 for j := range got { 61 got[j] = got[j]/8 + 128 62 } 63 if differ(&got, &want) { 64 t.Errorf("i=%d: IDCT(FDCT)\nsrc\n%s\ngot\n%s\nwant\n%s\n", i, &b, &got, &want) 65 } 66 } 67 68 // Check that the optimized and slow FDCT implementations agree. 69 // The fdct function already does a scale and level shift. 70 for i, b := range blocks { 71 got, want := b, b 72 fdct(&got) 73 for j := range want { 74 want[j] = (want[j] - 128) * 8 75 } 76 slowFDCT(&want) 77 if differ(&got, &want) { 78 t.Errorf("i=%d: FDCT\nsrc\n%s\ngot\n%s\nwant\n%s\n", i, &b, &got, &want) 79 } 80 } 81 82 // Check that the optimized and slow IDCT implementations agree. 83 for i, b := range blocks { 84 got, want := b, b 85 idct(&got) 86 slowIDCT(&want) 87 if differ(&got, &want) { 88 t.Errorf("i=%d: IDCT\nsrc\n%s\ngot\n%s\nwant\n%s\n", i, &b, &got, &want) 89 } 90 } 91 } 92 93 // differ reports whether any pair-wise elements in b0 and b1 differ by 2 or 94 // more. That tolerance is because there isn't a single definitive decoding of 95 // a given JPEG image, even before the YCbCr to RGB conversion; implementations 96 // can have different IDCT rounding errors. 97 func differ(b0, b1 *block) bool { 98 for i := range b0 { 99 delta := b0[i] - b1[i] 100 if delta < -2 || +2 < delta { 101 return true 102 } 103 } 104 return false 105 } 106 107 // alpha returns 1 if i is 0 and returns √2 otherwise. 108 func alpha(i int) float64 { 109 if i == 0 { 110 return 1 111 } 112 return math.Sqrt2 113 } 114 115 var cosines [32]float64 // cosines[k] = cos(π/2 * k/8) 116 117 func init() { 118 for k := range cosines { 119 cosines[k] = math.Cos(math.Pi * float64(k) / 16) 120 } 121 } 122 123 // slowFDCT performs the 8*8 2-dimensional forward discrete cosine transform: 124 // 125 // dst[u,v] = (1/8) * Σ_x Σ_y alpha(u) * alpha(v) * src[x,y] * 126 // cos((π/2) * (2*x + 1) * u / 8) * 127 // cos((π/2) * (2*y + 1) * v / 8) 128 // 129 // x and y are in pixel space, and u and v are in transform space. 130 // 131 // b acts as both dst and src. 132 func slowFDCT(b *block) { 133 var dst [blockSize]float64 134 for v := 0; v < 8; v++ { 135 for u := 0; u < 8; u++ { 136 sum := 0.0 137 for y := 0; y < 8; y++ { 138 for x := 0; x < 8; x++ { 139 sum += alpha(u) * alpha(v) * float64(b[8*y+x]) * 140 cosines[((2*x+1)*u)%32] * 141 cosines[((2*y+1)*v)%32] 142 } 143 } 144 dst[8*v+u] = sum / 8 145 } 146 } 147 // Convert from float64 to int32. 148 for i := range dst { 149 b[i] = int32(dst[i] + 0.5) 150 } 151 } 152 153 // slowIDCT performs the 8*8 2-dimensional inverse discrete cosine transform: 154 // 155 // dst[x,y] = (1/8) * Σ_u Σ_v alpha(u) * alpha(v) * src[u,v] * 156 // cos((π/2) * (2*x + 1) * u / 8) * 157 // cos((π/2) * (2*y + 1) * v / 8) 158 // 159 // x and y are in pixel space, and u and v are in transform space. 160 // 161 // b acts as both dst and src. 162 func slowIDCT(b *block) { 163 var dst [blockSize]float64 164 for y := 0; y < 8; y++ { 165 for x := 0; x < 8; x++ { 166 sum := 0.0 167 for v := 0; v < 8; v++ { 168 for u := 0; u < 8; u++ { 169 sum += alpha(u) * alpha(v) * float64(b[8*v+u]) * 170 cosines[((2*x+1)*u)%32] * 171 cosines[((2*y+1)*v)%32] 172 } 173 } 174 dst[8*y+x] = sum / 8 175 } 176 } 177 // Convert from float64 to int32. 178 for i := range dst { 179 b[i] = int32(dst[i] + 0.5) 180 } 181 } 182 183 func (b *block) String() string { 184 s := bytes.NewBuffer(nil) 185 fmt.Fprintf(s, "{\n") 186 for y := 0; y < 8; y++ { 187 fmt.Fprintf(s, "\t") 188 for x := 0; x < 8; x++ { 189 fmt.Fprintf(s, "0x%04x, ", uint16(b[8*y+x])) 190 } 191 fmt.Fprintln(s) 192 } 193 fmt.Fprintf(s, "}") 194 return s.String() 195 } 196 197 // testBlocks are the first 10 pre-IDCT blocks from ../testdata/video-001.jpeg. 198 var testBlocks = [10]block{ 199 { 200 0x7f, 0xf6, 0x01, 0x07, 0xff, 0x00, 0x00, 0x00, 201 0xf5, 0x01, 0xfa, 0x01, 0xfe, 0x00, 0x01, 0x00, 202 0x05, 0x05, 0x01, 0x00, 0x00, 0x00, 0x00, 0x00, 203 0x01, 0xff, 0xf8, 0x00, 0x01, 0xff, 0x00, 0x00, 204 0x00, 0x01, 0x00, 0x01, 0x00, 0xff, 0xff, 0x00, 205 0xff, 0x0c, 0x00, 0x00, 0x00, 0x00, 0xff, 0x01, 206 0x00, 0x00, 0x00, 0x01, 0x00, 0x00, 0x00, 0x00, 207 0x01, 0x00, 0x00, 0x01, 0xff, 0x01, 0x00, 0xfe, 208 }, 209 { 210 0x29, 0x07, 0x00, 0xfc, 0x01, 0x01, 0x00, 0x00, 211 0x07, 0x00, 0x03, 0x00, 0x01, 0x00, 0xff, 0xff, 212 0xff, 0xfd, 0xff, 0x00, 0x00, 0x00, 0x00, 0x00, 213 0x00, 0x00, 0x04, 0x00, 0xff, 0x01, 0x00, 0x00, 214 0x01, 0x00, 0x01, 0xff, 0x00, 0x00, 0x00, 0x00, 215 0x01, 0xfa, 0x01, 0x00, 0x01, 0x00, 0x01, 0xff, 216 0x00, 0x00, 0xff, 0x00, 0x00, 0x00, 0x00, 0x00, 217 0x00, 0x00, 0x00, 0xff, 0x00, 0xff, 0x00, 0x02, 218 }, 219 { 220 0xc5, 0xfa, 0x01, 0x00, 0x00, 0x01, 0x00, 0xff, 221 0x02, 0xff, 0x01, 0x00, 0x01, 0x00, 0xff, 0x00, 222 0xff, 0xff, 0x00, 0xff, 0x01, 0x00, 0x00, 0x00, 223 0xff, 0x00, 0x01, 0x00, 0x00, 0x00, 0xff, 0x00, 224 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0xff, 225 0x00, 0xff, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 226 0x01, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 227 0xff, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 228 }, 229 { 230 0x86, 0x05, 0x00, 0x02, 0x00, 0x00, 0x01, 0x00, 231 0xf2, 0x06, 0x00, 0x00, 0x01, 0x02, 0x00, 0x00, 232 0xf6, 0xfa, 0xf9, 0x00, 0xff, 0x01, 0x00, 0x00, 233 0xf9, 0x00, 0x00, 0xff, 0x00, 0x00, 0x00, 0x00, 234 0x00, 0xff, 0x00, 0xff, 0xff, 0xff, 0x00, 0x00, 235 0xff, 0x00, 0x00, 0x01, 0x00, 0xff, 0x01, 0x00, 236 0x00, 0x00, 0x00, 0xff, 0x00, 0x00, 0x00, 0x01, 237 0x00, 0x01, 0xff, 0x01, 0x00, 0xff, 0x00, 0x00, 238 }, 239 { 240 0x24, 0xfe, 0x00, 0xff, 0x00, 0xff, 0xff, 0x00, 241 0x08, 0xfd, 0x00, 0x01, 0x01, 0x00, 0x01, 0x00, 242 0x06, 0x03, 0x03, 0xff, 0x00, 0x00, 0x00, 0x00, 243 0x04, 0xff, 0x00, 0x00, 0x00, 0x00, 0x00, 0xff, 244 0x00, 0x00, 0x00, 0x00, 0x01, 0x00, 0x00, 0x01, 245 0x01, 0x00, 0x01, 0xff, 0x00, 0x01, 0x00, 0x00, 246 0x01, 0x01, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 247 0x01, 0x00, 0x01, 0x00, 0x00, 0x00, 0xff, 0x01, 248 }, 249 { 250 0xcd, 0xff, 0x00, 0x00, 0x00, 0x00, 0x01, 0x01, 251 0x03, 0xff, 0x00, 0x00, 0x00, 0x00, 0x00, 0xff, 252 0x01, 0x01, 0x01, 0x01, 0x01, 0x00, 0x00, 0x00, 253 0x01, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 254 0x01, 0x00, 0x00, 0x00, 0x00, 0x01, 0x01, 0x00, 255 0x00, 0x00, 0x00, 0x01, 0x00, 0x00, 0x00, 0x00, 256 0x00, 0xff, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 257 0x00, 0x00, 0x00, 0x00, 0x00, 0x01, 0x00, 0xff, 258 }, 259 { 260 0x81, 0xfe, 0x05, 0xff, 0x01, 0xff, 0x01, 0x00, 261 0xef, 0xf9, 0x00, 0xf9, 0x00, 0xff, 0x00, 0xff, 262 0x05, 0xf9, 0x00, 0xf8, 0x01, 0xff, 0x01, 0xff, 263 0x00, 0xff, 0x07, 0x00, 0x01, 0x00, 0x00, 0x00, 264 0x01, 0x00, 0x01, 0x01, 0x00, 0x00, 0x00, 0x00, 265 0x01, 0x00, 0x00, 0x00, 0xff, 0xff, 0x00, 0x01, 266 0xff, 0x01, 0x01, 0x00, 0xff, 0x00, 0x00, 0x00, 267 0x01, 0x01, 0x00, 0xff, 0x00, 0x00, 0x00, 0xff, 268 }, 269 { 270 0x28, 0x00, 0xfe, 0x00, 0x00, 0x00, 0x00, 0x00, 271 0x0b, 0x02, 0x01, 0x03, 0x00, 0xff, 0x00, 0x01, 272 0xfe, 0x02, 0x01, 0x03, 0xff, 0x00, 0x00, 0x00, 273 0x01, 0x00, 0xfd, 0x00, 0x01, 0x00, 0xff, 0x00, 274 0x01, 0xff, 0x00, 0xff, 0x01, 0x00, 0x00, 0x00, 275 0x00, 0x00, 0x00, 0xff, 0x01, 0x01, 0x00, 0xff, 276 0x01, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 277 0xff, 0xff, 0x00, 0x00, 0x00, 0xff, 0x00, 0x01, 278 }, 279 { 280 0xdf, 0xf9, 0xfe, 0x00, 0x03, 0x01, 0xff, 0xff, 281 0x04, 0x01, 0x00, 0x01, 0x00, 0x00, 0x00, 0x00, 282 0xff, 0x01, 0x01, 0x01, 0x00, 0x00, 0x00, 0x01, 283 0x00, 0x00, 0xfe, 0x01, 0x00, 0x00, 0x00, 0x00, 284 0x00, 0x00, 0xff, 0x01, 0x00, 0x00, 0x00, 0x01, 285 0xff, 0x00, 0x00, 0x00, 0x00, 0x01, 0x00, 0x00, 286 0x00, 0xff, 0x00, 0xff, 0x01, 0x00, 0x00, 0x01, 287 0xff, 0xff, 0x00, 0x00, 0x00, 0x01, 0x00, 0x00, 288 }, 289 { 290 0x88, 0xfd, 0x00, 0x00, 0xff, 0x00, 0x01, 0xff, 291 0xe1, 0x06, 0x06, 0x01, 0xff, 0x00, 0x01, 0x00, 292 0x08, 0x00, 0xfa, 0x00, 0xff, 0xff, 0xff, 0xff, 293 0x08, 0x01, 0x00, 0xff, 0x01, 0xff, 0x00, 0x00, 294 0xf5, 0xff, 0x00, 0x01, 0xff, 0x01, 0x01, 0x00, 295 0xff, 0xff, 0x01, 0xff, 0x01, 0x00, 0x01, 0x00, 296 0x00, 0x01, 0x01, 0xff, 0x00, 0xff, 0x00, 0x01, 297 0x02, 0x00, 0x00, 0xff, 0xff, 0x00, 0xff, 0x00, 298 }, 299 }