Home | History | Annotate | Download | only in etc1
      1 // Copyright 2009 Google Inc.
      2 //
      3 // Licensed under the Apache License, Version 2.0 (the "License");
      4 // you may not use this file except in compliance with the License.
      5 // You may obtain a copy of the License at
      6 //
      7 //     http://www.apache.org/licenses/LICENSE-2.0
      8 //
      9 // Unless required by applicable law or agreed to in writing, software
     10 // distributed under the License is distributed on an "AS IS" BASIS,
     11 // WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
     12 // See the License for the specific language governing permissions and
     13 // limitations under the License.
     14 
     15 //////////////////////////////////////////////////////////////////////////////////////////
     16 
     17 // This is a fork of the AOSP project ETC1 codec. The original code can be found
     18 // at the following web site:
     19 // https://android.googlesource.com/platform/frameworks/native/+/master/opengl/include/ETC1/
     20 
     21 //////////////////////////////////////////////////////////////////////////////////////////
     22 
     23 #include "etc1.h"
     24 
     25 #include <cstring>
     26 
     27 /* From http://www.khronos.org/registry/gles/extensions/OES/OES_compressed_ETC1_RGB8_texture.txt
     28 
     29  The number of bits that represent a 4x4 texel block is 64 bits if
     30  <internalformat> is given by ETC1_RGB8_OES.
     31 
     32  The data for a block is a number of bytes,
     33 
     34  {q0, q1, q2, q3, q4, q5, q6, q7}
     35 
     36  where byte q0 is located at the lowest memory address and q7 at
     37  the highest. The 64 bits specifying the block is then represented
     38  by the following 64 bit integer:
     39 
     40  int64bit = 256*(256*(256*(256*(256*(256*(256*q0+q1)+q2)+q3)+q4)+q5)+q6)+q7;
     41 
     42  ETC1_RGB8_OES:
     43 
     44  a) bit layout in bits 63 through 32 if diffbit = 0
     45 
     46  63 62 61 60 59 58 57 56 55 54 53 52 51 50 49 48
     47  -----------------------------------------------
     48  | base col1 | base col2 | base col1 | base col2 |
     49  | R1 (4bits)| R2 (4bits)| G1 (4bits)| G2 (4bits)|
     50  -----------------------------------------------
     51 
     52  47 46 45 44 43 42 41 40 39 38 37 36 35 34  33  32
     53  ---------------------------------------------------
     54  | base col1 | base col2 | table  | table  |diff|flip|
     55  | B1 (4bits)| B2 (4bits)| cw 1   | cw 2   |bit |bit |
     56  ---------------------------------------------------
     57 
     58 
     59  b) bit layout in bits 63 through 32 if diffbit = 1
     60 
     61  63 62 61 60 59 58 57 56 55 54 53 52 51 50 49 48
     62  -----------------------------------------------
     63  | base col1    | dcol 2 | base col1    | dcol 2 |
     64  | R1' (5 bits) | dR2    | G1' (5 bits) | dG2    |
     65  -----------------------------------------------
     66 
     67  47 46 45 44 43 42 41 40 39 38 37 36 35 34  33  32
     68  ---------------------------------------------------
     69  | base col 1   | dcol 2 | table  | table  |diff|flip|
     70  | B1' (5 bits) | dB2    | cw 1   | cw 2   |bit |bit |
     71  ---------------------------------------------------
     72 
     73 
     74  c) bit layout in bits 31 through 0 (in both cases)
     75 
     76  31 30 29 28 27 26 25 24 23 22 21 20 19 18 17 16
     77  -----------------------------------------------
     78  |       most significant pixel index bits       |
     79  | p| o| n| m| l| k| j| i| h| g| f| e| d| c| b| a|
     80  -----------------------------------------------
     81 
     82  15 14 13 12 11 10  9  8  7  6  5  4  3   2   1  0
     83  --------------------------------------------------
     84  |         least significant pixel index bits       |
     85  | p| o| n| m| l| k| j| i| h| g| f| e| d| c | b | a |
     86  --------------------------------------------------
     87 
     88 
     89  Add table 3.17.2: Intensity modifier sets for ETC1 compressed textures:
     90 
     91  table codeword                modifier table
     92  ------------------        ----------------------
     93  0                     -8  -2  2   8
     94  1                    -17  -5  5  17
     95  2                    -29  -9  9  29
     96  3                    -42 -13 13  42
     97  4                    -60 -18 18  60
     98  5                    -80 -24 24  80
     99  6                   -106 -33 33 106
    100  7                   -183 -47 47 183
    101 
    102 
    103  Add table 3.17.3 Mapping from pixel index values to modifier values for
    104  ETC1 compressed textures:
    105 
    106  pixel index value
    107  ---------------
    108  msb     lsb           resulting modifier value
    109  -----   -----          -------------------------
    110  1       1            -b (large negative value)
    111  1       0            -a (small negative value)
    112  0       0             a (small positive value)
    113  0       1             b (large positive value)
    114 
    115 
    116  */
    117 
    118 static const int kModifierTable[] = {
    119 /* 0 */2, 8, -2, -8,
    120 /* 1 */5, 17, -5, -17,
    121 /* 2 */9, 29, -9, -29,
    122 /* 3 */13, 42, -13, -42,
    123 /* 4 */18, 60, -18, -60,
    124 /* 5 */24, 80, -24, -80,
    125 /* 6 */33, 106, -33, -106,
    126 /* 7 */47, 183, -47, -183 };
    127 
    128 static const int kLookup[8] = { 0, 1, 2, 3, -4, -3, -2, -1 };
    129 
    130 static inline etc1_byte clamp(int x) {
    131     return (etc1_byte) (x >= 0 ? (x < 255 ? x : 255) : 0);
    132 }
    133 
    134 static
    135 inline int convert4To8(int b) {
    136     int c = b & 0xf;
    137     return (c << 4) | c;
    138 }
    139 
    140 static
    141 inline int convert5To8(int b) {
    142     int c = b & 0x1f;
    143     return (c << 3) | (c >> 2);
    144 }
    145 
    146 static
    147 inline int convert6To8(int b) {
    148     int c = b & 0x3f;
    149     return (c << 2) | (c >> 4);
    150 }
    151 
    152 static
    153 inline int divideBy255(int d) {
    154     return (d + 128 + (d >> 8)) >> 8;
    155 }
    156 
    157 static
    158 inline int convert8To4(int b) {
    159     int c = b & 0xff;
    160     return divideBy255(c * 15);
    161 }
    162 
    163 static
    164 inline int convert8To5(int b) {
    165     int c = b & 0xff;
    166     return divideBy255(c * 31);
    167 }
    168 
    169 static
    170 inline int convertDiff(int base, int diff) {
    171     return convert5To8((0x1f & base) + kLookup[0x7 & diff]);
    172 }
    173 
    174 static
    175 void decode_subblock(etc1_byte* pOut, int r, int g, int b, const int* table,
    176         etc1_uint32 low, bool second, bool flipped) {
    177     int baseX = 0;
    178     int baseY = 0;
    179     if (second) {
    180         if (flipped) {
    181             baseY = 2;
    182         } else {
    183             baseX = 2;
    184         }
    185     }
    186     for (int i = 0; i < 8; i++) {
    187         int x, y;
    188         if (flipped) {
    189             x = baseX + (i >> 1);
    190             y = baseY + (i & 1);
    191         } else {
    192             x = baseX + (i >> 2);
    193             y = baseY + (i & 3);
    194         }
    195         int k = y + (x * 4);
    196         int offset = ((low >> k) & 1) | ((low >> (k + 15)) & 2);
    197         int delta = table[offset];
    198         etc1_byte* q = pOut + 3 * (x + 4 * y);
    199         *q++ = clamp(r + delta);
    200         *q++ = clamp(g + delta);
    201         *q++ = clamp(b + delta);
    202     }
    203 }
    204 
    205 // Input is an ETC1 compressed version of the data.
    206 // Output is a 4 x 4 square of 3-byte pixels in form R, G, B
    207 
    208 void etc1_decode_block(const etc1_byte* pIn, etc1_byte* pOut) {
    209     etc1_uint32 high = (pIn[0] << 24) | (pIn[1] << 16) | (pIn[2] << 8) | pIn[3];
    210     etc1_uint32 low = (pIn[4] << 24) | (pIn[5] << 16) | (pIn[6] << 8) | pIn[7];
    211     int r1, r2, g1, g2, b1, b2;
    212     if (high & 2) {
    213         // differential
    214         int rBase = high >> 27;
    215         int gBase = high >> 19;
    216         int bBase = high >> 11;
    217         r1 = convert5To8(rBase);
    218         r2 = convertDiff(rBase, high >> 24);
    219         g1 = convert5To8(gBase);
    220         g2 = convertDiff(gBase, high >> 16);
    221         b1 = convert5To8(bBase);
    222         b2 = convertDiff(bBase, high >> 8);
    223     } else {
    224         // not differential
    225         r1 = convert4To8(high >> 28);
    226         r2 = convert4To8(high >> 24);
    227         g1 = convert4To8(high >> 20);
    228         g2 = convert4To8(high >> 16);
    229         b1 = convert4To8(high >> 12);
    230         b2 = convert4To8(high >> 8);
    231     }
    232     int tableIndexA = 7 & (high >> 5);
    233     int tableIndexB = 7 & (high >> 2);
    234     const int* tableA = kModifierTable + tableIndexA * 4;
    235     const int* tableB = kModifierTable + tableIndexB * 4;
    236     bool flipped = (high & 1) != 0;
    237     decode_subblock(pOut, r1, g1, b1, tableA, low, false, flipped);
    238     decode_subblock(pOut, r2, g2, b2, tableB, low, true, flipped);
    239 }
    240 
    241 typedef struct {
    242     etc1_uint32 high;
    243     etc1_uint32 low;
    244     etc1_uint32 score; // Lower is more accurate
    245 } etc_compressed;
    246 
    247 static
    248 inline void take_best(etc_compressed* a, const etc_compressed* b) {
    249     if (a->score > b->score) {
    250         *a = *b;
    251     }
    252 }
    253 
    254 static
    255 void etc_average_colors_subblock(const etc1_byte* pIn, etc1_uint32 inMask,
    256         etc1_byte* pColors, bool flipped, bool second) {
    257     int r = 0;
    258     int g = 0;
    259     int b = 0;
    260 
    261     if (flipped) {
    262         int by = 0;
    263         if (second) {
    264             by = 2;
    265         }
    266         for (int y = 0; y < 2; y++) {
    267             int yy = by + y;
    268             for (int x = 0; x < 4; x++) {
    269                 int i = x + 4 * yy;
    270                 if (inMask & (1 << i)) {
    271                     const etc1_byte* p = pIn + i * 3;
    272                     r += *(p++);
    273                     g += *(p++);
    274                     b += *(p++);
    275                 }
    276             }
    277         }
    278     } else {
    279         int bx = 0;
    280         if (second) {
    281             bx = 2;
    282         }
    283         for (int y = 0; y < 4; y++) {
    284             for (int x = 0; x < 2; x++) {
    285                 int xx = bx + x;
    286                 int i = xx + 4 * y;
    287                 if (inMask & (1 << i)) {
    288                     const etc1_byte* p = pIn + i * 3;
    289                     r += *(p++);
    290                     g += *(p++);
    291                     b += *(p++);
    292                 }
    293             }
    294         }
    295     }
    296     pColors[0] = (etc1_byte)((r + 4) >> 3);
    297     pColors[1] = (etc1_byte)((g + 4) >> 3);
    298     pColors[2] = (etc1_byte)((b + 4) >> 3);
    299 }
    300 
    301 static
    302 inline int square(int x) {
    303     return x * x;
    304 }
    305 
    306 static etc1_uint32 chooseModifier(const etc1_byte* pBaseColors,
    307         const etc1_byte* pIn, etc1_uint32 *pLow, int bitIndex,
    308         const int* pModifierTable) {
    309     etc1_uint32 bestScore = ~0;
    310     int bestIndex = 0;
    311     int pixelR = pIn[0];
    312     int pixelG = pIn[1];
    313     int pixelB = pIn[2];
    314     int r = pBaseColors[0];
    315     int g = pBaseColors[1];
    316     int b = pBaseColors[2];
    317     for (int i = 0; i < 4; i++) {
    318         int modifier = pModifierTable[i];
    319         int decodedG = clamp(g + modifier);
    320         etc1_uint32 score = (etc1_uint32) (6 * square(decodedG - pixelG));
    321         if (score >= bestScore) {
    322             continue;
    323         }
    324         int decodedR = clamp(r + modifier);
    325         score += (etc1_uint32) (3 * square(decodedR - pixelR));
    326         if (score >= bestScore) {
    327             continue;
    328         }
    329         int decodedB = clamp(b + modifier);
    330         score += (etc1_uint32) square(decodedB - pixelB);
    331         if (score < bestScore) {
    332             bestScore = score;
    333             bestIndex = i;
    334         }
    335     }
    336     etc1_uint32 lowMask = (((bestIndex >> 1) << 16) | (bestIndex & 1))
    337             << bitIndex;
    338     *pLow |= lowMask;
    339     return bestScore;
    340 }
    341 
    342 static
    343 void etc_encode_subblock_helper(const etc1_byte* pIn, etc1_uint32 inMask,
    344         etc_compressed* pCompressed, bool flipped, bool second,
    345         const etc1_byte* pBaseColors, const int* pModifierTable) {
    346     int score = pCompressed->score;
    347     if (flipped) {
    348         int by = 0;
    349         if (second) {
    350             by = 2;
    351         }
    352         for (int y = 0; y < 2; y++) {
    353             int yy = by + y;
    354             for (int x = 0; x < 4; x++) {
    355                 int i = x + 4 * yy;
    356                 if (inMask & (1 << i)) {
    357                     score += chooseModifier(pBaseColors, pIn + i * 3,
    358                             &pCompressed->low, yy + x * 4, pModifierTable);
    359                 }
    360             }
    361         }
    362     } else {
    363         int bx = 0;
    364         if (second) {
    365             bx = 2;
    366         }
    367         for (int y = 0; y < 4; y++) {
    368             for (int x = 0; x < 2; x++) {
    369                 int xx = bx + x;
    370                 int i = xx + 4 * y;
    371                 if (inMask & (1 << i)) {
    372                     score += chooseModifier(pBaseColors, pIn + i * 3,
    373                             &pCompressed->low, y + xx * 4, pModifierTable);
    374                 }
    375             }
    376         }
    377     }
    378     pCompressed->score = score;
    379 }
    380 
    381 static bool inRange4bitSigned(int color) {
    382     return color >= -4 && color <= 3;
    383 }
    384 
    385 static void etc_encodeBaseColors(etc1_byte* pBaseColors,
    386         const etc1_byte* pColors, etc_compressed* pCompressed) {
    387     int r1, g1, b1, r2, g2, b2; // 8 bit base colors for sub-blocks
    388     bool differential;
    389     {
    390         int r51 = convert8To5(pColors[0]);
    391         int g51 = convert8To5(pColors[1]);
    392         int b51 = convert8To5(pColors[2]);
    393         int r52 = convert8To5(pColors[3]);
    394         int g52 = convert8To5(pColors[4]);
    395         int b52 = convert8To5(pColors[5]);
    396 
    397         r1 = convert5To8(r51);
    398         g1 = convert5To8(g51);
    399         b1 = convert5To8(b51);
    400 
    401         int dr = r52 - r51;
    402         int dg = g52 - g51;
    403         int db = b52 - b51;
    404 
    405         differential = inRange4bitSigned(dr) && inRange4bitSigned(dg)
    406                 && inRange4bitSigned(db);
    407         if (differential) {
    408             r2 = convert5To8(r51 + dr);
    409             g2 = convert5To8(g51 + dg);
    410             b2 = convert5To8(b51 + db);
    411             pCompressed->high |= (r51 << 27) | ((7 & dr) << 24) | (g51 << 19)
    412                     | ((7 & dg) << 16) | (b51 << 11) | ((7 & db) << 8) | 2;
    413         }
    414     }
    415 
    416     if (!differential) {
    417         int r41 = convert8To4(pColors[0]);
    418         int g41 = convert8To4(pColors[1]);
    419         int b41 = convert8To4(pColors[2]);
    420         int r42 = convert8To4(pColors[3]);
    421         int g42 = convert8To4(pColors[4]);
    422         int b42 = convert8To4(pColors[5]);
    423         r1 = convert4To8(r41);
    424         g1 = convert4To8(g41);
    425         b1 = convert4To8(b41);
    426         r2 = convert4To8(r42);
    427         g2 = convert4To8(g42);
    428         b2 = convert4To8(b42);
    429         pCompressed->high |= (r41 << 28) | (r42 << 24) | (g41 << 20) | (g42
    430                 << 16) | (b41 << 12) | (b42 << 8);
    431     }
    432     pBaseColors[0] = r1;
    433     pBaseColors[1] = g1;
    434     pBaseColors[2] = b1;
    435     pBaseColors[3] = r2;
    436     pBaseColors[4] = g2;
    437     pBaseColors[5] = b2;
    438 }
    439 
    440 static
    441 void etc_encode_block_helper(const etc1_byte* pIn, etc1_uint32 inMask,
    442         const etc1_byte* pColors, etc_compressed* pCompressed, bool flipped) {
    443     pCompressed->score = ~0;
    444     pCompressed->high = (flipped ? 1 : 0);
    445     pCompressed->low = 0;
    446 
    447     etc1_byte pBaseColors[6];
    448 
    449     etc_encodeBaseColors(pBaseColors, pColors, pCompressed);
    450 
    451     int originalHigh = pCompressed->high;
    452 
    453     const int* pModifierTable = kModifierTable;
    454     for (int i = 0; i < 8; i++, pModifierTable += 4) {
    455         etc_compressed temp;
    456         temp.score = 0;
    457         temp.high = originalHigh | (i << 5);
    458         temp.low = 0;
    459         etc_encode_subblock_helper(pIn, inMask, &temp, flipped, false,
    460                 pBaseColors, pModifierTable);
    461         take_best(pCompressed, &temp);
    462     }
    463     pModifierTable = kModifierTable;
    464     etc_compressed firstHalf = *pCompressed;
    465     for (int i = 0; i < 8; i++, pModifierTable += 4) {
    466         etc_compressed temp;
    467         temp.score = firstHalf.score;
    468         temp.high = firstHalf.high | (i << 2);
    469         temp.low = firstHalf.low;
    470         etc_encode_subblock_helper(pIn, inMask, &temp, flipped, true,
    471                 pBaseColors + 3, pModifierTable);
    472         if (i == 0) {
    473             *pCompressed = temp;
    474         } else {
    475             take_best(pCompressed, &temp);
    476         }
    477     }
    478 }
    479 
    480 static void writeBigEndian(etc1_byte* pOut, etc1_uint32 d) {
    481     pOut[0] = (etc1_byte)(d >> 24);
    482     pOut[1] = (etc1_byte)(d >> 16);
    483     pOut[2] = (etc1_byte)(d >> 8);
    484     pOut[3] = (etc1_byte) d;
    485 }
    486 
    487 // Input is a 4 x 4 square of 3-byte pixels in form R, G, B
    488 // inmask is a 16-bit mask where bit (1 << (x + y * 4)) tells whether the corresponding (x,y)
    489 // pixel is valid or not. Invalid pixel color values are ignored when compressing.
    490 // Output is an ETC1 compressed version of the data.
    491 
    492 void etc1_encode_block(const etc1_byte* pIn, etc1_uint32 inMask,
    493         etc1_byte* pOut) {
    494     etc1_byte colors[6];
    495     etc1_byte flippedColors[6];
    496     etc_average_colors_subblock(pIn, inMask, colors, false, false);
    497     etc_average_colors_subblock(pIn, inMask, colors + 3, false, true);
    498     etc_average_colors_subblock(pIn, inMask, flippedColors, true, false);
    499     etc_average_colors_subblock(pIn, inMask, flippedColors + 3, true, true);
    500 
    501     etc_compressed a, b;
    502     etc_encode_block_helper(pIn, inMask, colors, &a, false);
    503     etc_encode_block_helper(pIn, inMask, flippedColors, &b, true);
    504     take_best(&a, &b);
    505     writeBigEndian(pOut, a.high);
    506     writeBigEndian(pOut + 4, a.low);
    507 }
    508 
    509 // Return the size of the encoded image data (does not include size of PKM header).
    510 
    511 etc1_uint32 etc1_get_encoded_data_size(etc1_uint32 width, etc1_uint32 height) {
    512     return (((width + 3) & ~3) * ((height + 3) & ~3)) >> 1;
    513 }
    514 
    515 // Encode an entire image.
    516 // pIn - pointer to the image data. Formatted such that the Red component of
    517 //       pixel (x,y) is at pIn + pixelSize * x + stride * y + redOffset;
    518 // pOut - pointer to encoded data. Must be large enough to store entire encoded image.
    519 
    520 int etc1_encode_image(const etc1_byte* pIn, etc1_uint32 width, etc1_uint32 height,
    521         etc1_uint32 pixelSize, etc1_uint32 stride, etc1_byte* pOut) {
    522     if (pixelSize < 2 || pixelSize > 3) {
    523         return -1;
    524     }
    525     static const unsigned short kYMask[] = { 0x0, 0xf, 0xff, 0xfff, 0xffff };
    526     static const unsigned short kXMask[] = { 0x0, 0x1111, 0x3333, 0x7777,
    527             0xffff };
    528     etc1_byte block[ETC1_DECODED_BLOCK_SIZE];
    529     etc1_byte encoded[ETC1_ENCODED_BLOCK_SIZE];
    530 
    531     etc1_uint32 encodedWidth = (width + 3) & ~3;
    532     etc1_uint32 encodedHeight = (height + 3) & ~3;
    533 
    534     for (etc1_uint32 y = 0; y < encodedHeight; y += 4) {
    535         etc1_uint32 yEnd = height - y;
    536         if (yEnd > 4) {
    537             yEnd = 4;
    538         }
    539         int ymask = kYMask[yEnd];
    540         for (etc1_uint32 x = 0; x < encodedWidth; x += 4) {
    541             etc1_uint32 xEnd = width - x;
    542             if (xEnd > 4) {
    543                 xEnd = 4;
    544             }
    545             int mask = ymask & kXMask[xEnd];
    546             for (etc1_uint32 cy = 0; cy < yEnd; cy++) {
    547                 etc1_byte* q = block + (cy * 4) * 3;
    548                 const etc1_byte* p = pIn + pixelSize * x + stride * (y + cy);
    549                 if (pixelSize == 3) {
    550                     memcpy(q, p, xEnd * 3);
    551                 } else {
    552                     for (etc1_uint32 cx = 0; cx < xEnd; cx++) {
    553                         int pixel = (p[1] << 8) | p[0];
    554                         *q++ = convert5To8(pixel >> 11);
    555                         *q++ = convert6To8(pixel >> 5);
    556                         *q++ = convert5To8(pixel);
    557                         p += pixelSize;
    558                     }
    559                 }
    560             }
    561             etc1_encode_block(block, mask, encoded);
    562             memcpy(pOut, encoded, sizeof(encoded));
    563             pOut += sizeof(encoded);
    564         }
    565     }
    566     return 0;
    567 }
    568 
    569 // Decode an entire image.
    570 // pIn - pointer to encoded data.
    571 // pOut - pointer to the image data. Will be written such that the Red component of
    572 //       pixel (x,y) is at pIn + pixelSize * x + stride * y + redOffset. Must be
    573 //        large enough to store entire image.
    574 
    575 
    576 int etc1_decode_image(const etc1_byte* pIn, etc1_byte* pOut,
    577         etc1_uint32 width, etc1_uint32 height,
    578         etc1_uint32 pixelSize, etc1_uint32 stride) {
    579     if (pixelSize < 2 || pixelSize > 3) {
    580         return -1;
    581     }
    582     etc1_byte block[ETC1_DECODED_BLOCK_SIZE];
    583 
    584     etc1_uint32 encodedWidth = (width + 3) & ~3;
    585     etc1_uint32 encodedHeight = (height + 3) & ~3;
    586 
    587     for (etc1_uint32 y = 0; y < encodedHeight; y += 4) {
    588         etc1_uint32 yEnd = height - y;
    589         if (yEnd > 4) {
    590             yEnd = 4;
    591         }
    592         for (etc1_uint32 x = 0; x < encodedWidth; x += 4) {
    593             etc1_uint32 xEnd = width - x;
    594             if (xEnd > 4) {
    595                 xEnd = 4;
    596             }
    597             etc1_decode_block(pIn, block);
    598             pIn += ETC1_ENCODED_BLOCK_SIZE;
    599             for (etc1_uint32 cy = 0; cy < yEnd; cy++) {
    600                 const etc1_byte* q = block + (cy * 4) * 3;
    601                 etc1_byte* p = pOut + pixelSize * x + stride * (y + cy);
    602                 if (pixelSize == 3) {
    603                     memcpy(p, q, xEnd * 3);
    604                 } else {
    605                     for (etc1_uint32 cx = 0; cx < xEnd; cx++) {
    606                         etc1_byte r = *q++;
    607                         etc1_byte g = *q++;
    608                         etc1_byte b = *q++;
    609                         etc1_uint32 pixel = ((r >> 3) << 11) | ((g >> 2) << 5) | (b >> 3);
    610                         *p++ = (etc1_byte) pixel;
    611                         *p++ = (etc1_byte) (pixel >> 8);
    612                     }
    613                 }
    614             }
    615         }
    616     }
    617     return 0;
    618 }
    619 
    620 static const char kMagic[] = { 'P', 'K', 'M', ' ', '1', '0' };
    621 
    622 static const etc1_uint32 ETC1_PKM_FORMAT_OFFSET = 6;
    623 static const etc1_uint32 ETC1_PKM_ENCODED_WIDTH_OFFSET = 8;
    624 static const etc1_uint32 ETC1_PKM_ENCODED_HEIGHT_OFFSET = 10;
    625 static const etc1_uint32 ETC1_PKM_WIDTH_OFFSET = 12;
    626 static const etc1_uint32 ETC1_PKM_HEIGHT_OFFSET = 14;
    627 
    628 static const etc1_uint32 ETC1_RGB_NO_MIPMAPS = 0;
    629 
    630 static void writeBEUint16(etc1_byte* pOut, etc1_uint32 data) {
    631     pOut[0] = (etc1_byte) (data >> 8);
    632     pOut[1] = (etc1_byte) data;
    633 }
    634 
    635 static etc1_uint32 readBEUint16(const etc1_byte* pIn) {
    636     return (pIn[0] << 8) | pIn[1];
    637 }
    638 
    639 // Format a PKM header
    640 
    641 void etc1_pkm_format_header(etc1_byte* pHeader, etc1_uint32 width, etc1_uint32 height) {
    642     memcpy(pHeader, kMagic, sizeof(kMagic));
    643     etc1_uint32 encodedWidth = (width + 3) & ~3;
    644     etc1_uint32 encodedHeight = (height + 3) & ~3;
    645     writeBEUint16(pHeader + ETC1_PKM_FORMAT_OFFSET, ETC1_RGB_NO_MIPMAPS);
    646     writeBEUint16(pHeader + ETC1_PKM_ENCODED_WIDTH_OFFSET, encodedWidth);
    647     writeBEUint16(pHeader + ETC1_PKM_ENCODED_HEIGHT_OFFSET, encodedHeight);
    648     writeBEUint16(pHeader + ETC1_PKM_WIDTH_OFFSET, width);
    649     writeBEUint16(pHeader + ETC1_PKM_HEIGHT_OFFSET, height);
    650 }
    651 
    652 // Check if a PKM header is correctly formatted.
    653 
    654 etc1_bool etc1_pkm_is_valid(const etc1_byte* pHeader) {
    655     if (memcmp(pHeader, kMagic, sizeof(kMagic))) {
    656         return false;
    657     }
    658     etc1_uint32 format = readBEUint16(pHeader + ETC1_PKM_FORMAT_OFFSET);
    659     etc1_uint32 encodedWidth = readBEUint16(pHeader + ETC1_PKM_ENCODED_WIDTH_OFFSET);
    660     etc1_uint32 encodedHeight = readBEUint16(pHeader + ETC1_PKM_ENCODED_HEIGHT_OFFSET);
    661     etc1_uint32 width = readBEUint16(pHeader + ETC1_PKM_WIDTH_OFFSET);
    662     etc1_uint32 height = readBEUint16(pHeader + ETC1_PKM_HEIGHT_OFFSET);
    663     return format == ETC1_RGB_NO_MIPMAPS &&
    664             encodedWidth >= width && encodedWidth - width < 4 &&
    665             encodedHeight >= height && encodedHeight - height < 4;
    666 }
    667 
    668 // Read the image width from a PKM header
    669 
    670 etc1_uint32 etc1_pkm_get_width(const etc1_byte* pHeader) {
    671     return readBEUint16(pHeader + ETC1_PKM_WIDTH_OFFSET);
    672 }
    673 
    674 // Read the image height from a PKM header
    675 
    676 etc1_uint32 etc1_pkm_get_height(const etc1_byte* pHeader){
    677     return readBEUint16(pHeader + ETC1_PKM_HEIGHT_OFFSET);
    678 }
    679