Blame - third_party/etc1/etc1.cpp - platform/external/skqp

blob: 421ebfebc5a4aca71cc6c78fca2f131e00b4ad70 [file] [log] [blame]

robertphillips@google.com	8cf81e0	2014-05-22 18:40:29 +0000	[diff] [blame]	1	// Copyright 2009 Google Inc.
				2	//
				3	// Licensed under the Apache License, Version 2.0 (the "License");
				4	// you may not use this file except in compliance with the License.
				5	// You may obtain a copy of the License at
				6	//
				7	// http://www.apache.org/licenses/LICENSE-2.0
				8	//
				9	// Unless required by applicable law or agreed to in writing, software
				10	// distributed under the License is distributed on an "AS IS" BASIS,
				11	// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
				12	// See the License for the specific language governing permissions and
				13	// limitations under the License.
				14
				15	//////////////////////////////////////////////////////////////////////////////////////////
				16
				17	// This is a fork of the AOSP project ETC1 codec. The original code can be found
				18	// at the following web site:
				19	// https://android.googlesource.com/platform/frameworks/native/+/master/opengl/include/ETC1/
				20
				21	//////////////////////////////////////////////////////////////////////////////////////////
				22
				23	#include "etc1.h"
				24
				25	#include <cstring>
				26
				27	/* From http://www.khronos.org/registry/gles/extensions/OES/OES_compressed_ETC1_RGB8_texture.txt
				28
				29	The number of bits that represent a 4x4 texel block is 64 bits if
				30	<internalformat> is given by ETC1_RGB8_OES.
				31
				32	The data for a block is a number of bytes,
				33
				34	{q0, q1, q2, q3, q4, q5, q6, q7}
				35
				36	where byte q0 is located at the lowest memory address and q7 at
				37	the highest. The 64 bits specifying the block is then represented
				38	by the following 64 bit integer:
				39
				40	int64bit = 256(256(256(256(256(256(256*q0+q1)+q2)+q3)+q4)+q5)+q6)+q7;
				41
				42	ETC1_RGB8_OES:
				43
				44	a) bit layout in bits 63 through 32 if diffbit = 0
				45
				46	63 62 61 60 59 58 57 56 55 54 53 52 51 50 49 48
				47	-----------------------------------------------
				48	\| base col1 \| base col2 \| base col1 \| base col2 \|
				49	\| R1 (4bits)\| R2 (4bits)\| G1 (4bits)\| G2 (4bits)\|
				50	-----------------------------------------------
				51
				52	47 46 45 44 43 42 41 40 39 38 37 36 35 34 33 32
				53	---------------------------------------------------
				54	\| base col1 \| base col2 \| table \| table \|diff\|flip\|
				55	\| B1 (4bits)\| B2 (4bits)\| cw 1 \| cw 2 \|bit \|bit \|
				56	---------------------------------------------------
				57
				58
				59	b) bit layout in bits 63 through 32 if diffbit = 1
				60
				61	63 62 61 60 59 58 57 56 55 54 53 52 51 50 49 48
				62	-----------------------------------------------
				63	\| base col1 \| dcol 2 \| base col1 \| dcol 2 \|
				64	\| R1' (5 bits) \| dR2 \| G1' (5 bits) \| dG2 \|
				65	-----------------------------------------------
				66
				67	47 46 45 44 43 42 41 40 39 38 37 36 35 34 33 32
				68	---------------------------------------------------
				69	\| base col 1 \| dcol 2 \| table \| table \|diff\|flip\|
				70	\| B1' (5 bits) \| dB2 \| cw 1 \| cw 2 \|bit \|bit \|
				71	---------------------------------------------------
				72
				73
				74	c) bit layout in bits 31 through 0 (in both cases)
				75
				76	31 30 29 28 27 26 25 24 23 22 21 20 19 18 17 16
				77	-----------------------------------------------
				78	\| most significant pixel index bits \|
				79	\| p\| o\| n\| m\| l\| k\| j\| i\| h\| g\| f\| e\| d\| c\| b\| a\|
				80	-----------------------------------------------
				81
				82	15 14 13 12 11 10 9 8 7 6 5 4 3 2 1 0
				83	--------------------------------------------------
				84	\| least significant pixel index bits \|
				85	\| p\| o\| n\| m\| l\| k\| j\| i\| h\| g\| f\| e\| d\| c \| b \| a \|
				86	--------------------------------------------------
				87
				88
				89	Add table 3.17.2: Intensity modifier sets for ETC1 compressed textures:
				90
				91	table codeword modifier table
				92	------------------ ----------------------
				93	0 -8 -2 2 8
				94	1 -17 -5 5 17
				95	2 -29 -9 9 29
				96	3 -42 -13 13 42
				97	4 -60 -18 18 60
				98	5 -80 -24 24 80
				99	6 -106 -33 33 106
				100	7 -183 -47 47 183
				101
				102
				103	Add table 3.17.3 Mapping from pixel index values to modifier values for
				104	ETC1 compressed textures:
				105
				106	pixel index value
				107	---------------
				108	msb lsb resulting modifier value
				109	----- ----- -------------------------
				110	1 1 -b (large negative value)
				111	1 0 -a (small negative value)
				112	0 0 a (small positive value)
				113	0 1 b (large positive value)
				114
				115
				116	*/
				117
				118	static const int kModifierTable[] = {
				119	/* 0 */2, 8, -2, -8,
				120	/* 1 */5, 17, -5, -17,
				121	/* 2 */9, 29, -9, -29,
				122	/* 3 */13, 42, -13, -42,
				123	/* 4 */18, 60, -18, -60,
				124	/* 5 */24, 80, -24, -80,
				125	/* 6 */33, 106, -33, -106,
				126	/* 7 */47, 183, -47, -183 };
				127
				128	static const int kLookup[8] = { 0, 1, 2, 3, -4, -3, -2, -1 };
				129
				130	static inline etc1_byte clamp(int x) {
				131	return (etc1_byte) (x >= 0 ? (x < 255 ? x : 255) : 0);
				132	}
				133
				134	static
				135	inline int convert4To8(int b) {
				136	int c = b & 0xf;
				137	return (c << 4) \| c;
				138	}
				139
				140	static
				141	inline int convert5To8(int b) {
				142	int c = b & 0x1f;
				143	return (c << 3) \| (c >> 2);
				144	}
				145
				146	static
				147	inline int convert6To8(int b) {
				148	int c = b & 0x3f;
				149	return (c << 2) \| (c >> 4);
				150	}
				151
				152	static
				153	inline int divideBy255(int d) {
				154	return (d + 128 + (d >> 8)) >> 8;
				155	}
				156
				157	static
				158	inline int convert8To4(int b) {
				159	int c = b & 0xff;
				160	return divideBy255(c * 15);
				161	}
				162
				163	static
				164	inline int convert8To5(int b) {
				165	int c = b & 0xff;
				166	return divideBy255(c * 31);
				167	}
				168
				169	static
				170	inline int convertDiff(int base, int diff) {
				171	return convert5To8((0x1f & base) + kLookup[0x7 & diff]);
				172	}
				173
				174	static
				175	void decode_subblock(etc1_byte* pOut, int r, int g, int b, const int* table,
				176	etc1_uint32 low, bool second, bool flipped) {
				177	int baseX = 0;
				178	int baseY = 0;
				179	if (second) {
				180	if (flipped) {
				181	baseY = 2;
				182	} else {
				183	baseX = 2;
				184	}
				185	}
				186	for (int i = 0; i < 8; i++) {
				187	int x, y;
				188	if (flipped) {
				189	x = baseX + (i >> 1);
				190	y = baseY + (i & 1);
				191	} else {
				192	x = baseX + (i >> 2);
				193	y = baseY + (i & 3);
				194	}
				195	int k = y + (x * 4);
				196	int offset = ((low >> k) & 1) \| ((low >> (k + 15)) & 2);
				197	int delta = table[offset];
				198	etc1_byte* q = pOut + 3 * (x + 4 * y);
				199	*q++ = clamp(r + delta);
				200	*q++ = clamp(g + delta);
				201	*q++ = clamp(b + delta);
				202	}
				203	}
				204
				205	// Input is an ETC1 compressed version of the data.
				206	// Output is a 4 x 4 square of 3-byte pixels in form R, G, B
				207
				208	void etc1_decode_block(const etc1_byte* pIn, etc1_byte* pOut) {
				209	etc1_uint32 high = (pIn[0] << 24) \| (pIn[1] << 16) \| (pIn[2] << 8) \| pIn[3];
				210	etc1_uint32 low = (pIn[4] << 24) \| (pIn[5] << 16) \| (pIn[6] << 8) \| pIn[7];
				211	int r1, r2, g1, g2, b1, b2;
				212	if (high & 2) {
				213	// differential
				214	int rBase = high >> 27;
				215	int gBase = high >> 19;
				216	int bBase = high >> 11;
				217	r1 = convert5To8(rBase);
				218	r2 = convertDiff(rBase, high >> 24);
				219	g1 = convert5To8(gBase);
				220	g2 = convertDiff(gBase, high >> 16);
				221	b1 = convert5To8(bBase);
				222	b2 = convertDiff(bBase, high >> 8);
				223	} else {
				224	// not differential
				225	r1 = convert4To8(high >> 28);
				226	r2 = convert4To8(high >> 24);
				227	g1 = convert4To8(high >> 20);
				228	g2 = convert4To8(high >> 16);
				229	b1 = convert4To8(high >> 12);
				230	b2 = convert4To8(high >> 8);
				231	}
				232	int tableIndexA = 7 & (high >> 5);
				233	int tableIndexB = 7 & (high >> 2);
				234	const int* tableA = kModifierTable + tableIndexA * 4;
				235	const int* tableB = kModifierTable + tableIndexB * 4;
				236	bool flipped = (high & 1) != 0;
				237	decode_subblock(pOut, r1, g1, b1, tableA, low, false, flipped);
				238	decode_subblock(pOut, r2, g2, b2, tableB, low, true, flipped);
				239	}
				240
				241	typedef struct {
				242	etc1_uint32 high;
				243	etc1_uint32 low;
				244	etc1_uint32 score; // Lower is more accurate
				245	} etc_compressed;
				246
				247	static
				248	inline void take_best(etc_compressed* a, const etc_compressed* b) {
				249	if (a->score > b->score) {
				250	a = b;
				251	}
				252	}
				253
				254	static
				255	void etc_average_colors_subblock(const etc1_byte* pIn, etc1_uint32 inMask,
				256	etc1_byte* pColors, bool flipped, bool second) {
				257	int r = 0;
				258	int g = 0;
				259	int b = 0;
				260
				261	if (flipped) {
				262	int by = 0;
				263	if (second) {
				264	by = 2;
				265	}
				266	for (int y = 0; y < 2; y++) {
				267	int yy = by + y;
				268	for (int x = 0; x < 4; x++) {
				269	int i = x + 4 * yy;
				270	if (inMask & (1 << i)) {
				271	const etc1_byte* p = pIn + i * 3;
				272	r += *(p++);
				273	g += *(p++);
				274	b += *(p++);
				275	}
				276	}
				277	}
				278	} else {
				279	int bx = 0;
				280	if (second) {
				281	bx = 2;
				282	}
				283	for (int y = 0; y < 4; y++) {
				284	for (int x = 0; x < 2; x++) {
				285	int xx = bx + x;
				286	int i = xx + 4 * y;
				287	if (inMask & (1 << i)) {
				288	const etc1_byte* p = pIn + i * 3;
				289	r += *(p++);
				290	g += *(p++);
				291	b += *(p++);
				292	}
				293	}
				294	}
				295	}
				296	pColors[0] = (etc1_byte)((r + 4) >> 3);
				297	pColors[1] = (etc1_byte)((g + 4) >> 3);
				298	pColors[2] = (etc1_byte)((b + 4) >> 3);
				299	}
				300
				301	static
				302	inline int square(int x) {
				303	return x * x;
				304	}
				305
				306	static etc1_uint32 chooseModifier(const etc1_byte* pBaseColors,
				307	const etc1_byte* pIn, etc1_uint32 *pLow, int bitIndex,
				308	const int* pModifierTable) {
				309	etc1_uint32 bestScore = ~0;
				310	int bestIndex = 0;
				311	int pixelR = pIn[0];
				312	int pixelG = pIn[1];
				313	int pixelB = pIn[2];
				314	int r = pBaseColors[0];
				315	int g = pBaseColors[1];
				316	int b = pBaseColors[2];
				317	for (int i = 0; i < 4; i++) {
				318	int modifier = pModifierTable[i];
				319	int decodedG = clamp(g + modifier);
				320	etc1_uint32 score = (etc1_uint32) (6 * square(decodedG - pixelG));
				321	if (score >= bestScore) {
				322	continue;
				323	}
				324	int decodedR = clamp(r + modifier);
				325	score += (etc1_uint32) (3 * square(decodedR - pixelR));
				326	if (score >= bestScore) {
				327	continue;
				328	}
				329	int decodedB = clamp(b + modifier);
				330	score += (etc1_uint32) square(decodedB - pixelB);
				331	if (score < bestScore) {
				332	bestScore = score;
				333	bestIndex = i;
				334	}
				335	}
				336	etc1_uint32 lowMask = (((bestIndex >> 1) << 16) \| (bestIndex & 1))
				337	<< bitIndex;
				338	*pLow \|= lowMask;
				339	return bestScore;
				340	}
				341
				342	static
				343	void etc_encode_subblock_helper(const etc1_byte* pIn, etc1_uint32 inMask,
				344	etc_compressed* pCompressed, bool flipped, bool second,
				345	const etc1_byte* pBaseColors, const int* pModifierTable) {
				346	int score = pCompressed->score;
				347	if (flipped) {
				348	int by = 0;
				349	if (second) {
				350	by = 2;
				351	}
				352	for (int y = 0; y < 2; y++) {
				353	int yy = by + y;
				354	for (int x = 0; x < 4; x++) {
				355	int i = x + 4 * yy;
				356	if (inMask & (1 << i)) {
				357	score += chooseModifier(pBaseColors, pIn + i * 3,
				358	&pCompressed->low, yy + x * 4, pModifierTable);
				359	}
				360	}
				361	}
				362	} else {
				363	int bx = 0;
				364	if (second) {
				365	bx = 2;
				366	}
				367	for (int y = 0; y < 4; y++) {
				368	for (int x = 0; x < 2; x++) {
				369	int xx = bx + x;
				370	int i = xx + 4 * y;
				371	if (inMask & (1 << i)) {
				372	score += chooseModifier(pBaseColors, pIn + i * 3,
				373	&pCompressed->low, y + xx * 4, pModifierTable);
				374	}
				375	}
				376	}
				377	}
				378	pCompressed->score = score;
				379	}
				380
				381	static bool inRange4bitSigned(int color) {
				382	return color >= -4 && color <= 3;
				383	}
				384
				385	static void etc_encodeBaseColors(etc1_byte* pBaseColors,
				386	const etc1_byte* pColors, etc_compressed* pCompressed) {
				387	int r1, g1, b1, r2, g2, b2; // 8 bit base colors for sub-blocks
				388	bool differential;
				389	{
				390	int r51 = convert8To5(pColors[0]);
				391	int g51 = convert8To5(pColors[1]);
				392	int b51 = convert8To5(pColors[2]);
				393	int r52 = convert8To5(pColors[3]);
				394	int g52 = convert8To5(pColors[4]);
				395	int b52 = convert8To5(pColors[5]);
				396
				397	r1 = convert5To8(r51);
				398	g1 = convert5To8(g51);
				399	b1 = convert5To8(b51);
				400
				401	int dr = r52 - r51;
				402	int dg = g52 - g51;
				403	int db = b52 - b51;
				404
				405	differential = inRange4bitSigned(dr) && inRange4bitSigned(dg)
				406	&& inRange4bitSigned(db);
				407	if (differential) {
				408	r2 = convert5To8(r51 + dr);
				409	g2 = convert5To8(g51 + dg);
				410	b2 = convert5To8(b51 + db);
				411	pCompressed->high \|= (r51 << 27) \| ((7 & dr) << 24) \| (g51 << 19)
				412	\| ((7 & dg) << 16) \| (b51 << 11) \| ((7 & db) << 8) \| 2;
				413	}
				414	}
				415
				416	if (!differential) {
				417	int r41 = convert8To4(pColors[0]);
				418	int g41 = convert8To4(pColors[1]);
				419	int b41 = convert8To4(pColors[2]);
				420	int r42 = convert8To4(pColors[3]);
				421	int g42 = convert8To4(pColors[4]);
				422	int b42 = convert8To4(pColors[5]);
				423	r1 = convert4To8(r41);
				424	g1 = convert4To8(g41);
				425	b1 = convert4To8(b41);
				426	r2 = convert4To8(r42);
				427	g2 = convert4To8(g42);
				428	b2 = convert4To8(b42);
				429	pCompressed->high \|= (r41 << 28) \| (r42 << 24) \| (g41 << 20) \| (g42
				430	<< 16) \| (b41 << 12) \| (b42 << 8);
				431	}
				432	pBaseColors[0] = r1;
				433	pBaseColors[1] = g1;
				434	pBaseColors[2] = b1;
				435	pBaseColors[3] = r2;
				436	pBaseColors[4] = g2;
				437	pBaseColors[5] = b2;
				438	}
				439
				440	static
				441	void etc_encode_block_helper(const etc1_byte* pIn, etc1_uint32 inMask,
				442	const etc1_byte* pColors, etc_compressed* pCompressed, bool flipped) {
				443	pCompressed->score = ~0;
				444	pCompressed->high = (flipped ? 1 : 0);
				445	pCompressed->low = 0;
				446
				447	etc1_byte pBaseColors[6];
				448
				449	etc_encodeBaseColors(pBaseColors, pColors, pCompressed);
				450
				451	int originalHigh = pCompressed->high;
				452
				453	const int* pModifierTable = kModifierTable;
				454	for (int i = 0; i < 8; i++, pModifierTable += 4) {
				455	etc_compressed temp;
				456	temp.score = 0;
				457	temp.high = originalHigh \| (i << 5);
				458	temp.low = 0;
				459	etc_encode_subblock_helper(pIn, inMask, &temp, flipped, false,
				460	pBaseColors, pModifierTable);
				461	take_best(pCompressed, &temp);
				462	}
				463	pModifierTable = kModifierTable;
				464	etc_compressed firstHalf = *pCompressed;
				465	for (int i = 0; i < 8; i++, pModifierTable += 4) {
				466	etc_compressed temp;
				467	temp.score = firstHalf.score;
				468	temp.high = firstHalf.high \| (i << 2);
				469	temp.low = firstHalf.low;
				470	etc_encode_subblock_helper(pIn, inMask, &temp, flipped, true,
				471	pBaseColors + 3, pModifierTable);
				472	if (i == 0) {
				473	*pCompressed = temp;
				474	} else {
				475	take_best(pCompressed, &temp);
				476	}
				477	}
				478	}
				479
				480	static void writeBigEndian(etc1_byte* pOut, etc1_uint32 d) {
				481	pOut[0] = (etc1_byte)(d >> 24);
				482	pOut[1] = (etc1_byte)(d >> 16);
				483	pOut[2] = (etc1_byte)(d >> 8);
				484	pOut[3] = (etc1_byte) d;
				485	}
				486
				487	// Input is a 4 x 4 square of 3-byte pixels in form R, G, B
				488	// inmask is a 16-bit mask where bit (1 << (x + y * 4)) tells whether the corresponding (x,y)
				489	// pixel is valid or not. Invalid pixel color values are ignored when compressing.
				490	// Output is an ETC1 compressed version of the data.
				491
				492	void etc1_encode_block(const etc1_byte* pIn, etc1_uint32 inMask,
				493	etc1_byte* pOut) {
				494	etc1_byte colors[6];
				495	etc1_byte flippedColors[6];
				496	etc_average_colors_subblock(pIn, inMask, colors, false, false);
				497	etc_average_colors_subblock(pIn, inMask, colors + 3, false, true);
				498	etc_average_colors_subblock(pIn, inMask, flippedColors, true, false);
				499	etc_average_colors_subblock(pIn, inMask, flippedColors + 3, true, true);
				500
				501	etc_compressed a, b;
				502	etc_encode_block_helper(pIn, inMask, colors, &a, false);
				503	etc_encode_block_helper(pIn, inMask, flippedColors, &b, true);
				504	take_best(&a, &b);
				505	writeBigEndian(pOut, a.high);
				506	writeBigEndian(pOut + 4, a.low);
				507	}
				508
				509	// Return the size of the encoded image data (does not include size of PKM header).
				510
				511	etc1_uint32 etc1_get_encoded_data_size(etc1_uint32 width, etc1_uint32 height) {
				512	return (((width + 3) & ~3) * ((height + 3) & ~3)) >> 1;
				513	}
				514
				515	// Encode an entire image.
				516	// pIn - pointer to the image data. Formatted such that the Red component of
				517	// pixel (x,y) is at pIn + pixelSize * x + stride * y + redOffset;
				518	// pOut - pointer to encoded data. Must be large enough to store entire encoded image.
				519
				520	int etc1_encode_image(const etc1_byte* pIn, etc1_uint32 width, etc1_uint32 height,
				521	etc1_uint32 pixelSize, etc1_uint32 stride, etc1_byte* pOut) {
				522	if (pixelSize < 2 \|\| pixelSize > 3) {
				523	return -1;
				524	}
				525	static const unsigned short kYMask[] = { 0x0, 0xf, 0xff, 0xfff, 0xffff };
				526	static const unsigned short kXMask[] = { 0x0, 0x1111, 0x3333, 0x7777,
				527	0xffff };
				528	etc1_byte block[ETC1_DECODED_BLOCK_SIZE];
				529	etc1_byte encoded[ETC1_ENCODED_BLOCK_SIZE];
				530
				531	etc1_uint32 encodedWidth = (width + 3) & ~3;
				532	etc1_uint32 encodedHeight = (height + 3) & ~3;
				533
				534	for (etc1_uint32 y = 0; y < encodedHeight; y += 4) {
				535	etc1_uint32 yEnd = height - y;
				536	if (yEnd > 4) {
				537	yEnd = 4;
				538	}
				539	int ymask = kYMask[yEnd];
				540	for (etc1_uint32 x = 0; x < encodedWidth; x += 4) {
				541	etc1_uint32 xEnd = width - x;
				542	if (xEnd > 4) {
				543	xEnd = 4;
				544	}
				545	int mask = ymask & kXMask[xEnd];
				546	for (etc1_uint32 cy = 0; cy < yEnd; cy++) {
				547	etc1_byte* q = block + (cy * 4) * 3;
				548	const etc1_byte* p = pIn + pixelSize * x + stride * (y + cy);
				549	if (pixelSize == 3) {
				550	memcpy(q, p, xEnd * 3);
				551	} else {
				552	for (etc1_uint32 cx = 0; cx < xEnd; cx++) {
				553	int pixel = (p[1] << 8) \| p[0];
				554	*q++ = convert5To8(pixel >> 11);
				555	*q++ = convert6To8(pixel >> 5);
				556	*q++ = convert5To8(pixel);
				557	p += pixelSize;
				558	}
				559	}
				560	}
				561	etc1_encode_block(block, mask, encoded);
				562	memcpy(pOut, encoded, sizeof(encoded));
				563	pOut += sizeof(encoded);
				564	}
				565	}
				566	return 0;
				567	}
				568
				569	// Decode an entire image.
				570	// pIn - pointer to encoded data.
				571	// pOut - pointer to the image data. Will be written such that the Red component of
				572	// pixel (x,y) is at pIn + pixelSize * x + stride * y + redOffset. Must be
				573	// large enough to store entire image.
				574
				575
				576	int etc1_decode_image(const etc1_byte* pIn, etc1_byte* pOut,
				577	etc1_uint32 width, etc1_uint32 height,
				578	etc1_uint32 pixelSize, etc1_uint32 stride) {
				579	if (pixelSize < 2 \|\| pixelSize > 3) {
				580	return -1;
				581	}
				582	etc1_byte block[ETC1_DECODED_BLOCK_SIZE];
				583
				584	etc1_uint32 encodedWidth = (width + 3) & ~3;
				585	etc1_uint32 encodedHeight = (height + 3) & ~3;
				586
				587	for (etc1_uint32 y = 0; y < encodedHeight; y += 4) {
				588	etc1_uint32 yEnd = height - y;
				589	if (yEnd > 4) {
				590	yEnd = 4;
				591	}
				592	for (etc1_uint32 x = 0; x < encodedWidth; x += 4) {
				593	etc1_uint32 xEnd = width - x;
				594	if (xEnd > 4) {
				595	xEnd = 4;
				596	}
				597	etc1_decode_block(pIn, block);
				598	pIn += ETC1_ENCODED_BLOCK_SIZE;
				599	for (etc1_uint32 cy = 0; cy < yEnd; cy++) {
				600	const etc1_byte* q = block + (cy * 4) * 3;
				601	etc1_byte* p = pOut + pixelSize * x + stride * (y + cy);
				602	if (pixelSize == 3) {
				603	memcpy(p, q, xEnd * 3);
				604	} else {
				605	for (etc1_uint32 cx = 0; cx < xEnd; cx++) {
				606	etc1_byte r = *q++;
				607	etc1_byte g = *q++;
				608	etc1_byte b = *q++;
				609	etc1_uint32 pixel = ((r >> 3) << 11) \| ((g >> 2) << 5) \| (b >> 3);
				610	*p++ = (etc1_byte) pixel;
				611	*p++ = (etc1_byte) (pixel >> 8);
				612	}
				613	}
				614	}
				615	}
				616	}
				617	return 0;
				618	}
				619
				620	static const char kMagic[] = { 'P', 'K', 'M', ' ', '1', '0' };
				621
				622	static const etc1_uint32 ETC1_PKM_FORMAT_OFFSET = 6;
				623	static const etc1_uint32 ETC1_PKM_ENCODED_WIDTH_OFFSET = 8;
				624	static const etc1_uint32 ETC1_PKM_ENCODED_HEIGHT_OFFSET = 10;
				625	static const etc1_uint32 ETC1_PKM_WIDTH_OFFSET = 12;
				626	static const etc1_uint32 ETC1_PKM_HEIGHT_OFFSET = 14;
				627
				628	static const etc1_uint32 ETC1_RGB_NO_MIPMAPS = 0;
				629
				630	static void writeBEUint16(etc1_byte* pOut, etc1_uint32 data) {
				631	pOut[0] = (etc1_byte) (data >> 8);
				632	pOut[1] = (etc1_byte) data;
				633	}
				634
				635	static etc1_uint32 readBEUint16(const etc1_byte* pIn) {
				636	return (pIn[0] << 8) \| pIn[1];
				637	}
				638
				639	// Format a PKM header
				640
				641	void etc1_pkm_format_header(etc1_byte* pHeader, etc1_uint32 width, etc1_uint32 height) {
				642	memcpy(pHeader, kMagic, sizeof(kMagic));
				643	etc1_uint32 encodedWidth = (width + 3) & ~3;
				644	etc1_uint32 encodedHeight = (height + 3) & ~3;
				645	writeBEUint16(pHeader + ETC1_PKM_FORMAT_OFFSET, ETC1_RGB_NO_MIPMAPS);
				646	writeBEUint16(pHeader + ETC1_PKM_ENCODED_WIDTH_OFFSET, encodedWidth);
				647	writeBEUint16(pHeader + ETC1_PKM_ENCODED_HEIGHT_OFFSET, encodedHeight);
				648	writeBEUint16(pHeader + ETC1_PKM_WIDTH_OFFSET, width);
				649	writeBEUint16(pHeader + ETC1_PKM_HEIGHT_OFFSET, height);
				650	}
				651
				652	// Check if a PKM header is correctly formatted.
				653
				654	etc1_bool etc1_pkm_is_valid(const etc1_byte* pHeader) {
				655	if (memcmp(pHeader, kMagic, sizeof(kMagic))) {
				656	return false;
				657	}
				658	etc1_uint32 format = readBEUint16(pHeader + ETC1_PKM_FORMAT_OFFSET);
				659	etc1_uint32 encodedWidth = readBEUint16(pHeader + ETC1_PKM_ENCODED_WIDTH_OFFSET);
				660	etc1_uint32 encodedHeight = readBEUint16(pHeader + ETC1_PKM_ENCODED_HEIGHT_OFFSET);
				661	etc1_uint32 width = readBEUint16(pHeader + ETC1_PKM_WIDTH_OFFSET);
				662	etc1_uint32 height = readBEUint16(pHeader + ETC1_PKM_HEIGHT_OFFSET);
				663	return format == ETC1_RGB_NO_MIPMAPS &&
				664	encodedWidth >= width && encodedWidth - width < 4 &&
				665	encodedHeight >= height && encodedHeight - height < 4;
				666	}
				667
				668	// Read the image width from a PKM header
				669
				670	etc1_uint32 etc1_pkm_get_width(const etc1_byte* pHeader) {
				671	return readBEUint16(pHeader + ETC1_PKM_WIDTH_OFFSET);
				672	}
				673
				674	// Read the image height from a PKM header
				675
				676	etc1_uint32 etc1_pkm_get_height(const etc1_byte* pHeader){
				677	return readBEUint16(pHeader + ETC1_PKM_HEIGHT_OFFSET);
				678	}