Blame - src/compiler/translator/EmulatePrecision.cpp - platform/external/angle

blob: a4cb028a7f4140d3fe008d354bf6ddcd96bd9287 [file] [log] [blame]

Olli Etuaho	853dc1a	2014-11-06 17:25:48 +0200	[diff] [blame]	1	//
				2	// Copyright (c) 2002-2014 The ANGLE Project Authors. All rights reserved.
				3	// Use of this source code is governed by a BSD-style license that can be
				4	// found in the LICENSE file.
				5	//
				6
				7	#include "compiler/translator/EmulatePrecision.h"
				8
				9	namespace
				10	{
				11
				12	static void writeVectorPrecisionEmulationHelpers(
				13	TInfoSinkBase& sink, ShShaderOutput outputLanguage, unsigned int size)
				14	{
				15	std::stringstream vecTypeStrStr;
				16	if (outputLanguage == SH_ESSL_OUTPUT)
				17	vecTypeStrStr << "highp ";
				18	vecTypeStrStr << "vec" << size;
				19	std::string vecType = vecTypeStrStr.str();
				20
				21	sink <<
				22	vecType << " angle_frm(in " << vecType << " v) {\n"
				23	" v = clamp(v, -65504.0, 65504.0);\n"
				24	" " << vecType << " exponent = floor(log2(abs(v) + 1e-30)) - 10.0;\n"
				25	" bvec" << size << " isNonZero = greaterThanEqual(exponent, vec" << size << "(-25.0));\n"
				26	" v = v * exp2(-exponent);\n"
				27	" v = sign(v) * floor(abs(v));\n"
				28	" return v * exp2(exponent) * vec" << size << "(isNonZero);\n"
				29	"}\n";
				30
				31	sink <<
				32	vecType << " angle_frl(in " << vecType << " v) {\n"
				33	" v = clamp(v, -2.0, 2.0);\n"
				34	" v = v * 256.0;\n"
				35	" v = sign(v) * floor(abs(v));\n"
				36	" return v * 0.00390625;\n"
				37	"}\n";
				38	}
				39
				40	static void writeMatrixPrecisionEmulationHelper(
				41	TInfoSinkBase& sink, ShShaderOutput outputLanguage, unsigned int size, const char *functionName)
				42	{
				43	std::stringstream matTypeStrStr;
				44	if (outputLanguage == SH_ESSL_OUTPUT)
				45	matTypeStrStr << "highp ";
				46	matTypeStrStr << "mat" << size;
				47	std::string matType = matTypeStrStr.str();
				48
				49	sink << matType << " " << functionName << "(in " << matType << " m) {\n"
				50	" " << matType << " rounded;\n";
				51
				52	for (unsigned int i = 0; i < size; ++i)
				53	{
				54	sink << " rounded[" << i << "] = " << functionName << "(m[" << i << "]);\n";
				55	}
				56
				57	sink << " return rounded;\n"
				58	"}\n";
				59	}
				60
				61	static void writeCommonPrecisionEmulationHelpers(TInfoSinkBase& sink, ShShaderOutput outputLanguage)
				62	{
				63	// Write the angle_frm functions that round floating point numbers to
				64	// half precision, and angle_frl functions that round them to minimum lowp
				65	// precision.
				66
				67	// Unoptimized version of angle_frm for single floats:
				68	//
				69	// int webgl_maxNormalExponent(in int exponentBits) {
				70	// int possibleExponents = int(exp2(float(exponentBits)));
				71	// int exponentBias = possibleExponents / 2 - 1;
				72	// int allExponentBitsOne = possibleExponents - 1;
				73	// return (allExponentBitsOne - 1) - exponentBias;
				74	// }
				75	//
				76	// float angle_frm(in float x) {
				77	// int mantissaBits = 10;
				78	// int exponentBits = 5;
				79	// float possibleMantissas = exp2(float(mantissaBits));
				80	// float mantissaMax = 2.0 - 1.0 / possibleMantissas;
				81	// int maxNE = webgl_maxNormalExponent(exponentBits);
				82	// float max = exp2(float(maxNE)) * mantissaMax;
				83	// if (x > max) {
				84	// return max;
				85	// }
				86	// if (x < -max) {
				87	// return -max;
				88	// }
				89	// float exponent = floor(log2(abs(x)));
				90	// if (abs(x) == 0.0 \|\| exponent < -float(maxNE)) {
				91	// return 0.0 * sign(x)
				92	// }
				93	// x = x * exp2(-(exponent - float(mantissaBits)));
				94	// x = sign(x) * floor(abs(x));
				95	// return x * exp2(exponent - float(mantissaBits));
				96	// }
				97
				98	// All numbers with a magnitude less than 2^-15 are subnormal, and are
				99	// flushed to zero.
				100
				101	// Note the constant numbers below:
				102	// a) 65504 is the maximum possible mantissa (1.1111111111 in binary) times
				103	// 2^15, the maximum normal exponent.
				104	// b) 10.0 is the number of mantissa bits.
				105	// c) -25.0 is the minimum normal half-float exponent -15.0 minus the number
				106	// of mantissa bits.
				107	// d) + 1e-30 is to make sure the argument of log2() won't be zero. It can
				108	// only affect the result of log2 on x where abs(x) < 1e-22. Since these
				109	// numbers will be flushed to zero either way (2^-15 is the smallest
				110	// normal positive number), this does not introduce any error.
				111
				112	std::string floatType = "float";
				113	if (outputLanguage == SH_ESSL_OUTPUT)
				114	floatType = "highp float";
				115
				116	sink <<
				117	floatType << " angle_frm(in " << floatType << " x) {\n"
				118	" x = clamp(x, -65504.0, 65504.0);\n"
				119	" " << floatType << " exponent = floor(log2(abs(x) + 1e-30)) - 10.0;\n"
				120	" bool isNonZero = (exponent >= -25.0);\n"
				121	" x = x * exp2(-exponent);\n"
				122	" x = sign(x) * floor(abs(x));\n"
				123	" return x * exp2(exponent) * float(isNonZero);\n"
				124	"}\n";
				125
				126	sink <<
				127	floatType << " angle_frl(in " << floatType << " x) {\n"
				128	" x = clamp(x, -2.0, 2.0);\n"
				129	" x = x * 256.0;\n"
				130	" x = sign(x) * floor(abs(x));\n"
				131	" return x * 0.00390625;\n"
				132	"}\n";
				133
				134	writeVectorPrecisionEmulationHelpers(sink, outputLanguage, 2);
				135	writeVectorPrecisionEmulationHelpers(sink, outputLanguage, 3);
				136	writeVectorPrecisionEmulationHelpers(sink, outputLanguage, 4);
				137	for (unsigned int size = 2; size <= 4; ++size)
				138	{
				139	writeMatrixPrecisionEmulationHelper(sink, outputLanguage, size, "angle_frm");
				140	writeMatrixPrecisionEmulationHelper(sink, outputLanguage, size, "angle_frl");
				141	}
				142	}
				143
				144	static void writeCompoundAssignmentPrecisionEmulation(
				145	TInfoSinkBase& sink, ShShaderOutput outputLanguage,
				146	const char lType, const char rType, const char opStr, const char opNameStr)
				147	{
				148	std::string lTypeStr = lType;
				149	std::string rTypeStr = rType;
				150	if (outputLanguage == SH_ESSL_OUTPUT)
				151	{
				152	std::stringstream lTypeStrStr;
				153	lTypeStrStr << "highp " << lType;
				154	lTypeStr = lTypeStrStr.str();
				155	std::stringstream rTypeStrStr;
				156	rTypeStrStr << "highp " << rType;
				157	rTypeStr = rTypeStrStr.str();
				158	}
				159
				160	// Note that y should be passed through angle_frm at the function call site,
				161	// but x can't be passed through angle_frm there since it is an inout parameter.
				162	// So only pass x and the result through angle_frm here.
				163	sink <<
				164	lTypeStr << " angle_compound_" << opNameStr << "_frm(inout " << lTypeStr << " x, in " << rTypeStr << " y) {\n"
				165	" x = angle_frm(angle_frm(x) " << opStr << " y);\n"
				166	" return x;\n"
				167	"}\n";
				168	sink <<
				169	lTypeStr << " angle_compound_" << opNameStr << "_frl(inout " << lTypeStr << " x, in " << rTypeStr << " y) {\n"
				170	" x = angle_frl(angle_frm(x) " << opStr << " y);\n"
				171	" return x;\n"
				172	"}\n";
				173	}
				174
				175	const char *getFloatTypeStr(const TType& type)
				176	{
				177	switch (type.getNominalSize())
				178	{
				179	case 1:
				180	return "float";
				181	case 2:
Alexis Hetu	07e57df	2015-06-16 16:55:52 -0400	[diff] [blame]	182	switch(type.getSecondarySize())
				183	{
				184	case 1:
				185	return "vec2";
				186	case 2:
				187	return "mat2";
				188	case 3:
				189	return "mat2x3";
				190	case 4:
				191	return "mat2x4";
				192	default:
				193	UNREACHABLE();
				194	return NULL;
				195	}
Olli Etuaho	853dc1a	2014-11-06 17:25:48 +0200	[diff] [blame]	196	case 3:
Alexis Hetu	07e57df	2015-06-16 16:55:52 -0400	[diff] [blame]	197	switch(type.getSecondarySize())
				198	{
				199	case 1:
				200	return "vec3";
				201	case 2:
				202	return "mat3x2";
				203	case 3:
				204	return "mat3";
				205	case 4:
				206	return "mat3x4";
				207	default:
				208	UNREACHABLE();
				209	return NULL;
				210	}
Olli Etuaho	853dc1a	2014-11-06 17:25:48 +0200	[diff] [blame]	211	case 4:
Alexis Hetu	07e57df	2015-06-16 16:55:52 -0400	[diff] [blame]	212	switch(type.getSecondarySize())
				213	{
				214	case 1:
				215	return "vec4";
				216	case 2:
				217	return "mat4x2";
				218	case 3:
				219	return "mat4x3";
				220	case 4:
				221	return "mat4";
				222	default:
				223	UNREACHABLE();
				224	return NULL;
				225	}
Olli Etuaho	853dc1a	2014-11-06 17:25:48 +0200	[diff] [blame]	226	default:
				227	UNREACHABLE();
				228	return NULL;
				229	}
				230	}
				231
				232	bool canRoundFloat(const TType &type)
				233	{
				234	return type.getBasicType() == EbtFloat && !type.isNonSquareMatrix() && !type.isArray() &&
				235	(type.getPrecision() == EbpLow \|\| type.getPrecision() == EbpMedium);
				236	}
				237
				238	TIntermAggregate createInternalFunctionCallNode(TString name, TIntermNode child)
				239	{
				240	TIntermAggregate *callNode = new TIntermAggregate();
				241	callNode->setOp(EOpInternalFunctionCall);
				242	callNode->setName(name);
				243	callNode->getSequence()->push_back(child);
				244	return callNode;
				245	}
				246
				247	TIntermAggregate createRoundingFunctionCallNode(TIntermTyped roundedChild)
				248	{
				249	TString roundFunctionName;
				250	if (roundedChild->getPrecision() == EbpMedium)
				251	roundFunctionName = "angle_frm";
				252	else
				253	roundFunctionName = "angle_frl";
				254	return createInternalFunctionCallNode(roundFunctionName, roundedChild);
				255	}
				256
				257	TIntermAggregate createCompoundAssignmentFunctionCallNode(TIntermTyped left, TIntermTyped right, const char opNameStr)
				258	{
				259	std::stringstream strstr;
				260	if (left->getPrecision() == EbpMedium)
				261	strstr << "angle_compound_" << opNameStr << "_frm";
				262	else
				263	strstr << "angle_compound_" << opNameStr << "_frl";
				264	TString functionName = strstr.str().c_str();
				265	TIntermAggregate *callNode = createInternalFunctionCallNode(functionName, left);
				266	callNode->getSequence()->push_back(right);
				267	return callNode;
				268	}
				269
Olli Etuaho	1be8870	2015-01-19 16:56:44 +0200	[diff] [blame]	270	bool parentUsesResult(TIntermNode* parent, TIntermNode* node)
				271	{
				272	if (!parent)
				273	{
				274	return false;
				275	}
				276
				277	TIntermAggregate *aggParent = parent->getAsAggregate();
				278	// If the parent's op is EOpSequence, the result is not assigned anywhere,
				279	// so rounding it is not needed. In particular, this can avoid a lot of
				280	// unnecessary rounding of unused return values of assignment.
				281	if (aggParent && aggParent->getOp() == EOpSequence)
				282	{
				283	return false;
				284	}
				285	if (aggParent && aggParent->getOp() == EOpComma && (aggParent->getSequence()->back() != node))
				286	{
				287	return false;
				288	}
				289	return true;
				290	}
				291
Olli Etuaho	853dc1a	2014-11-06 17:25:48 +0200	[diff] [blame]	292	} // namespace anonymous
				293
				294	EmulatePrecision::EmulatePrecision()
Olli Etuaho	3fc9337	2015-08-11 14:50:59 +0300	[diff] [blame^]	295	: TLValueTrackingTraverser(true, true, true), mDeclaringVariables(false)
Olli Etuaho	853dc1a	2014-11-06 17:25:48 +0200	[diff] [blame]	296	{}
				297
				298	void EmulatePrecision::visitSymbol(TIntermSymbol *node)
				299	{
Olli Etuaho	a26ad58	2015-08-04 13:51:47 +0300	[diff] [blame]	300	if (canRoundFloat(node->getType()) && !mDeclaringVariables && !isLValueRequiredHere())
Olli Etuaho	853dc1a	2014-11-06 17:25:48 +0200	[diff] [blame]	301	{
				302	TIntermNode *parent = getParentNode();
				303	TIntermNode *replacement = createRoundingFunctionCallNode(node);
				304	mReplacements.push_back(NodeUpdateEntry(parent, node, replacement, true));
				305	}
				306	}
				307
				308
				309	bool EmulatePrecision::visitBinary(Visit visit, TIntermBinary *node)
				310	{
				311	bool visitChildren = true;
				312
Olli Etuaho	853dc1a	2014-11-06 17:25:48 +0200	[diff] [blame]	313	TOperator op = node->getOp();
				314
				315	// RHS of initialize is not being declared.
				316	if (op == EOpInitialize && visit == InVisit)
				317	mDeclaringVariables = false;
				318
				319	if ((op == EOpIndexDirectStruct \|\| op == EOpVectorSwizzle) && visit == InVisit)
				320	visitChildren = false;
				321
				322	if (visit != PreVisit)
				323	return visitChildren;
				324
				325	const TType& type = node->getType();
				326	bool roundFloat = canRoundFloat(type);
				327
				328	if (roundFloat) {
				329	switch (op) {
				330	// Math operators that can result in a float may need to apply rounding to the return
				331	// value. Note that in the case of assignment, the rounding is applied to its return
				332	// value here, not the value being assigned.
				333	case EOpAssign:
				334	case EOpAdd:
				335	case EOpSub:
				336	case EOpMul:
				337	case EOpDiv:
				338	case EOpVectorTimesScalar:
				339	case EOpVectorTimesMatrix:
				340	case EOpMatrixTimesVector:
				341	case EOpMatrixTimesScalar:
				342	case EOpMatrixTimesMatrix:
				343	{
				344	TIntermNode *parent = getParentNode();
Olli Etuaho	1be8870	2015-01-19 16:56:44 +0200	[diff] [blame]	345	if (!parentUsesResult(parent, node))
				346	{
				347	break;
				348	}
Olli Etuaho	853dc1a	2014-11-06 17:25:48 +0200	[diff] [blame]	349	TIntermNode *replacement = createRoundingFunctionCallNode(node);
				350	mReplacements.push_back(NodeUpdateEntry(parent, node, replacement, true));
				351	break;
				352	}
				353
				354	// Compound assignment cases need to replace the operator with a function call.
				355	case EOpAddAssign:
				356	{
				357	mEmulateCompoundAdd.insert(TypePair(getFloatTypeStr(type), getFloatTypeStr(node->getRight()->getType())));
				358	TIntermNode *parent = getParentNode();
				359	TIntermNode *replacement = createCompoundAssignmentFunctionCallNode(node->getLeft(), node->getRight(), "add");
				360	mReplacements.push_back(NodeUpdateEntry(parent, node, replacement, false));
				361	break;
				362	}
				363	case EOpSubAssign:
				364	{
				365	mEmulateCompoundSub.insert(TypePair(getFloatTypeStr(type), getFloatTypeStr(node->getRight()->getType())));
				366	TIntermNode *parent = getParentNode();
				367	TIntermNode *replacement = createCompoundAssignmentFunctionCallNode(node->getLeft(), node->getRight(), "sub");
				368	mReplacements.push_back(NodeUpdateEntry(parent, node, replacement, false));
				369	break;
				370	}
				371	case EOpMulAssign:
				372	case EOpVectorTimesMatrixAssign:
				373	case EOpVectorTimesScalarAssign:
				374	case EOpMatrixTimesScalarAssign:
				375	case EOpMatrixTimesMatrixAssign:
				376	{
				377	mEmulateCompoundMul.insert(TypePair(getFloatTypeStr(type), getFloatTypeStr(node->getRight()->getType())));
				378	TIntermNode *parent = getParentNode();
				379	TIntermNode *replacement = createCompoundAssignmentFunctionCallNode(node->getLeft(), node->getRight(), "mul");
				380	mReplacements.push_back(NodeUpdateEntry(parent, node, replacement, false));
				381	break;
				382	}
				383	case EOpDivAssign:
				384	{
				385	mEmulateCompoundDiv.insert(TypePair(getFloatTypeStr(type), getFloatTypeStr(node->getRight()->getType())));
				386	TIntermNode *parent = getParentNode();
				387	TIntermNode *replacement = createCompoundAssignmentFunctionCallNode(node->getLeft(), node->getRight(), "div");
				388	mReplacements.push_back(NodeUpdateEntry(parent, node, replacement, false));
				389	break;
				390	}
				391	default:
				392	// The rest of the binary operations should not need precision emulation.
				393	break;
				394	}
				395	}
				396	return visitChildren;
				397	}
				398
				399	bool EmulatePrecision::visitAggregate(Visit visit, TIntermAggregate *node)
				400	{
				401	bool visitChildren = true;
				402	switch (node->getOp())
				403	{
				404	case EOpSequence:
				405	case EOpConstructStruct:
Olli Etuaho	853dc1a	2014-11-06 17:25:48 +0200	[diff] [blame]	406	case EOpFunction:
Olli Etuaho	853dc1a	2014-11-06 17:25:48 +0200	[diff] [blame]	407	break;
				408	case EOpPrototype:
Olli Etuaho	853dc1a	2014-11-06 17:25:48 +0200	[diff] [blame]	409	visitChildren = false;
				410	break;
				411	case EOpParameters:
				412	visitChildren = false;
				413	break;
				414	case EOpInvariantDeclaration:
				415	visitChildren = false;
				416	break;
				417	case EOpDeclaration:
				418	// Variable declaration.
				419	if (visit == PreVisit)
				420	{
				421	mDeclaringVariables = true;
				422	}
				423	else if (visit == InVisit)
				424	{
				425	mDeclaringVariables = true;
				426	}
				427	else
				428	{
				429	mDeclaringVariables = false;
				430	}
				431	break;
				432	case EOpFunctionCall:
				433	{
				434	// Function call.
Olli Etuaho	853dc1a	2014-11-06 17:25:48 +0200	[diff] [blame]	435	if (visit == PreVisit)
				436	{
Olli Etuaho	1be8870	2015-01-19 16:56:44 +0200	[diff] [blame]	437	// User-defined function return values are not rounded, this relies on that
				438	// calculations producing the value were rounded.
				439	TIntermNode *parent = getParentNode();
Olli Etuaho	a26ad58	2015-08-04 13:51:47 +0300	[diff] [blame]	440	if (canRoundFloat(node->getType()) && !isInFunctionMap(node) &&
				441	parentUsesResult(parent, node))
Olli Etuaho	1be8870	2015-01-19 16:56:44 +0200	[diff] [blame]	442	{
Olli Etuaho	853dc1a	2014-11-06 17:25:48 +0200	[diff] [blame]	443	TIntermNode *replacement = createRoundingFunctionCallNode(node);
				444	mReplacements.push_back(NodeUpdateEntry(parent, node, replacement, true));
				445	}
Olli Etuaho	853dc1a	2014-11-06 17:25:48 +0200	[diff] [blame]	446	}
				447	break;
				448	}
				449	default:
Olli Etuaho	1be8870	2015-01-19 16:56:44 +0200	[diff] [blame]	450	TIntermNode *parent = getParentNode();
				451	if (canRoundFloat(node->getType()) && visit == PreVisit && parentUsesResult(parent, node))
Olli Etuaho	853dc1a	2014-11-06 17:25:48 +0200	[diff] [blame]	452	{
Olli Etuaho	853dc1a	2014-11-06 17:25:48 +0200	[diff] [blame]	453	TIntermNode *replacement = createRoundingFunctionCallNode(node);
				454	mReplacements.push_back(NodeUpdateEntry(parent, node, replacement, true));
				455	}
				456	break;
				457	}
				458	return visitChildren;
				459	}
				460
				461	bool EmulatePrecision::visitUnary(Visit visit, TIntermUnary *node)
				462	{
				463	switch (node->getOp())
				464	{
				465	case EOpNegative:
				466	case EOpVectorLogicalNot:
				467	case EOpLogicalNot:
Olli Etuaho	853dc1a	2014-11-06 17:25:48 +0200	[diff] [blame]	468	case EOpPostIncrement:
				469	case EOpPostDecrement:
				470	case EOpPreIncrement:
				471	case EOpPreDecrement:
Olli Etuaho	853dc1a	2014-11-06 17:25:48 +0200	[diff] [blame]	472	break;
				473	default:
				474	if (canRoundFloat(node->getType()) && visit == PreVisit)
				475	{
				476	TIntermNode *parent = getParentNode();
				477	TIntermNode *replacement = createRoundingFunctionCallNode(node);
				478	mReplacements.push_back(NodeUpdateEntry(parent, node, replacement, true));
				479	}
				480	break;
				481	}
				482
				483	return true;
				484	}
				485
				486	void EmulatePrecision::writeEmulationHelpers(TInfoSinkBase& sink, ShShaderOutput outputLanguage)
				487	{
				488	// Other languages not yet supported
Zhenyao Mo	05b6b7f	2015-03-02 17:08:09 -0800	[diff] [blame]	489	ASSERT(outputLanguage == SH_GLSL_COMPATIBILITY_OUTPUT \|\|
Qingqing Deng	ad0d079	2015-04-08 14:25:06 -0700	[diff] [blame]	490	IsGLSL130OrNewer(outputLanguage) \|\|
Zhenyao Mo	05b6b7f	2015-03-02 17:08:09 -0800	[diff] [blame]	491	outputLanguage == SH_ESSL_OUTPUT);
Olli Etuaho	853dc1a	2014-11-06 17:25:48 +0200	[diff] [blame]	492	writeCommonPrecisionEmulationHelpers(sink, outputLanguage);
				493
				494	EmulationSet::const_iterator it;
				495	for (it = mEmulateCompoundAdd.begin(); it != mEmulateCompoundAdd.end(); it++)
				496	writeCompoundAssignmentPrecisionEmulation(sink, outputLanguage, it->lType, it->rType, "+", "add");
				497	for (it = mEmulateCompoundSub.begin(); it != mEmulateCompoundSub.end(); it++)
				498	writeCompoundAssignmentPrecisionEmulation(sink, outputLanguage, it->lType, it->rType, "-", "sub");
				499	for (it = mEmulateCompoundDiv.begin(); it != mEmulateCompoundDiv.end(); it++)
				500	writeCompoundAssignmentPrecisionEmulation(sink, outputLanguage, it->lType, it->rType, "/", "div");
				501	for (it = mEmulateCompoundMul.begin(); it != mEmulateCompoundMul.end(); it++)
				502	writeCompoundAssignmentPrecisionEmulation(sink, outputLanguage, it->lType, it->rType, "*", "mul");
				503	}
				504