nir_lower_drsq = (1 << 2),
nir_lower_dtrunc = (1 << 3),
nir_lower_dfloor = (1 << 4),
+ nir_lower_dceil = (1 << 5),
} nir_lower_doubles_options;
/* Entry point taking the shader to process and a bitmask of
 * nir_lower_doubles_options flags (each flag is a distinct bit, so several
 * may be OR'ed together).
 * NOTE(review): presumably only the double-precision operations whose flag
 * is set in `options` get lowered -- confirm against the implementation.
 */
void nir_lower_doubles(nir_shader *shader, nir_lower_doubles_options options);
nir_fsub(b, tr, nir_imm_double(b, 1.0)));
}
+/* Builds ceil(src) for doubles out of ftrunc:
+ *
+ *    src < 0             ->  trunc(src)
+ *    src == trunc(src)   ->  trunc(src)      (already integral)
+ *    anything else       ->  trunc(src) + 1
+ *
+ * Returns the SSA value holding the selected result.
+ */
+static nir_ssa_def *
+lower_ceil(nir_builder *b, nir_ssa_def *src)
+{
+   nir_ssa_def *truncated = nir_ftrunc(b, src);
+
+   /* The two cases in which the truncated value is already the answer. */
+   nir_ssa_def *zero = nir_imm_double(b, 0.0);
+   nir_ssa_def *is_negative = nir_flt(b, src, zero);
+   nir_ssa_def *is_integral = nir_feq(b, src, truncated);
+   nir_ssa_def *keep_truncated = nir_ior(b, is_negative, is_integral);
+
+   /* Positive input with a fractional part: step up to the next integer. */
+   nir_ssa_def *one = nir_imm_double(b, 1.0);
+   nir_ssa_def *stepped_up = nir_fadd(b, truncated, one);
+
+   return nir_bcsel(b, keep_truncated, truncated, stepped_up);
+}
+
static void
lower_doubles_instr(nir_alu_instr *instr, nir_lower_doubles_options options)
{
return;
break;
+ case nir_op_fceil:
+ if (!(options & nir_lower_dceil))
+ return;
+ break;
+
default:
return;
}
case nir_op_ffloor:
result = lower_floor(&bld, src);
break;
+ case nir_op_fceil:
+ result = lower_ceil(&bld, src);
+ break;
default:
unreachable("unhandled opcode");
}