q.c

/* Project: Q-Number (Q16.16, signed) library
 * Author:  Richard James Howe
 * License: The Unlicense
 * Email:   howe.r.j.89@gmail.com
 * Repo:    <https://github.com/q> 
 *
 *
 * A Q32.32 version would be useful. 
 *
 * The following should be changed/done for this library:
 *
 * - Moving towards a header-only model.
 * - Removal of dependencies such as 'isalpha', 'tolower'
 *   as they are locale dependent.
 * - Make components optional (filters, expression parser, ...)
 * - Make hyperbolic arc sin/cos/tan functions.
 * - Fix bugs / inaccuracies in CORDIC code.
 * - Improve accuracy of all the functions and quantify error and
 *   their limits. 
 *
 * BUG: Enter: 2.71791, get 2.0625, 2.7179 works fine. (Need to
 * limit decimal places).
 */

#include "q.h"
#include <assert.h>
#include <ctype.h>
#include <inttypes.h>
#include <limits.h>
#include <stdarg.h> /* for expression evaluator error handling */
#include <stdio.h>  /* vsnprintf, for expression evaluator */
#include <string.h>

/* Helper macros private to this translation unit. */
#define UNUSED(X)               ((void)(X))
/* Collapse any non-zero value to exactly 1. */
#define BOOLIFY(X)              (!!(X))
/* Compile-time check: a true condition yields a negative array size, which
 * fails to compile. */
#define BUILD_BUG_ON(condition) ((void)sizeof(char[1 - 2*!!(condition)]))
/* Threshold used by the string parser when checking the integer part. */
#define MULTIPLIER              (INT16_MAX)
/* Bounds checked by qsat() before the overflow handler is invoked. */
#define DMIN                    (INT32_MIN)
#define DMAX                    (INT32_MAX)
/* N.B. both macros evaluate their arguments more than once. */
#define MIN(X, Y)               ((X) < (Y) ? (X) : (Y))
#define MAX(X, Y)               ((X) < (Y) ? (Y) : (X))

#ifndef CONFIG_Q_HIDE_FUNCS /* 1 = hide hidden (testing) functions, 0 = enable them */
#define CONFIG_Q_HIDE_FUNCS (0)
#endif

typedef  int16_t hd_t; /* half Q width,      signed */
typedef uint64_t lu_t; /* double Q width,  unsigned */

/* Read-only description of the number format plus a handful of constants
 * pre-computed in that format. */
const qinfo_t qinfo = {
	.whole      = QBITS,
	.fractional = QBITS,
	.zero = (u_t)0uL << QBITS,
	.bit  = 1uL, /* smallest representable increment */
	.one  = (u_t)1uL << QBITS,
	.min  = (u_t)(QHIGH << QBITS),
	.max  = (u_t)((QHIGH << QBITS) - 1uL),

	/* The trailing comments give the hexadecimal expansion of each constant */
	.pi    = QPI, /* 3.243F6 A8885 A308D 31319 8A2E0... */
	.e     = QMK(0x2, 0xB7E1, 16), /* 2.B7E1 5162 8A... */
	.sqrt2 = QMK(0x1, 0x6A09, 16), /* 1.6A09 E667 F3... */
	.sqrt3 = QMK(0x1, 0xBB67, 16), /* 1.BB67 AE85 84... */
	.ln2   = QMK(0x0, 0xB172, 16), /* 0.B172 17F7 D1... */
	.ln10  = QMK(0x2, 0x4D76, 16), /* 2.4D76 3776 AA... */

	.version = QVERSION,
};

/* Mutable, library-wide settings: 'bound' is called by qsat() on overflow,
 * 'dp' and 'base' are the defaults used by qsprint()/qnconv() and friends. */
qconf_t qconf = { /* Global Configuration Options */
	.bound = qbound_saturate,
	.dp    = 4,
	.base  = 10,
};

/********* Basic Library Routines ********************************************/


/* Debug-build check of the implication "x => y": the assertion fires only
 * when 'x' is non-zero while 'y' is zero. */
static inline void implies(const int x, const int y) {
	assert(y || !x);
}

/* Debug-build check that 'x' and 'y' are either both zero or both non-zero
 * (mutual implication). */
static inline void mutual(const int x, const int y) {
	assert((!x) == (!y));
}

/* Debug-build check that exactly one of 'x' and 'y' is non-zero. */
static inline void exclusive(const int x, const int y) {
	assert((!x) != (!y));
}

/* Compile-time sanity checks on the integer types this file is built on.
 * Each BUILD_BUG_ON() refuses to compile when its condition is true; the
 * function generates no run-time work. */
static inline void static_assertions(void) {
	/* bytes must be octets */
	BUILD_BUG_ON(8 != CHAR_BIT);
	/* a Q number is QBITS whole bits plus QBITS fractional bits */
	BUILD_BUG_ON((QBITS * 2) != (sizeof(q_t) * CHAR_BIT));
	/* signed and unsigned companions must have the same size */
	BUILD_BUG_ON(sizeof(u_t)  != sizeof(q_t));
	BUILD_BUG_ON(sizeof(d_t)  != sizeof(u_t));
	BUILD_BUG_ON(sizeof(ld_t) != sizeof(lu_t));
	/* "half" and "double" width types must be exactly that */
	BUILD_BUG_ON((sizeof(hd_t) * 2) != sizeof(d_t));
	BUILD_BUG_ON((sizeof(u_t)  * 2) != sizeof(lu_t));
}

/* Default overflow handler: clamp an out-of-range double-width result to the
 * nearest representable bound. Must only be called with a value that is
 * actually out of range (asserted). */
q_t qbound_saturate(const ld_t s) {
	assert(s < DMIN || s > DMAX);
	return s > DMAX ? DMAX : DMIN;
}

/* Alternative overflow handler: wrap an out-of-range double-width result
 * around to the opposite end of the range. Must only be called with a value
 * that is actually out of range (asserted). */
q_t qbound_wrap(const ld_t s) {
	assert(s < DMIN || s > DMAX);
	if (s <= DMAX) /* underflow: count back down from the top */
		return DMAX - ((-s) % DMAX);
	return DMIN + (s % DMAX); /* overflow: count up from the bottom */
}

static inline q_t qsat(const ld_t s) {
	static_assertions();
	if (s > DMAX || s < DMIN) return qconf.bound(s);
	return s;
}

/* Arithmetic (sign-preserving) right shift of 'v' by 'p' bits, built from
 * unsigned operations only. 'p' must be less than the bit width of d_t. */
d_t arshift(const d_t v, const unsigned p) {
	const u_t bits    = v;
	const u_t shifted = bits >> p;
	if (v < 0l) {
		/* set the vacated high bits (and the shifted sign bit) */
		const u_t sign_fill = ((u_t)(-1l)) << ((sizeof(v) * CHAR_BIT) - p - 1);
		return sign_fill | shifted;
	}
	return shifted;
}

static inline d_t divn(const d_t v, const unsigned p) {
	/* return v / (1l << p); */
	const u_t shifted = ((u_t)v) >> p;
	if (qispositive(v))
		return shifted;
	const u_t leading = ((u_t)(-1l)) << ((sizeof(v)*CHAR_BIT) - p - 1);
	return leading | shifted;
}

/* These really all should be moved the header for efficiency reasons */
static inline u_t qhigh(const q_t q) { return ((u_t)q) >> QBITS; }
static inline u_t qlow(const q_t q)  { return ((u_t)q) & QMASK; }
static inline q_t qcons(const u_t hi, const u_t lo) { return (hi << QBITS) | (lo & QMASK); }

int qtoi(const q_t toi)                 { return ((lu_t)((ld_t)toi)) >> QBITS; }
q_t qint(const int toq)                 { return ((u_t)((d_t)toq)) << QBITS; }
signed char qtoc(const q_t q)           { return qtoi(q); }
q_t qchar(signed char c)                { return qint(c); }
short qtoh(const q_t q)                 { return qtoi(q); }
q_t qshort(short s)                     { return qint(s); }
long qtol(const q_t q)                  { return qtoi(q); }
q_t qlong(long l)                       { return qint(l); }
long long qtoll(const q_t q)            { return qtoi(q); }
q_t qvlong(long long ll)                { return qint(ll); }

/* Predicates: each returns QINT(1) for true and QINT(0) for false. */

/* Is the sign bit set? */
q_t qisnegative(const q_t a) {
	return QINT((qhigh(a) & QHIGH) != 0);
}

/* Is the sign bit clear? (zero counts as positive) */
q_t qispositive(const q_t a) {
	return QINT((qhigh(a) & QHIGH) == 0);
}

/* Is the fractional part zero? */
q_t qisinteger(const q_t a) {
	return QINT(qlow(a) == 0);
}

/* Is 'a' an integer whose lowest whole bit is set? */
q_t qisodd(const q_t a) {
	const int odd = qisinteger(a) && (qhigh(a) & 1);
	return QINT(odd);
}

/* Is 'a' an integer whose lowest whole bit is clear? */
q_t qiseven(const q_t a) {
	const int even = qisinteger(a) && !(qhigh(a) & 1);
	return QINT(even);
}

q_t qless(const q_t a, const q_t b) {
	const int r = a < b;
	return QINT(r);
}

q_t qeqless(const q_t a, const q_t b) {
	const int r = a <= b;
	return QINT(r);
}

q_t qmore(const q_t a, const q_t b) {
	const int r = a > b;
	return QINT(r);
}

q_t qeqmore(const q_t a, const q_t b) {
	const int r = a >= b;
	return QINT(r);
}

q_t qequal(const q_t a, const q_t b) {
	const int r = a == b;
	return QINT(r);
}

q_t qunequal(const q_t a, const q_t b) {
	const int r = a != b;
	return QINT(r);
}

q_t qnegate(const q_t a)                { return (~(u_t)a) + 1ULL; }
q_t qmin(const q_t a, const q_t b)      { return qless(a, b) ? a : b; }
q_t qmax(const q_t a, const q_t b)      { return qmore(a, b) ? a : b; }
q_t qabs(const q_t a)                   { return qisnegative(a) ? qnegate(a) : a; }
q_t qadd(const q_t a, const q_t b)      { return qsat((ld_t)a + (ld_t)b); }
q_t qsub(const q_t a, const q_t b)      { return qsat((ld_t)a - (ld_t)b); }
q_t qcopysign(const q_t a, const q_t b) { return qisnegative(b) ? qnegate(qabs(a)) : qabs(a); }
q_t qand(const q_t a, const q_t b)      { return a & b; }
q_t qxor(const q_t a, const q_t b)      { return a ^ b; }
q_t qor(const q_t a, const q_t b)       { return a | b; }
q_t qinvert(const q_t a)                { return ~a; }
q_t qnot(const q_t a)                   { return QINT(!a); }
q_t qlogical(const q_t a)               { return QINT(BOOLIFY(a)); }

/* Shift operators. In all four the shift count 'b' is itself a Q number and
 * is converted to an integer with qtoi() first; any fractional part of the
 * count is ignored. Counts that are negative or not smaller than the width
 * of the shifted type are not checked and must not be used. */

/* Logical right shift of the raw bits. */
q_t qlrs(const q_t a, const q_t b) {
	/* assert low bits == 0? */
	return (u_t)a >> (u_t)qtoi(b);
}

/* Logical left shift of the raw bits; bits shifted out are lost.
 * The count is converted with qtoi() like the other shifts; shifting by the
 * raw Q value would use a count of 65536 for QINT(1). */
q_t qlls(const q_t a, const q_t b) {
	return (u_t)a << (u_t)qtoi(b);
}

/* Arithmetic (sign-preserving) right shift. */
q_t qars(const q_t a, const q_t b) {
	return arshift(a, qtoi(b));
}

/* Arithmetic left shift: performed in double width and then narrowed with
 * qsat(), so overflow goes through the configured handler. */
q_t qals(const q_t a, const q_t b) {
	return qsat((lu_t)a << (u_t)qtoi(b));
}
/* -1 for negative values, +1 otherwise (including zero). */
q_t qsign(const q_t a) {
	if (qisnegative(a))
		return -QINT(1);
	return QINT(1);
}

/* -1, 0 or +1 according to the sign of 'a'. */
q_t qsignum(const q_t a) {
	if (!a)
		return QINT(0);
	return qsign(a);
}

/* Are 'a' and 'b' closer together than 'epsilon'?
 *
 * 'epsilon' must not be negative (asserted). Returns QINT(1) when
 * |a - b| < epsilon and QINT(0) otherwise.
 *
 * qless() already produces a Q-format boolean, so its result is returned
 * directly; converting it a second time with QINT() would shift the "true"
 * bit out of the number and always report false. */
q_t qapproxequal(const q_t a, const q_t b, const q_t epsilon) {
	assert(qeqmore(epsilon, qint(0)));
	const q_t distance = qabs(qsub(a, b));
	return qless(distance, epsilon);
}

/* Logical inverse of qapproxequal(): QINT(1) when that function reports
 * false for the same arguments, QINT(0) otherwise. */
q_t qapproxunequal(const q_t a, const q_t b, const q_t epsilon) {
	if (qapproxequal(a, b, epsilon))
		return QINT(0);
	return QINT(1);
}

/* Is 'v' inside the closed interval spanned by 'b1' and 'b2'? The bounds
 * may be given in either order. Returns QINT(1) for true and QINT(0) for
 * false on every path, like the other predicates in this file. */
q_t qwithin(q_t v, q_t b1, q_t b2) {
	const q_t hi = qmax(b1, b2);
	const q_t lo = qmin(b1, b2);
	if (qequal(v, b1) || qequal(v, b2)) /* sitting exactly on a bound */
		return QINT(1);
	return qless(v, hi) && qmore(v, lo) ? QINT(1) : QINT(0);
}

/* Is 'v' within 'allowance' of 'expected'? Both bounds are formed with the
 * saturating qadd()/qsub() and the test itself is done by qwithin(). */
q_t qwithin_interval(q_t v, q_t expected, q_t allowance) {
	const q_t upper = qadd(expected, allowance);
	const q_t lower = qsub(expected, allowance);
	return qwithin(v, upper, lower);
}

/* Clear the fractional bits of 'q', leaving the whole part untouched. */
q_t qfloor(const q_t q) {
	const q_t whole_only = q & ~QMASK;
	return whole_only;
}

/* Round up to a whole number: anything with a fractional part is bumped by
 * one (saturating) before the fractional bits are cleared. */
q_t qceil(q_t q) {
	if (!qisinteger(q))
		q = qadd(q, QINT(1));
	return ((u_t)q) & (QMASK << QBITS);
}

/* Round towards zero: negative values with a fractional part are bumped by
 * one before the fractional bits are cleared. */
q_t qtrunc(q_t q) {
	if (qisnegative(q) && qlow(q))
		q = qadd(q, QINT(1));
	return ((u_t)q) & (QMASK << QBITS);
}

/* Round to the nearest whole number. The work is done on the magnitude: if
 * the top fractional bit (one half) is set the magnitude is bumped by one,
 * then the fraction is cleared and the original sign is restored. */
q_t qround(q_t q) {
	const int negative = qisnegative(q);
	q_t magnitude = qabs(q);
	if (qlow(magnitude) & QHIGH)
		magnitude = qadd(magnitude, QINT(1));
	magnitude = ((u_t)magnitude) & (QMASK << QBITS);
	if (negative)
		return qnegate(magnitude);
	return magnitude;
}

int qpack(const q_t *q, char *buffer, const size_t length) {
	assert(buffer);
	if (length < sizeof(*q))
		return -1;
	q_t qn = *q;
	uint8_t *b = (uint8_t*)buffer;
	for (size_t i = 0; i < sizeof(qn); i++) {
		b[i] = qn;
		qn = (u_t)qn >> CHAR_BIT;
	}
	return sizeof(qn);
}

/* Inverse of qpack(): rebuild a Q number from bytes stored least
 * significant byte first. Returns the number of bytes consumed, or -1 when
 * 'length' is too small to contain a Q number. */
int qunpack(q_t *q, const char *buffer, const size_t length) {
	assert(q);
	assert(buffer);
	if (length < sizeof(*q))
		return -1;
	const uint8_t *in = (const uint8_t*)buffer;
	u_t bits = 0;
	/* walk from the most significant byte down so it ends up on top */
	for (size_t i = sizeof(*q); i > 0; i--)
		bits = (bits << CHAR_BIT) | in[i - 1];
	*q = bits;
	return sizeof(*q);
}

static inline ld_t multiply(const q_t a, const q_t b) {
	const ld_t dd = ((ld_t)a * (ld_t)b) + (lu_t)QHIGH;
	/* N.B. portable version of "dd >> QBITS", for double width signed values */
	return dd < 0 ? (-1ull << (2 * QBITS)) | ((lu_t)dd >> QBITS) : ((lu_t)dd) >> QBITS;
}

q_t qmul(const q_t a, const q_t b) {
	return qsat(multiply(a, b));
}

q_t qfma(const q_t a, const q_t b, const q_t c) {
	return qsat(multiply(a, b) + (ld_t)c);
}

/* Divide 'a' by 'b', rounding to nearest.
 *
 * The dividend is pre-scaled by QBITS in double width so the quotient comes
 * out in Q format, and half of the divisor (with the sign of the quotient)
 * is added to the dividend before dividing to get rounding.
 *
 * 'b' must not be zero (asserted). Quotients that do not fit are passed to
 * the overflow handler through qsat(), as qadd(), qsub() and qmul() do,
 * rather than being silently truncated. */
q_t qdiv(const q_t a, const q_t b) {
	assert(b);
	const ld_t dd = ((ld_t)a) << QBITS;
	ld_t bd2 = divn(b, 1);
	if (!((dd >= 0 && b > 0) || (dd < 0 && b < 0)))
		bd2 = -bd2; /* quotient is negative: round the other way */
	return qsat((dd + bd2) / b);
}

/* Remainder of a / b where the quotient is rounded towards zero. */
q_t qrem(const q_t a, const q_t b) {
	const q_t quotient = qtrunc(qdiv(a, b));
	return qsub(a, qmul(quotient, b));
}

/* Remainder of a / b where the quotient has its fractional bits cleared
 * with qfloor(). */
q_t qmod(q_t a, q_t b) {
	const q_t quotient = qfloor(qdiv(a, b));
	return qsub(a, qmul(quotient, b));
}

/* Map a digit value in the range 0..35 to its character: '0'-'9' followed
 * by upper case 'A'-'Z'. Values of 36 and above are rejected by assertion. */
static char itoch(const unsigned ch) {
	assert(ch < 36);
	return ch > 9 ? ch - 10 + 'A' : ch + '0';
}

/* Exchange the two characters pointed to; neither pointer may be NULL. */
static inline void swap(char *a, char *b) {
	assert(a);
	assert(b);
	const char held = *b;
	*b = *a;
	*a = held;
}

/* Reverse the first 'length' characters of 's' in place. */
static void reverse(char *s, const size_t length) {
	assert(s);
	if (length < 2)
		return;
	/* walk inwards from both ends until the indices meet */
	for (size_t front = 0, back = length - 1; front < back; front++, back--)
		swap(&s[front], &s[back]);
}

/* Write the unsigned integer 'p' into 's' as digits in 'base' (2 to 36).
 * No terminator is written. Returns the number of characters produced, or
 * -1 if 'length' is below two or the digits do not fit in 'length'
 * characters. */
static int uprint(u_t p, char *s, const size_t length, const d_t base) {
	assert(s);
	assert(base >= 2 && base <= 36);
	if (length < 2)
		return -1;
	size_t used = 0;
	/* digits come out least significant first */
	for (;;) {
		const unsigned digit = p % base;
		p /= base;
		s[used++] = itoch(digit);
		if (!p || used >= length)
			break;
	}
	if (p) /* stopped because the buffer filled up, not because we finished */
		return -1;
	reverse(s, used);
	return used;
}

/* <https://codereview.stackexchange.com/questions/109212> */
/* Format 'p' into 's' as text in 'base' (2 to 36).
 *
 * 'length' is the size of 's'; the whole buffer is zeroed first so a
 * successful result is always NUL terminated. 'idp' limits the number of
 * fractional digits; a negative 'idp' means "as many as needed", which is
 * still capped by the size of the internal digit buffer so that fractions
 * which never terminate in the chosen base cannot overrun it. A '.' is
 * always emitted, even when no fractional digits follow.
 *
 * Returns the number of characters written excluding any leading '-', or -1
 * if the buffer is too small. */
int qsprintbdp(q_t p, char *s, size_t length, const u_t base, const d_t idp) {
	assert(s);
	assert(base >= 2 && base <= 36);
	const int negative = BOOLIFY(qisnegative(p));
	if (negative)
		p = qnegate(p);
	const d_t hi = qhigh(p);
	char frac[QBITS + 2] = { '.', };
	memset(s, 0, length);
	/* Room is needed for the sign plus at least one digit; checking before
	 * anything is written also stops "length - (1 + negative)" below from
	 * wrapping around to a huge value. */
	if (length < (size_t)negative + 2)
		return -1;
	u_t lo = qlow(p);
	size_t i = 1;
	for (i = 1; lo && i < sizeof(frac); i++) {
		if (idp >= 0 && (int)i > idp)
			break;
		lo *= base;
		frac[i] = itoch(lo >> QBITS); /* digit carried into the whole part */
		lo &= QMASK;
	}
	if (negative)
		s[0] = '-';
	const int hisz = uprint(hi, s + negative, length - (1 + negative), base);
	if (hisz < 0 || ((size_t)hisz + i + negative + 1) > length)
		return -1;
	memcpy(s + hisz + negative, frac, i);
	return i + hisz;
}

/* Format 'p' in the given 'base', limiting the fraction to the globally
 * configured number of places 'qconf.dp'. */
int qsprintb(q_t p, char *s, size_t length, const u_t base) {
	const d_t places = qconf.dp;
	return qsprintbdp(p, s, length, base, places);
}

/* Format 'p' using the globally configured base 'qconf.base'. */
int qsprint(const q_t p, char *s, const size_t length) {
	const u_t base = qconf.base;
	return qsprintb(p, s, length, base);
}

/* Convert one character to its digit value in the given 'radix'.
 *
 * '0'-'9' map to 0..9 and letters of either case map to 10..35. Returns the
 * digit value, or -1 if the character is not a digit or its value is not
 * below 'radix'.
 *
 * Both letter cases are handled explicitly rather than through tolower(),
 * so the result does not depend on the current locale. */
static inline int extract(unsigned char c, const int radix) {
	int digit = -1;
	if (c >= '0' && c <= '9')
		digit = c - '0';
	else if (c >= 'a' && c <= 'z')
		digit = c - 'a' + 10;
	else if (c >= 'A' && c <= 'Z')
		digit = c - 'A' + 10;
	if (digit >= 0 && digit < radix)
		return digit;
	return -1;
}

/* Build a Q number from a signed whole part and an unsigned fractional
 * field. For a negative 'integer' the number is assembled from its
 * magnitude and the whole result is then negated. */
static inline q_t qmk(d_t integer, u_t fractional) {
	if (integer >= 0)
		return qcons(integer, fractional);
	return qnegate(qcons(-integer, fractional));
}

/* Count how many times 'num' can be divided by 'base' before the quotient
 * reaches zero, not counting the division that produces zero. 'num' must be
 * positive and 'base' in the range 2 to 36 (asserted). */
static inline u_t integer_logarithm(u_t num, const u_t base) {
	assert(num > 0 && base >= 2 && base <= 36);
	u_t count = 0;
	while (num /= base)
		count++;
	return count;
}

/* Parse at most 'length' characters of 's' as a number in 'base' (2 to 36)
 * of the form "[-]digits[.digits]" and store the result in '*q'.
 *
 * 'idp' caps how many fractional digits are used; digits beyond the cap (or
 * beyond what the fractional field can resolve in this base) are checked
 * for validity but otherwise ignored.
 *
 * Returns 0 on success, otherwise a negative value:
 *   -1  nothing to parse (empty input or a lone '-')
 *   -2  the integer part is followed by something other than '.'
 *   -3  invalid character in the fractional part
 *   -4  internal scaling factor would overflow
 *   -5  internal scaling factor is zero
 *   -6  integer part out of range; '*q' is set to qinfo.min or qinfo.max
 * '*q' is zero for every failure except -6. */
int qnconvbdp(q_t *q, const char *s, size_t length, const d_t base, const u_t idp) {
	assert(q);
	assert(s);
	assert(base >= 2 && base <= 36);
	*q = QINT(0);
	if (length < 1)
		return -1;
	d_t hi = 0, lo = 0, places = 1, negative = 0, overflow = 0;
	size_t sidx = 0;

	if (s[sidx] == '-') {
		if (length < 2)
			return -1;
		negative = 1;
		sidx++;
	}

	/* Integer part. The range check is made on the value *after* each
	 * digit is added so the final digit is covered as well. One more than
	 * MULTIPLIER is tolerated here as that magnitude is valid for the most
	 * negative number; it is re-examined once the fraction is known. */
	for (; sidx < length && s[sidx]; sidx++) {
		const d_t e = extract(s[sidx], base);
		if (e < 0)
			break;
		if (overflow) /* keep consuming digits, do not accumulate */
			continue;
		const ld_t next = ((ld_t)hi * base) + e;
		if (next > ((ld_t)MULTIPLIER + 1))
			overflow = 1;
		else
			hi = next;
	}

	if (sidx < length && s[sidx]) { /* more input: must be a fraction */
		if (s[sidx] != '.')
			return -2;
		sidx++;

		const u_t ilog = integer_logarithm(0x10000, base);
		const u_t max = MIN(idp, ilog); /* Calculate maximum decimal places given base */

		for (u_t dp = 0; sidx < length && s[sidx]; sidx++, dp++) {
			const int ch = extract(s[sidx], base);
			if (ch < 0)
				return -3;
			if (dp < max) { /* past 'max' digits are validated but not used */
				/* We could get more accuracy by looking at one digit
				 * past the maximum digits allowed and rounding if
				 * that digit exists in the input. */
				lo = (lo * base) + ch;
				if (places >= (DMAX / base))
					return -4;
				places *= base;
			}
			assert((dp + 1) > dp);
		}
		if (!places)
			return -5;
		/* Scale digits/places into the fractional field. This is done in
		 * double width: the shifted digits do not always fit in a signed
		 * single width value. */
		lo = (d_t)((((lu_t)lo) << QBITS) / (lu_t)places);
	}

	/* A whole part of MULTIPLIER + 1 only exists as the most negative
	 * number, which has no fractional part. */
	if (hi > MULTIPLIER && !(negative && lo == 0))
		overflow = 1;

	if (overflow) {
		*q = negative ? qinfo.min : qinfo.max;
		return -6;
	}
	const q_t nq = qmk(hi, lo);
	*q = negative ? qnegate(nq) : nq;
	return 0;
}

/* Convenience front ends for qnconvbdp(); each fills in the missing
 * arguments and passes the return value through unchanged. */

/* Length-limited parse in 'base', using 'qconf.dp' as the digit limit. */
int qnconvb(q_t *q, const char *s, size_t length, const d_t base) {
	const u_t places = qconf.dp;
	return qnconvbdp(q, s, length, base, places);
}

/* Length-limited parse in the configured base 'qconf.base'. */
int qnconv(q_t *q, const char *s, size_t length) {
	const d_t base = qconf.base;
	return qnconvb(q, s, length, base);
}

/* Parse a NUL terminated string in the configured base. */
int qconv(q_t *q, const char * const s) {
	assert(s);
	const size_t length = strlen(s);
	return qnconv(q, s, length);
}

/* Parse a NUL terminated string in the given 'base'. */
int qconvb(q_t *q, const char * const s, const d_t base) {
	assert(s);
	const size_t length = strlen(s);
	return qnconvb(q, s, length, base);
}

/* Which variable cordic() uses to pick the direction of each step: 'z' in
 * rotation mode, 'y' in vectoring mode. */
typedef enum {
	CORDIC_MODE_VECTOR_E/* = 'VECT'*/,
	CORDIC_MODE_ROTATE_E/* = 'ROT'*/,
} cordic_mode_e;

/* Coordinate system cordic() works in; it selects the lookup table and the
 * way 'x' is updated. */
typedef enum {
	CORDIC_COORD_HYPERBOLIC_E = -1,
	CORDIC_COORD_LINEAR_E     =  0,
	CORDIC_COORD_CIRCULAR_E   =  1,
} cordic_coordinates_e;

/* Reciprocals of the CORDIC gains, stored in Q format; used either to seed
 * 'x' before a run or to scale the result afterwards. */
static const d_t cordic_circular_inverse_scaling   = 0x9B74; /* 1/scaling-factor */
static const d_t cordic_hyperbolic_inverse_scaling = 0x13520; /* 1/scaling-factor */

/* Sign that the product a*b would have, as -QINT(1) or QINT(1), worked out
 * without performing the multiplication. Zero counts as positive. */
static inline int mulsign(d_t a, d_t b) {
	const int signs_differ = (a < 0) != (b < 0);
	if (signs_differ)
		return -QINT(1);
	return QINT(1);
}

/* Universal CORDIC <https://en.wikibooks.org/wiki/Digital_Circuits/CORDIC>
 *
 *	x(i+1) = x(i) - u.d(i).y(i).pow(2, -i)
 * 	y(i+1) = y(i) +   d(i).x(i).pow(2, -i)
 * 	z(i+1) = z(i) -   d(i).a(i)
 *
 *  d(i) =  sgn(z(i))      (rotation)
 *  d(i) = -sgn(x(i).y(i)) (vectoring)
 *
 *             hyperbolic      linear          circular
 *  u =                -1           0                 1
 *  a = atanh(pow(2, -i))  pow(2, -i)  atan(pow(2, -i))
 *
 *  linear shift sequence:      i = 0, 1, 2, 3, ...
 *  circular shift sequence:    i = 1, 2, 3, 4, ...
 *  hyperbolic shift sequence:  i = 1, 2, 3, 4, 4, 5, ... */
/* Run the universal CORDIC iteration in place on (*x0, *y0, *z0).
 *
 * coord      - coordinate system; selects the lookup table and how 'x' is
 *              updated
 * mode       - rotation (direction taken from 'z') or vectoring (direction
 *              taken from 'y')
 * iterations - number of passes; negative values, and values larger than the
 *              selected table, both mean "use the whole table"
 *
 * Returns the number of passes used, -1 for an unknown mode or -2 for an
 * unknown coordinate system. The outputs are only written on success. */
static int cordic(const cordic_coordinates_e coord, const cordic_mode_e mode, int iterations, d_t *x0, d_t *y0, d_t *z0) {
	assert(x0);
	assert(y0);
	assert(z0);
	if (mode != CORDIC_MODE_VECTOR_E && mode != CORDIC_MODE_ROTATE_E)
		return -1;

	/* The tables below are written for 32-bit values */
	BUILD_BUG_ON(sizeof(d_t) != sizeof(uint32_t));
	BUILD_BUG_ON(sizeof(u_t) != sizeof(uint32_t));

	static const u_t arctans[] = { /* atan(2^0), atan(2^-1), atan(2^-2), ... */
		0xC90FuL, 0x76B1uL, 0x3EB6uL, 0x1FD5uL,
		0x0FFAuL, 0x07FFuL, 0x03FFuL, 0x01FFuL,
		0x00FFuL, 0x007FuL, 0x003FuL, 0x001FuL,
		0x000FuL, 0x0007uL, 0x0003uL, 0x0001uL,
		0x0000uL, // 0x0000uL,
	};
	static const size_t arctans_length = sizeof arctans / sizeof arctans[0];

	static const u_t arctanhs[] = { /* atanh(2^-1), atanh(2^-2), ... */
		0x8c9fuL, 0x4162uL, 0x202buL, 0x1005uL,
		0x0800uL, 0x0400uL, 0x0200uL, 0x0100uL,
		0x0080uL, 0x0040uL, 0x0020uL, 0x0010uL,
		0x0008uL, 0x0004uL, 0x0002uL, 0x0001uL,
		0x0000uL, // 0x0000uL,
	};
	static const size_t arctanhs_length = sizeof arctanhs / sizeof arctanhs[0];

	static const u_t halfs[] = { /* 2^0, 2^-1, 2^-2, ..*/
		0x10000uL,
		0x8000uL, 0x4000uL, 0x2000uL, 0x1000uL,
		0x0800uL, 0x0400uL, 0x0200uL, 0x0100uL,
		0x0080uL, 0x0040uL, 0x0020uL, 0x0010uL,
		0x0008uL, 0x0004uL, 0x0002uL, 0x0001uL,
		//0x0000uL, // 0x0000uL,
	};
	static const size_t halfs_length = sizeof halfs / sizeof halfs[0];

	/* 'j' counts passes and indexes the lookup table; 'i' is a shift
	 * amount that may start at a different value; 'k' paces the repeated
	 * passes in hyperbolic mode. 'shiftx'/'shifty' point at whichever of
	 * 'i' and 'j' supplies the shift for the x and y updates. */
	const u_t *lookup = NULL;
	size_t i = 0, j = 0, k = 0, length = 0;
	const size_t *shiftx = NULL, *shifty = NULL;
	int hyperbolic = 0;

	switch (coord) {
	case CORDIC_COORD_CIRCULAR_E:
		lookup = arctans;
		length = arctans_length;
		i = 0;
		shifty = &i;
		shiftx = &i;
		break;
	case CORDIC_COORD_HYPERBOLIC_E:
		lookup = arctanhs;
		length = arctanhs_length;
		hyperbolic = 1;
		i = 1;
		shifty = &i;
		shiftx = &i;
		break;
	case CORDIC_COORD_LINEAR_E:
		lookup = halfs;
		length = halfs_length;
		shifty = &j;
		shiftx = NULL; /* 'x' is left unchanged in linear mode */
		i = 1;
		break;
	default: /* not implemented */
		return -2;
	}

	/* Clamp the pass count to the table size; negative selects all of it */
	iterations = iterations > (int)length ? (int)length : iterations;
	iterations = iterations < 0           ? (int)length : iterations;

	d_t x = *x0, y = *y0, z = *z0;

	/* rotation mode: z determines direction,
	 * vector mode:   y determines direction */
	for (; j < (unsigned)iterations; i++, j++) {
		again:
		{
			const d_t  m = mode == CORDIC_MODE_ROTATE_E ? z : -y /*-mulsign(x, y)*/;
			/* 'd' is 0 or -1 (all ones); "(v ^ d) - d" leaves 'v'
			 * alone when 'd' is 0 and negates it when 'd' is -1 */
			const d_t  d =   -!!(m < 0);
			const d_t xs = ((((shiftx ? divn(y, *shiftx) : 0)) ^ d) - d);
			const d_t ys =             (divn(x, *shifty)       ^ d) - d;
			const d_t xn = x - (hyperbolic ? -xs : xs);
			const d_t yn = y + ys;
			const d_t zn = z - ((lookup[j] ^ d) - d);
			x = xn; /* cosine, in circular, rotation mode */
			y = yn; /*   sine, in circular, rotation mode   */
			z = zn;
		}
		if (hyperbolic) { /* Experimental/Needs bug fixing */
			/* Only 'case 1' is reachable: after every fourth time
			 * through here the pass is run once more with the same
			 * 'i' and 'j'. */
			switch (1) { // TODO: Correct hyperbolic redo of iteration
			case 0: break;
			case 1: if (k++ >= 3) { k = 0; goto again; } break;
			case 2: {
				assert(j <= 120);
				size_t cmp = j + 1;
				if (cmp == 4 || cmp == 13 /*|| cmp == 40 || cmp == 121 || cmp == floor(pow(3,i-1)/2) */) {
					if (k) {
						k = 0;
					} else {
						k = 1;
						goto again;
					}
				}
				break;
			}
			}
		}
	}
	*x0 = x;
	*y0 = y;
	*z0 = z;

	return iterations;
}

/* See: - <https://dspguru.com/dsp/faqs/cordic/>
 *      - <https://en.wikipedia.org/wiki/CORDIC> */
/* Compute the sine and cosine of 'theta' (radians) with CORDIC.
 *
 * The angle is first reduced to the range -pi/4 to pi/4 using additions
 * only, the core routine is run in circular rotation mode, and the
 * reductions are then undone by swapping and negating the results.
 *
 * Returns 0 on success and -1 if the core routine reports an error, in
 * which case the outputs are not written. */
static int qcordic(q_t theta, const int iterations, q_t *sine, q_t *cosine) {
	assert(sine);
	assert(cosine);

	static const q_t full_turn    = QPI*2, neg_full_turn    = -(QPI*2);
	static const q_t half_turn    = QPI,   neg_half_turn    = -QPI;
	static const q_t quarter_turn = QPI/2, neg_quarter_turn = -(QPI/2);
	static const q_t eighth_turn  = QPI/4, neg_eighth_turn  = -(QPI/4);

	/* Wrap into -pi to pi. qmod would also work, but it multiplies and
	 * divides, and if those were cheap there would be better ways than
	 * CORDIC of getting a sine or cosine. */
	while (qless(theta, neg_half_turn)) {
		theta = qadd(theta, full_turn);
	}
	while (qmore(theta, half_turn)) {
		theta = qadd(theta, neg_full_turn);
	}

	/* fold into -pi/2 to pi/2; both results change sign */
	int negate = 0;
	if (qless(theta, neg_quarter_turn)) {
		negate = 1;
		theta  = qadd(theta, half_turn);
	} else if (qmore(theta, quarter_turn)) {
		negate = 1;
		theta  = qadd(theta, neg_half_turn);
	}

	/* fold into -pi/4 to pi/4; remember which way we turned */
	int shift = 0;
	if (qless(theta, neg_eighth_turn)) {
		shift = -1;
		theta = qadd(theta, quarter_turn);
	} else if (qmore(theta, eighth_turn)) {
		shift = 1;
		theta = qadd(theta, neg_quarter_turn);
	}

	/* Seeding x with the inverse gain means no scaling is needed later;
	 * theta needs no scaling either. */
	d_t x = cordic_circular_inverse_scaling, y = 0, z = theta;

	/* CORDIC in Q2.16 format */
	if (cordic(CORDIC_COORD_CIRCULAR_E, CORDIC_MODE_ROTATE_E, iterations, &x, &y, &z) < 0)
		return -1;

	/* undo the quarter turn, then the half turn */
	d_t cos_out = x, sin_out = y;
	if (shift > 0) {
		cos_out = -y;
		sin_out =  x;
	} else if (shift < 0) {
		cos_out =  y;
		sin_out = -x;
	}
	if (negate) {
		cos_out = -cos_out;
		sin_out = -sin_out;
	}

	*cosine = cos_out;
	*sine   = sin_out;
	return 0;
}

/* Arc tangent of 't': circular vectoring CORDIC started from the point
 * (1, t); the result is the accumulated 'z'. The status returned by the
 * core routine is not checked. */
q_t qatan(const q_t t) {
	q_t x = qint(1);
	q_t y = t;
	q_t angle = QINT(0);
	cordic(CORDIC_COORD_CIRCULAR_E, CORDIC_MODE_VECTOR_E, -1, &x, &y, &angle);
	return angle;
}

/* Two argument arc tangent, with 'a' as the y and 'b' as the x argument.
 *
 * b == 0: returns +pi/2 or -pi/2 according to the sign of 'a'; both
 *         arguments being zero is rejected by assertion.
 * b <  0: computed from qatan(a / b), shifted by +pi or -pi.
 * b >  0: circular vectoring CORDIC directly on (b, a). */
q_t qatan2(const q_t a, const q_t b) {
	const q_t zero = QINT(0);
	if (qequal(b, zero)) {
		assert(qunequal(a, zero));
		return qmore(a, zero) ? QPI/2 : -(QPI/2);
	}
	if (qless(b, zero)) {
		const q_t principal = qatan(qdiv(a, b));
		if (qeqmore(a, zero))
			return qadd(principal, QPI);
		return qsub(principal, QPI);
	}
	q_t x = b, y = a, angle = zero;
	cordic(CORDIC_COORD_CIRCULAR_E, CORDIC_MODE_VECTOR_E, -1, &x, &y, &angle);
	return angle;
}

/* Compute sine and cosine of 'theta' together, using every CORDIC
 * iteration available. Failure of the underlying routine is only caught by
 * assertion. */
void qsincos(q_t theta, q_t *sine, q_t *cosine) {
	assert(sine);
	assert(cosine);
	const int status = qcordic(theta, -1, sine, cosine);
	assert(status >= 0);
}

/* The four functions below all obtain sine and cosine from a single
 * qsincos() call and return, or combine, the parts they need. */

q_t qsin(const q_t theta) {
	q_t s = QINT(0), c = QINT(0);
	qsincos(theta, &s, &c);
	return s;
}

q_t qcos(const q_t theta) {
	q_t s = QINT(0), c = QINT(0);
	qsincos(theta, &s, &c);
	return c;
}

/* sine / cosine; qcordic_div could be used, with the range limits it imposes */
q_t qtan(const q_t theta) {
	q_t s = QINT(0), c = QINT(0);
	qsincos(theta, &s, &c);
	return qdiv(s, c);
}

/* cosine / sine; qcordic_div could be used, with the range limits it imposes */
q_t qcot(const q_t theta) {
	q_t s = QINT(0), c = QINT(0);
	qsincos(theta, &s, &c);
	return qdiv(c, s);
}

/* Multiplication by linear rotation CORDIC: starting from x = a, y = 0,
 * z = b the product is read from 'y'.
 * Works for small values; result < 4. */
q_t qcordic_mul(const q_t a, const q_t b) {
	q_t x = a;
	q_t product = QINT(0);
	q_t z = b;
	const int status = cordic(CORDIC_COORD_LINEAR_E, CORDIC_MODE_ROTATE_E, -1, &x, &product, &z);
	assert(status >= 0);
	return product;
}

/* Division by linear vectoring CORDIC: starting from x = b, y = a, z = 0
 * the quotient a / b is read from 'z'. */
q_t qcordic_div(const q_t a, const q_t b) {
	q_t x = b;
	q_t y = a;
	q_t quotient = QINT(0);
	const int status = cordic(CORDIC_COORD_LINEAR_E, CORDIC_MODE_VECTOR_E, -1, &x, &y, &quotient);
	assert(status >= 0);
	return quotient;
}

/* Hyperbolic sine and cosine of 'a' in one go, using hyperbolic rotation
 * CORDIC. 'x' is seeded with the inverse hyperbolic gain; afterwards 'x'
 * is stored as the cosh result and 'y' as the sinh result. */
void qsincosh(const q_t a, q_t *sinh, q_t *cosh) {
	assert(sinh);
	assert(cosh);
	q_t x = cordic_hyperbolic_inverse_scaling;
	q_t y = QINT(0);
	q_t z = a; /* (e^2x - 1) / (e^2x + 1) */
	const int status = cordic(CORDIC_COORD_HYPERBOLIC_E, CORDIC_MODE_ROTATE_E, -1, &x, &y, &z);
	assert(status >= 0);
	*cosh = x;
	*sinh = y;
}

/* Each function below makes one qsincosh() call and returns, or combines,
 * the parts it needs. */

/* sinh / cosh */
q_t qtanh(const q_t a) {
	q_t sh = QINT(0), ch = QINT(0);
	qsincosh(a, &sh, &ch);
	return qdiv(sh, ch);
}

q_t qcosh(const q_t a) {
	q_t sh = QINT(0), ch = QINT(0);
	qsincosh(a, &sh, &ch);
	return ch;
}

q_t qsinh(const q_t a) {
	q_t sh = QINT(0), ch = QINT(0);
	qsincosh(a, &sh, &ch);
	return sh;
}

/* Exponential formed as sinh(e) + cosh(e), both taken from one
 * qsincosh() call. */
q_t qcordic_exp(const q_t e) {
	q_t sh = QINT(0), ch = QINT(0);
	qsincosh(e, &sh, &ch);
	return qadd(sh, ch);
}

/* Natural logarithm by hyperbolic vectoring CORDIC: the iteration is
 * started from x = d + 1, y = d - 1 and the resulting 'z' is doubled. */
q_t qcordic_ln(const q_t d) {
	const q_t one = QINT(1);
	q_t x = qadd(d, one);
	q_t y = qsub(d, one);
	q_t z = QINT(0);
	const int status = cordic(CORDIC_COORD_HYPERBOLIC_E, CORDIC_MODE_VECTOR_E, -1, &x, &y, &z);
	assert(status >= 0);
	return qadd(z, z);
}

/* Square root by hyperbolic vectoring CORDIC, started from x = n + 0.25,
 * y = n - 0.25; the final 'x' is multiplied by the inverse hyperbolic gain.
 * Testing only; works for 0 < x < 2. */
q_t qcordic_sqrt(const q_t n) {
	const q_t quarter = 1uLL << (QBITS - 2); /* 0.25 */
	q_t x = qadd(n, quarter);
	q_t y = qsub(n, quarter);
	q_t z = 0;
	const int status = cordic(CORDIC_COORD_HYPERBOLIC_E, CORDIC_MODE_VECTOR_E, -1, &x, &y, &z);
	assert(status >= 0);
	return qmul(x, cordic_hyperbolic_inverse_scaling);
}

/* Length of the hypotenuse for sides 'a' and 'b': circular vectoring CORDIC
 * on the magnitudes of the inputs, with the final 'x' multiplied by the
 * inverse circular gain. */
q_t qhypot(const q_t a, const q_t b) {
	q_t x = qabs(a); /* abs() should not be needed? */
	q_t y = qabs(b);
	q_t z = QINT(0);
	const int status = cordic(CORDIC_COORD_CIRCULAR_E, CORDIC_MODE_VECTOR_E, -1, &x, &y, &z);
	assert(status >= 0);
	return qmul(x, cordic_circular_inverse_scaling);
}

/* Inverse hyperbolic tangent, computed as ln((1 + x) / (1 - x)) / 2.
 * Only defined for |x| < 1, which is asserted; the check is made on the
 * magnitude of 'x' so that values of -1 and below are rejected as well. */
q_t qatanh(q_t x) {
	assert(qless(qabs(x), QINT(1)));
	const q_t ratio = qdiv(qadd(QINT(1), x), qsub(QINT(1), x));
	return qmul(qlog(ratio), QMK(0, 0x8000, 16)); /* multiply by one half */
}

/* Inverse hyperbolic sine: ln(x + sqrt(x*x + 1)). */
q_t qasinh(q_t x) {
	const q_t radicand = qadd(qmul(x, x), QINT(1));
	const q_t root = qsqrt(radicand);
	return qlog(qadd(x, root));
}

/* Inverse hyperbolic cosine: ln(x + sqrt(x*x - 1)); 'x' must be at least
 * one (asserted). */
q_t qacosh(q_t x) {
	assert(qeqmore(x, QINT(1)));
	const q_t radicand = qsub(qmul(x, x), QINT(1));
	const q_t root = qsqrt(radicand);
	return qlog(qadd(x, root));
}

/* Polar to rectangular conversion: '*i' receives magnitude * sin(theta)
 * and '*j' receives magnitude * cos(theta).
 * NOTE(review): qrec2pol() feeds 'i' to CORDIC as the x coordinate, which
 * suggests the sine/cosine roles here may be the wrong way around; confirm
 * the intended convention before relying on round trips. */
void qpol2rec(const q_t magnitude, const q_t theta, q_t *i, q_t *j) {
	assert(i);
	assert(j);
	q_t s = QINT(0), c = QINT(0);
	qsincos(theta, &s, &c);
	const q_t scaled_sine = qmul(s, magnitude);
	*i = scaled_sine;
	*j = qmul(c, magnitude);
}

/* Rectangular to polar conversion. Circular vectoring CORDIC is run on the
 * magnitudes of 'i' and 'j'; the final 'x', multiplied by the inverse gain,
 * is the magnitude, and 'z' is the angle, to which an offset chosen from
 * the signs of the inputs is added. */
void qrec2pol(const q_t i, const q_t j, q_t *magnitude, q_t *theta) {
	assert(magnitude);
	assert(theta);
	const int i_negative = qisnegative(i);
	const int j_negative = qisnegative(j);
	q_t x = qabs(i);
	q_t y = qabs(j);
	q_t angle = QINT(0);
	const int status = cordic(CORDIC_COORD_CIRCULAR_E, CORDIC_MODE_VECTOR_E, -1, &x, &y, &angle);
	assert(status >= 0);
	*magnitude = qmul(x, cordic_circular_inverse_scaling);
	if (i_negative && j_negative) {
		angle = qadd(angle, QPI);
	} else if (j_negative) {
		angle = qadd(angle, QPI/2l);
	} else if (i_negative) {
		angle = qadd(angle, (3l*QPI)/2l);
	}
	*theta = angle;
}

/* Both helpers run 'n' rotation-mode passes starting from x = 1, y = 0,
 * z = 0 and return the resulting 'x'. */

q_t qcordic_hyperbolic_gain(const int n) {
	q_t gain = QINT(1);
	q_t y = QINT(0);
	q_t z = QINT(0);
	const int status = cordic(CORDIC_COORD_HYPERBOLIC_E, CORDIC_MODE_ROTATE_E, n, &gain, &y, &z);
	assert(status >= 0);
	return gain;
}

q_t qcordic_circular_gain(const int n) {
	q_t gain = QINT(1);
	q_t y = QINT(0);
	q_t z = QINT(0);
	const int status = cordic(CORDIC_COORD_CIRCULAR_E, CORDIC_MODE_ROTATE_E, n, &gain, &y, &z);
	assert(status >= 0);
	return gain;
}

/* 1 when 'n' is odd, 0 when it is even. */
static inline int isodd(const unsigned n) {
	return (n % 2u) != 0u;
}

/* Integer power b^e by repeated squaring
 * (https://stackoverflow.com/questions/101439). Overflow is not checked. */
d_t dpower(d_t b, unsigned e) {
	d_t result = 1;
	for (;;) {
		if (isodd(e)) /* this bit of the exponent contributes */
			result *= b;
		e >>= 1;
		if (e == 0)
			return result;
		b *= b;
	}
}

/* Integer logarithm: the number of times 'x' can be divided by 'base'
 * before the quotient becomes zero, not counting the division that yields
 * zero. 'x' must be non-zero and 'base' greater than one (asserted). */
d_t dlog(d_t x, const unsigned base) {
	assert(x && base > 1);
	d_t count = 0;
	/* can use >> for bases that are powers of two */
	for (x /= (d_t)base; x; x /= (d_t)base)
		count++;
	return count;
}

/* Natural logarithm of 'x', which must be positive (asserted).
 * While the argument is above the limit handled by the CORDIC routine it
 * is halved, adding ln(2) to the result for each halving. */
q_t qlog(q_t x) {
	assert(qmore(x, 0));
	static const q_t lmax = QMK(9, 0x8000, 16); /* 9.5, lower limit needs checking */
	q_t halvings = 0;
	while (qmore(x, lmax)) {
		halvings = qadd(halvings, qinfo.ln2);
		x = divn(x, 1);
	}
	return qadd(halvings, qcordic_ln(x));
}

/* 'x' multiplied by itself, via the saturating qmul(). */
q_t qsqr(const q_t x) {
	const q_t squared = qmul(x, x);
	return squared;
}

/* Exponential function. Arguments below one go straight to the CORDIC
 * routine (1.1268 is approximately its limit); larger ones use the identity
 * exp(e) = exp(e/2) * exp(e/2), applied recursively. */
q_t qexp(const q_t e) {
	if (!qless(e, QINT(1))) {
		const q_t half = divn(e, 1);
		return qsqr(qexp(half));
	}
	return qcordic_exp(e);
}

/* Raise 'n' to the power 'exp'.
 *
 * Preconditions (asserted): a negative base requires an integer exponent,
 * and zero to the power of zero is not allowed.
 *
 * Special cases:
 *   exp == 0           -> exactly one
 *   n == 0, exp > 0    -> zero
 *   n == 0, exp < 0    -> qinfo.max (the true result is unbounded)
 *   n < 0              -> power of |n|, negated when 'exp' is odd
 *   exp < 0            -> reciprocal of the positive power
 * Everything else is computed as exp(ln(n) * exp); the product is formed
 * with the saturating qmul() so that it cannot be silently truncated. */
q_t qpow(q_t n, q_t exp) {
	implies(qisnegative(n), qisinteger(exp));
	implies(qequal(n, QINT(0)), qunequal(exp, QINT(0)));
	if (qequal(QINT(0), exp))
		return QINT(1);
	if (qequal(QINT(0), n))
		return qisnegative(exp) ? (q_t)qinfo.max : QINT(0);
	if (qisnegative(n)) {
		q_t magnitude = qabs(n);
		/* the most negative number has no positive counterpart; clamp
		 * it, otherwise this would recurse forever */
		if (qisnegative(magnitude))
			magnitude = qinfo.max;
		const q_t abspow = qpow(magnitude, exp);
		return qisodd(exp) ? qnegate(abspow) : abspow;
	}
	if (qisnegative(exp))
		return qdiv(QINT(1), qpow(n, qabs(exp)));
	return qexp(qmul(qlog(n), exp));
}

q_t qsqrt(const q_t x) { /* Newton-Rhaphson method */
	assert(qeqmore(x, 0));
	const q_t difference = qmore(x, QINT(100)) ? 0x0100 : 0x0010;
	if (qequal(QINT(0), x))
		return QINT(0);
	q_t guess = qmore(x, qinfo.sqrt2) ? divn(x, 1) : QINT(1);
	while (qmore(qabs(qsub(qmul(guess, guess), x)), difference))
		guess = divn(qadd(qdiv(x, guess), guess), 1);
	return qabs(guess); /* correct for overflow int very large numbers */
}

/* Arc sine, computed as atan2(t, sqrt(1 - t*t)); requires |t| < 1
 * (asserted).
 * Can also use: qatan(qdiv(t, qsqrt(qsub(QINT(1), qmul(t, t))))) */
q_t qasin(const q_t t) {
	assert(qless(qabs(t), QINT(1)));
	const q_t adjacent = qsqrt(qsub(QINT(1), qmul(t, t)));
	return qatan2(t, adjacent);
}

/* Arc cosine, computed as atan2(sqrt(1 - t*t), t); requires |t| <= 1
 * (asserted).
 * Can also use: qatan(qdiv(qsqrt(qsub(QINT(1), qmul(t, t))), t)) */
q_t qacos(const q_t t) {
	assert(qeqless(qabs(t), QINT(1)));
	const q_t opposite = qsqrt(qsub(QINT(1), qmul(t, t)));
	return qatan2(opposite, t);
}

/* Degrees to radians: (pi * deg) / 180, multiplying first. */
q_t qdeg2rad(const q_t deg) {
	const q_t scaled = qmul(QPI, deg);
	return qdiv(scaled, QINT(180));
}

/* Radians to degrees: (180 * rad) / pi, multiplying first. */
q_t qrad2deg(const q_t rad) {
	const q_t scaled = qmul(QINT(180), rad);
	return qdiv(scaled, QPI);
}

/* Reset a filter: the structure is zeroed, then the start time and the RC
 * constant are stored and both the filtered and the raw value are set to
 * 'seed'. */
void qfilter_init(qfilter_t *f, const q_t time, const q_t rc, const q_t seed) {
	assert(f);
	memset(f, 0, sizeof(*f));
	f->raw      = seed;
	f->filtered = seed; /* alpha * seed for LPF */
	f->rc       = rc;
	f->time     = time;
}

/* Feed one sample taken at 'time' through a low pass filter and return the
 * new output.
 *
 * alpha = dt / (rc + dt) and output += alpha * (data - output), where dt is
 * the time since the previous call. If the calling rate were constant the
 * costly alpha calculation could be avoided. */
q_t qfilter_low_pass(qfilter_t *f, const q_t time, const q_t data) {
	assert(f);
	const q_t elapsed = (u_t)time - (u_t)f->time;
	const q_t alpha   = qdiv(elapsed, qadd(f->rc, elapsed));
	const q_t step    = qsub(data, f->filtered);
	f->filtered = qfma(alpha, step, f->filtered);
	f->raw  = data;
	f->time = time;
	return f->filtered;
}

/* Feed one sample taken at 'time' through a high pass filter and return the
 * new output.
 *
 * alpha = rc / (rc + dt) and output = alpha * (output + data - previous
 * raw sample), where dt is the time since the previous call. */
q_t qfilter_high_pass(qfilter_t *f, const q_t time, const q_t data) {
	assert(f);
	const q_t elapsed = (u_t)time - (u_t)f->time;
	const q_t alpha   = qdiv(f->rc, qadd(f->rc, elapsed));
	const q_t change  = qsub(data, f->raw);
	f->filtered = qmul(alpha, qadd(f->filtered, change));
	f->raw  = data;
	f->time = time;
	return f->filtered;
}

/* Most recent output of the filter, without feeding it a new sample. */
q_t qfilter_value(const qfilter_t *f) {
	assert(f);
	const q_t current = f->filtered;
	return current;
}

/* Must be called at a constant rate; perhaps a PID which takes call time
 * into account could be made, but that would complicate things. Differentiator
 * term needs filtering also. It would be nice to create a version that took
 * into account the time delta, see
 * <https://www.quora.com/Do-I-need-to-sample-at-a-constant-rate-for-PID-control-or-is-it-sufficient-to-know-the-time-at-which-my-sample-was-taken-even-if-the-increment-varies>
 * */
/* Advance the PID controller by one step and return its output,
 * proportional + integral - derivative.
 *
 * The integrator accumulates 'error' and is clamped to [i_min, i_max]; the
 * derivative term is taken on 'position' rather than on the error, and the
 * position is remembered for the next call. */
q_t qpid_update(qpid_t *pid, const q_t error, const q_t position) {
	assert(pid);
	const q_t proportional = qmul(pid->p_gain, error);

	q_t accumulated = qadd(pid->i_state, error);
	accumulated  = qmax(accumulated, pid->i_min);
	accumulated  = qmin(accumulated, pid->i_max);
	pid->i_state = accumulated;
	const q_t integral = qmul(accumulated, pid->i_gain);

	const q_t derivative = qmul(pid->d_gain, qsub(position, pid->d_state));
	pid->d_state = position;

	return qsub(qadd(proportional, integral), derivative);
}

/* Simpson's method for numerical integration, from "Math Toolkit for
 * Real-Time Programming" by Jack Crenshaw.
 *
 * Integrates 'f' from 'x1' to 'x2' using 'n' intervals; 'n' must be even
 * (asserted) and non-zero.
 *
 * The loop accumulates f(x) + 2*f(x + h) over each pair of intervals, so
 * twice the sum weights the points 2, 4, 2, 4, ... starting at 'x1' and
 * stopping one step short of 'x2'. Simpson's rule needs a weight of one on
 * both end points, so the surplus f(x1) is taken off and the missing f(x2)
 * is added. */
q_t qsimpson(q_t (*f)(q_t), const q_t x1, const q_t x2, const unsigned n) {
	assert(f);
	assert((n & 1) == 0);
	const q_t h = qdiv(qsub(x2, x1), QINT(n));
	q_t sum = 0, x = x1;
	for (unsigned i = 0; i < (n / 2u); i++){
		sum = qadd(sum, qadd(f(x), qmul(QINT(2), f(qadd(x,h)))));
		x   = qadd(x, qmul(QINT(2), h));
	}
	sum = qadd(qsub(qmul(QINT(2), sum), f(x1)), f(x2));
	return qdiv(qmul(h, sum), QINT(3));
}

/* The matrix meta-data field is not used at the moment, but could be
 * used for things like versioning, determining whether the matrix is
 * all zeros, or is the identity matrix, whether it contains valid data,
 * and more. Some common matrix operations are missing, such as factorization.
 *
 * A function for image kernels might be useful. */

/* Indices of the header words at the front of a matrix's q_t array; the
 * elements themselves begin at index DATA. */
enum { METADATA, LENGTH, ROW, COLUMN, DATA, };

/* Check that a matrix header is self-consistent: none of the length, row
 * and column words may be negative, and rows * columns must not exceed the
 * recorded length. Returns 1 if the header is usable and 0 if it is not
 * (including when 'm' is NULL). */
int qmatrix_is_valid(const q_t *m) {
	if (!m)
		return 0;
	/* negative words would turn into enormous sizes once converted */
	if (m[LENGTH] < 0 || m[ROW] < 0 || m[COLUMN] < 0)
		return 0;
	const size_t size = m[LENGTH], row = m[ROW], column = m[COLUMN];
	if (row && column > (SIZE_MAX / row)) /* row * column would overflow */
		return 0;
	if ((row * column) > size)
		return 0;
	return 1;
}

/* Change the dimensions recorded in a matrix header. No element data is
 * moved or cleared.
 *
 * Returns 0 on success. Returns -1, leaving the header untouched, if the
 * recorded length is negative, if either dimension cannot be stored in a
 * header word, or if row * column overflows or exceeds the recorded
 * length. */
int qmatrix_resize(q_t *m, const size_t row, const size_t column) {
	assert(m);
	if (m[LENGTH] < 0)
		return -1;
	const size_t sz = m[LENGTH];
	/* the dimensions are stored in q_t sized header words */
	if (row > (size_t)DMAX || column > (size_t)DMAX)
		return -1;
	if (row && column > (SIZE_MAX / row)) /* row * column would overflow */
		return -1;
	if ((row * column) > sz)
		return -1;
	m[ROW]    = row;
	m[COLUMN] = column;
	return 0;
}

/* Apply 'func' to every element of 'a', storing the results in 'r'.
 * 'r' is first resized to the dimensions of 'a'; if that fails -1 is
 * returned and no elements are written. Returns 0 on success. 'r' and 'a'
 * may be the same matrix. */
int qmatrix_apply_unary(q_t *r, const q_t *a, q_t (*func)(q_t)) {
	assert(r);
	assert(qmatrix_is_valid(r));
	assert(a);
	assert(qmatrix_is_valid(a));
	assert(func);
	const size_t rows = a[ROW], columns = a[COLUMN];
	if (qmatrix_resize(r, rows, columns) < 0)
		return -1;
	const q_t *src = &a[DATA];
	q_t *dst = &r[DATA];
	/* elements are visited row by row */
	for (size_t i = 0; i < rows; i++) {
		const size_t start = i * columns;
		for (size_t j = 0; j < columns; j++)
			dst[start + j] = func(src[start + j]);
	}
	return 0;
}

/* Apply 'func(element, c)' to every element of 'a', storing the results in
 * 'r'. 'r' is first resized to the dimensions of 'a'; if that fails -1 is
 * returned and no elements are written. Returns 0 on success. */
int qmatrix_apply_scalar(q_t *r, const q_t *a, q_t (*func)(q_t, q_t), const q_t c) {
	assert(r);
	assert(qmatrix_is_valid(r));
	assert(a);
	assert(qmatrix_is_valid(a));
	assert(func);
	const size_t rows = a[ROW], columns = a[COLUMN];
	if (qmatrix_resize(r, rows, columns) < 0)
		return -1;
	const q_t *src = &a[DATA];
	q_t *dst = &r[DATA];
	/* elements are visited row by row */
	for (size_t i = 0; i < rows; i++) {
		const size_t start = i * columns;
		for (size_t j = 0; j < columns; j++)
			dst[start + j] = func(src[start + j], c);
	}
	return 0;
}

/* Element-wise combination of two matrices: r[i][j] = func(a[i][j], b[i][j]).
 *
 * Unlike the unary/scalar variants 'r' is not resized; 'a', 'b' and 'r'
 * must already have identical dimensions. Returns 0 on success, -1 on a
 * dimension mismatch. */
int qmatrix_apply_binary(q_t *r, const q_t *a, const q_t *b, q_t (*func)(q_t, q_t)) {
	assert(a);
	assert(qmatrix_is_valid(a));
	assert(b);
	assert(qmatrix_is_valid(b));
	assert(r);
	assert(qmatrix_is_valid(r));
	assert(func);
	const size_t rows = a[ROW], columns = a[COLUMN];
	const size_t brows = b[ROW], bcolumns = b[COLUMN];
	const size_t rrows = r[ROW], rcolumns = r[COLUMN];
	const int inputs_match = (rows == brows) && (columns == bcolumns);
	const int output_match = (rows == rrows) && (columns == rcolumns);
	if (!inputs_match)
		return -1;
	if (!output_match)
		return -1;
	const q_t *lhs = &a[DATA], *rhs = &b[DATA];
	q_t *dst = &r[DATA];
	for (size_t i = 0; i < rows; i++) {
		const size_t base = i * columns; /* start of row 'i' */
		for (size_t j = 0; j < columns; j++)
			dst[base + j] = func(lhs[base + j], rhs[base + j]);
	}
	return 0;
}

/* Constant generators used with qmatrix_apply_unary(): the argument is
 * ignored and QINT(0) / QINT(1) is returned. */
static q_t qfz(q_t a) { UNUSED(a); return QINT(0); }
static q_t qf1(q_t a) { UNUSED(a); return QINT(1); }

/* In-place fills: every element of 'r' becomes QINT(0) / QINT(1). */
int qmatrix_zero(q_t *r)    { return qmatrix_apply_unary(r, r, qfz); }
int qmatrix_one(q_t *r)     { return qmatrix_apply_unary(r, r, qf1); }
/* Element-wise unary operations: 'r' receives the named scalar function
 * applied to each element of 'a' (see qmatrix_apply_unary for the return
 * value). */
int qmatrix_logical(q_t *r, const q_t *a) { return qmatrix_apply_unary(r, a, qlogical); }
int qmatrix_not(q_t *r, const q_t *a)     { return qmatrix_apply_unary(r, a, qnot); }
int qmatrix_signum(q_t *r, const q_t *a)  { return qmatrix_apply_unary(r, a, qsignum); }
int qmatrix_invert(q_t *r, const q_t *a)  { return qmatrix_apply_unary(r, a, qinvert); }
/* Element-wise binary operations on two matrices; 'r', 'a' and 'b' must
 * share the same dimensions (see qmatrix_apply_binary). */
int qmatrix_add(q_t *r, const q_t *a, const q_t *b) { return qmatrix_apply_binary(r, a, b, qadd); }
int qmatrix_sub(q_t *r, const q_t *a, const q_t *b) { return qmatrix_apply_binary(r, a, b, qsub); }
int qmatrix_and(q_t *r, const q_t *a, const q_t *b) { return qmatrix_apply_binary(r, a, b, qand); }
int qmatrix_or (q_t *r, const q_t *a, const q_t *b) { return qmatrix_apply_binary(r, a, b, qor); }
int qmatrix_xor(q_t *r, const q_t *a, const q_t *b) { return qmatrix_apply_binary(r, a, b, qxor); }

/* Matrix/scalar operations: each element of 'a' is combined with 'scalar'
 * using the named function, with the matrix element as the first operand
 * and 'scalar' as the second (see qmatrix_apply_scalar). Note that no
 * check for a zero 'scalar' is made here for div/mod/rem. */
int qmatrix_scalar_add(q_t *r, const q_t *a, const q_t scalar) { return qmatrix_apply_scalar(r, a, qadd, scalar); }
int qmatrix_scalar_sub(q_t *r, const q_t *a, const q_t scalar) { return qmatrix_apply_scalar(r, a, qsub, scalar); }
int qmatrix_scalar_mul(q_t *r, const q_t *a, const q_t scalar) { return qmatrix_apply_scalar(r, a, qmul, scalar); }
int qmatrix_scalar_div(q_t *r, const q_t *a, const q_t scalar) { return qmatrix_apply_scalar(r, a, qdiv, scalar); }
int qmatrix_scalar_mod(q_t *r, const q_t *a, const q_t scalar) { return qmatrix_apply_scalar(r, a, qmod, scalar); }
int qmatrix_scalar_rem(q_t *r, const q_t *a, const q_t scalar) { return qmatrix_apply_scalar(r, a, qrem, scalar); }
int qmatrix_scalar_and(q_t *r, const q_t *a, const q_t scalar) { return qmatrix_apply_scalar(r, a, qand, scalar); }
int qmatrix_scalar_or (q_t *r, const q_t *a, const q_t scalar) { return qmatrix_apply_scalar(r, a, qor,  scalar); }
int qmatrix_scalar_xor(q_t *r, const q_t *a, const q_t scalar) { return qmatrix_apply_scalar(r, a, qxor, scalar); }

/* Returns non-zero if the matrix has as many rows as columns. */
int qmatrix_is_square(const q_t *m) {
	assert(m);
	assert(qmatrix_is_valid(m));
	const q_t rows = m[ROW], columns = m[COLUMN];
	return columns == rows;
}

/* Overwrite a square matrix with the identity matrix: QINT(1) on the
 * main diagonal, QINT(0) elsewhere.
 *
 * Returns 0 on success, -1 if 'r' is not square. */
int qmatrix_identity(q_t *r) {
	assert(r);
	assert(qmatrix_is_valid(r));
	if (!qmatrix_is_square(r))
		return -1;
	const size_t n = r[ROW];
	q_t *out = &r[DATA];
	for (size_t row = 0; row < n; row++) {
		for (size_t col = 0; col < n; col++) {
			q_t v = QINT(0);
			if (row == col)
				v = QINT(1);
			out[row*n + col] = v;
		}
	}
	return 0;
}

/* Copy the dimensions and elements of 'a' into 'r'.
 *
 * 'r' is resized to match 'a'. Copying a matrix onto itself is allowed,
 * which is why memmove() is used rather than memcpy().
 *
 * Returns 0 on success, -1 if the byte count would overflow or 'r' does
 * not have the capacity to hold 'a'. */
int qmatrix_copy(q_t *r, const q_t *a) {
	assert(r);
	assert(qmatrix_is_valid(r));
	assert(a);
	assert(qmatrix_is_valid(a));
	const size_t arows = a[ROW], acolumns = a[COLUMN];
	/* Make sure 'arows * acolumns * sizeof (q_t)' fits in a size_t
	 * before it is computed. */
	if (acolumns && arows > ((SIZE_MAX / sizeof (q_t)) / acolumns))
		return -1;
	if (qmatrix_resize(r, arows, acolumns) < 0)
		return -1;
	memmove(&r[DATA], &a[DATA], arows * acolumns * sizeof (q_t));
	return 0;
}

/* Sum of the elements on the main diagonal of a square matrix, the
 * elements are accumulated with qadd() from the top-left downwards. */
q_t qmatrix_trace(const q_t *m) {
	assert(m);
	assert(qmatrix_is_square(m));
	const size_t length = m[ROW];
	const q_t *mm = &m[DATA];
	q_t tr = QINT(0);
	/* Visit the diagonal directly instead of scanning every cell */
	for (size_t i = 0; i < length; i++)
		tr = qadd(tr, mm[i*length + i]);
	return tr;
}

/* Compare two matrices for equality.
 *
 * Two matrices are equal when both dimensions match and every element is
 * bit-for-bit identical. Returns QINT(1) if equal and QINT(0) otherwise. */
q_t qmatrix_equal(const q_t *a, const q_t *b) {
	assert(a);
	assert(qmatrix_is_valid(a));
	assert(b);
	assert(qmatrix_is_valid(b));
	if (a == b) /* same object, nothing to compare */
		return QINT(1);
	const size_t arow = a[ROW], acolumn = a[COLUMN];
	const size_t brow = b[ROW], bcolumn = b[COLUMN];
	/* A mismatch in *either* dimension makes the matrices unequal */
	if (arow != brow || acolumn != bcolumn)
		return QINT(0);
	const q_t *ma = &a[DATA];
	const q_t *mb = &b[DATA];
	return memcmp(ma, mb, sizeof(q_t) * arow * acolumn) == 0 ? QINT(1) : QINT(0);
}

/* Recursive determinant by cofactor (Laplace) expansion along the first
 * row of a 'length' by 'length' matrix stored contiguously, row-major,
 * in 'm'.
 *
 * For each column 'i' of the first row the minor (the matrix with row 0
 * and column 'i' removed) is packed into a scratch array with a row
 * stride of 'length - 1', which is the layout the recursive call reads.
 * Terms are added for even columns and subtracted for odd columns.
 *
 * The scratch space is a variable length array allocated at every level
 * of recursion, so 'length' must be kept small by the caller. A 'length'
 * of zero yields QINT(0). */
static q_t determine(const q_t *m, const size_t length) {
	assert(m);
	if (length == 0) /* nothing to expand, avoid a zero sized array */
		return QINT(0);
	if (length == 1)
		return m[0];
	if (length == 2)
		return qsub(qmul(m[0], m[3]), qmul(m[1], m[2]));
	const size_t sub = length - 1;
	q_t det = QINT(0);
	q_t co[sub * sub]; /* This should really be passed in */
	for (size_t i = 0; i < length; i++) {
		size_t n = 0; /* write position, restarted for every minor */
		for (size_t j = 1; j < length; j++)
			for (size_t k = 0; k < length; k++)
				if (k != i)
					co[n++] = m[j*length + k];
		const q_t term = qmul(m[i], determine(co, sub));
		/* Cofactor sign alternates along the row: + - + - ... */
		det = (i & 1u) ? qsub(det, term) : qadd(det, term);
	}
	return det;
}

/* Determinant of a square matrix; the matrix must have fewer than 16
 * rows (checked with an assertion). The work is done by determine() on
 * the element data. */
q_t qmatrix_determinant(const q_t *m) {
	assert(m);
	assert(qmatrix_is_square(m));
	assert(m[ROW] < 16);
	return determine(&m[DATA], m[ROW]);
}

/* Store the transpose of 'm' in 'r': r[j][i] = m[i][j].
 *
 * 'r' is resized to 'columns by rows' of 'm'. Transposing in place
 * ('r == m') is supported for square matrices only, a non-square matrix
 * cannot be transposed in place by this routine and -1 is returned.
 *
 * Returns 0 on success, -1 if 'r' lacks the capacity for the result. */
int qmatrix_transpose(q_t *r, const q_t *m) {
	assert(r);
	assert(qmatrix_is_valid(r));
	assert(m);
	assert(qmatrix_is_valid(m));
	q_t *mr = &r[DATA];
	const q_t *mm = &m[DATA];
	const size_t mrows = m[ROW], mcolumns = m[COLUMN];
	if (r == m) {
		if (mrows != mcolumns)
			return -1;
		/* Swap across the diagonal, dimensions stay the same */
		for (size_t i = 0; i < mrows; i++)
			for (size_t j = i + 1; j < mcolumns; j++) {
				const q_t t = mr[i*mcolumns + j];
				mr[i*mcolumns + j] = mr[j*mcolumns + i];
				mr[j*mcolumns + i] = t;
			}
		return 0;
	}
	if (qmatrix_resize(r, mcolumns, mrows) < 0)
		return -1;
	/* Source rows have 'mcolumns' cells, destination rows have 'mrows' */
	for (size_t i = 0; i < mrows; i++)
		for (size_t j = 0; j < mcolumns; j++)
			mr[j*mrows + i] = mm[i*mcolumns + j];
	return 0;
}

/* Matrix product: r = a * b.
 *
 * The column count of 'a' must equal the row count of 'b'; 'r' is resized
 * to 'rows of a' by 'columns of b'. The result is written while the
 * operands are still being read, so 'r' must not be the same matrix as
 * 'a' or 'b'.
 *
 * Returns 0 on success, -1 on a dimension mismatch or if 'r' lacks the
 * capacity for the result. */
int qmatrix_mul(q_t *r, const q_t *a, const q_t *b) {
	assert(a);
	assert(qmatrix_is_valid(a));
	assert(b);
	assert(qmatrix_is_valid(b));
	assert(r);
	assert(qmatrix_is_valid(r));
	q_t *mr = &r[DATA];
	const q_t *ma = &a[DATA], *mb = &b[DATA];
	const size_t arows = a[ROW], acolumns = a[COLUMN];
	const size_t brows = b[ROW], bcolumns = b[COLUMN];
	if (acolumns != brows)
		return -1;
	if (qmatrix_resize(r, arows, bcolumns) < 0)
		return -1;
	for (size_t i = 0; i < arows; i++)
		for (size_t j = 0; j < bcolumns; j++) {
			q_t s = QINT(0);
			for (size_t k = 0; k < brows; k++)
				s = qadd(s, qmul(ma[i*acolumns + k], mb[k*bcolumns + j]));
			mr[i*bcolumns + j] = s; /* result rows are 'bcolumns' wide */
		}
	return 0;
}

/* Append a single character to a bounded output cursor.
 *
 * 'str' points at the current write position and 'length' at the number
 * of bytes still available; on success the character is stored, the
 * write position is advanced and the remaining length decremented.
 *
 * Returns 0 on success, -1 if no space remains (nothing is written). */
static int addchar(char **str, size_t *length, const int ch) {
	assert(str && *str);
	assert(length);
	if (!*length) /* test the remaining space, not the pointer */
		return -1;
	char *s = *str;
	*s++ = ch;
	*str = s;
	*length -= 1;
	return 0;
}

/* Append every character of the NUL terminated string 'addme' (without
 * the terminator) to a bounded output cursor using addchar().
 *
 * 'addme' is only read, so it is const qualified; this allows string
 * literals to be passed without discarding qualifiers.
 *
 * Returns 0 on success, -1 as soon as addchar() fails; characters added
 * before the failure stay in the output. */
static int addstr(char **str, size_t *length, const char *addme) {
	assert(str && *str);
	assert(length);
	assert(addme);
	const size_t sz = strlen(addme);
	for (size_t i = 0; i < sz; i++)
		if (addchar(str, length, addme[i]) < 0)
			return -1;
	return 0;
}

/* Format a matrix as text into 'str', which has room for 'length' bytes.
 *
 * Elements are printed with qsprintb() in the given 'base' (2 to 36).
 * Elements within a row are separated by ", ", rows by "; " and the whole
 * matrix is wrapped in "[ " and " ]". An invalid matrix is printed as
 * "[ INVALID ]".
 *
 * On success a NUL terminator is stored after the text when at least one
 * byte of space remains; it is not counted as a failure if there is no
 * room for it, so callers with exactly sized buffers keep working.
 *
 * Returns 0 on success, -1 on an invalid base, a formatting failure or
 * when the buffer is too small. */
int qmatrix_sprintb(const q_t *m, char *str, size_t length, unsigned base) {
	assert(str);
	assert(m);
	const q_t *mm = &m[DATA];
	const size_t rows = m[ROW], columns = m[COLUMN];
	if (base < 2 || base > 36)
		return -1;
	if (!qmatrix_is_valid(m)) {
		if (addstr(&str, &length, "[ INVALID ]") < 0)
			return -1;
		if (length)
			*str = '\0';
		return 0;
	}
	if (addstr(&str, &length, "[ ") < 0)
		return -1;
	for (size_t i = 0; i < rows; i++) {
		for (size_t j = 0; j < columns; j++) {
			const int r = qsprintb(mm[i*columns + j], str, length, base);
			if (r < 0)
				return -1;
			if ((size_t)r > length) /* more consumed than was available */
				return -1;
			length -= r;
			str    += r;
			const int more_columns = (j + 1) < columns;
			const int more_rows    = (i + 1) < rows;
			/* ',' inside a row, ';' between rows, ' ' after the last element */
			if (addchar(&str, &length, more_columns ? ',' : more_rows ? ';' : ' ') < 0)
				return -1;
			if (more_columns || more_rows)
				if (addchar(&str, &length, ' ') < 0)
					return -1;
		}
	}
	if (addchar(&str, &length, ']') < 0)
		return -1;
	if (length)
		*str = '\0';
	return 0;
}

/* Upper bound on the buffer size needed to print a matrix.
 *
 * The estimate is based on the capacity stored in the LENGTH field, not
 * on the current dimensions. An invalid matrix gets a fixed 128 bytes,
 * enough for the invalid matrix message. */
size_t qmatrix_string_length(const q_t *m) {
	assert(m);
	const size_t digits    = 32; /* max length if base 2 is used */
	const size_t sign_dot  = 2;  /* '-' and '.' */
	const size_t separator = 2;  /* space and comma/semi-colon separator */
	const size_t extra     = 16; /* space for extra formatting */
	if (!qmatrix_is_valid(m))
		return 128; /* space for invalid matrix message */
	const size_t cells = m[LENGTH];
	return (cells * (digits + sign_dot + separator)) + extra;
}

/* See <https://github.com/jamesbowman/sincos> 
 * and "Math Toolkit for Real-Time Programming" by Jack Crenshaw 
 *
 * The naming of these functions ('furman_') is incorrect, they do their
 * computation on numbers represented in Furmans but they do not use a 'Furman
 * algorithm'. As I do not have a better name, the name shall stick. */
/* Odd polynomial in 'y' evaluated in Horner form with 16-bit
 * intermediates: y * (s1 + z * (s3 + z * s5)), where 'z' is y squared
 * scaled down by 12 bits. Every partial result is truncated to int16_t. */
static int16_t _sine(const int16_t y) {
	const int16_t s1 = 0x6487, s3 = -0x2953, s5 = 0x04f8;
	const int16_t z = arshift((int32_t)y * y, 12);
	const int16_t t5 = arshift((int32_t)z * s5, 16);
	const int16_t inner = s3 + t5;
	const int16_t t3 = arshift((int32_t)z * inner, 16);
	const int16_t outer = s1 + t3;
	return arshift((int32_t)y * outer,  13);
}

/* Even polynomial in 'y' evaluated in Horner form with 16-bit
 * intermediates: c0 + z * (c2 + z * c4), where 'z' is y squared scaled
 * down by 12 bits. Every partial result is truncated to int16_t. */
static int16_t _cosine(int16_t y) {
	const int16_t c0 = 0x7fff, c2 = -0x4ee9, c4 = 0x0fbd;
	const int16_t z = arshift((int32_t)y * y, 12);
	const int16_t t4 = arshift((int32_t)z * c4,  16);
	const int16_t inner = c2 + t4;
	const int16_t t2 = arshift((int32_t)z * inner, 15);
	return c0 + t2;
}

/* Sine of a 16-bit angle.
 *
 * 'n' is a two bit index derived from the top of 'x + 0x2000'; 'x' is
 * then reduced by 'n << 14'. Bit 0 of 'n' selects the cosine polynomial
 * instead of the sine polynomial and bit 1 negates the result. */
int16_t furman_sin(int16_t x) {
	const int16_t n = 3 & arshift(x + 0x2000, 14);
	x -= n << 14;
	int16_t r;
	if (n & 1)
		r = _cosine(x);
	else
		r = _sine(x);
	if (n & 2)
		return -r;
	return r;
}

/* Cosine of a 16-bit angle, computed as the sine of the angle advanced
 * by 0x4000. */
int16_t furman_cos(int16_t x) {
	const int16_t advanced = x + 0x4000;
	return furman_sin(advanced);
}

/* expression evaluator */

/* Operator associativity, stored in the operator table and consulted when
 * deciding whether operators of equal precedence are evaluated first. */
enum { ASSOCIATE_NONE, ASSOCIATE_LEFT, ASSOCIATE_RIGHT, };
/* Non-negative return values of lex(); lex() returns -1 for input it
 * cannot classify. */
enum { LEX_NUMBER, LEX_OPERATOR, LEX_END, };

/* Prepare an expression evaluator for use.
 *
 * The table entries for "(", ")", "negate" and "-" are looked up once and
 * cached in 'e' so the parser can compare operators by pointer; the
 * object is then marked as initialized. Always returns 0. */
int qexpr_init(qexpr_t *e) {
	assert(e);
	const qoperations_t *left = qop("("), *right = qop(")");
	const qoperations_t *neg = qop("negate"), *sub = qop("-");
	e->lpar   = left;
	e->rpar   = right;
	e->negate = neg;
	e->minus  = sub;
	e->initialized = 1;
	assert(e->lpar && e->rpar && e->negate && e->minus);
	return 0;
}

/* Record an evaluation error.
 *
 * Only the first error is kept: if one is already pending nothing is
 * changed and 0 is returned. Otherwise the printf-style message is
 * formatted into 'e->error_string' (truncated to fit), 'e->error' is set
 * to -1 and -QINT(1) is returned. */
static int error(qexpr_t *e, const char *fmt, ...) {
	assert(e);
	assert(fmt);
	if (!(e->error)) {
		va_list args;
		va_start(args, fmt);
		(void)vsnprintf(e->error_string, sizeof (e->error_string), fmt, args);
		va_end(args);
		e->error = -1;
		return -QINT(1);
	}
	return 0;
}

/* Convert a string to a Q number with qconv(); the status returned by
 * qconv() is deliberately ignored and the result starts out as 0. */
static q_t numberify(const char *s) {
	assert(s);
	q_t result = 0;
	(void) qconv(&result, s);
	return result;
}

/* Expression operator "base": set the global 'qconf.base' to the integer
 * part of 'b'. Values outside of 2..36 are rejected with -QINT(1) and
 * leave the setting alone; otherwise 'b' is returned unchanged. */
static q_t qbase(q_t b) {
	const int nb = qtoi(b);
	const int in_range = (nb >= 2) && (nb <= 36);
	if (!in_range)
		return -QINT(1);
	qconf.base = nb;
	return b;
}

/* Expression operator "places": store the integer part of 'places' in
 * the global 'qconf.dp' and return the argument unchanged. */
static q_t qplaces(q_t places) {
	/* TODO: Bounds checks given base */
	const int dp = qtoi(places);
	qconf.dp = dp;
	return places;
}

/* Argument check for division-like operators: records "division by zero"
 * when the second operand 'b' is zero. Returns QINT(0) when the operands
 * are acceptable, otherwise the result of error(). */
static q_t check_div0(qexpr_t *e, q_t a, q_t b) {
	assert(e);
	UNUSED(a);
	if (b)
		return QINT(0);
	return error(e, "division by zero");
}

/* Argument check "Not Less than Zero": records an error when 'a' is
 * below zero. Returns QINT(0) when acceptable, otherwise the result of
 * error(). */
static q_t check_nlz(qexpr_t *e, q_t a) {
	assert(e);
	if (!qless(a, QINT(0)))
		return QINT(0);
	return error(e, "negative argument");
}

/* Argument check "Not Less than or Equal to Zero": records an error when
 * 'a' is zero or below. Returns QINT(0) when acceptable, otherwise the
 * result of error(). */
static q_t check_nlez(qexpr_t *e, q_t a) {
	assert(e);
	if (!qeqless(a, QINT(0)))
		return QINT(0);
	return error(e, "negative or zero argument");
}

/* Argument check "Not Less than One": records an error when 'a' is below
 * one. Returns QINT(0) when acceptable, otherwise the result of error(). */
static q_t check_nlo(qexpr_t *e, q_t a) {
	assert(e);
	if (!qless(a, QINT(1)))
		return QINT(0);
	return error(e, "out of range [1, INF]");
}

/* Argument check "Absolute value Less than or equal to One": records an
 * error when the magnitude of 'a' exceeds one. Returns QINT(0) when
 * acceptable, otherwise the result of error(). */
static q_t check_alo(qexpr_t *e, q_t a) {
	assert(e);
	const q_t magnitude = qabs(a);
	if (!qmore(magnitude, QINT(1)))
		return QINT(0);
	return error(e, "out of range [-1, 1]");
}

/* Look up an operator or function of the expression evaluator by name.
 *
 * The table below is sorted by name in strcmp() order and is searched
 * with a binary search over the half-open range [lo, hi). Using a
 * half-open range means no index is ever decremented, so a name that
 * sorts before the first entry (such as the empty string) cannot make an
 * unsigned index wrap around.
 *
 * Returns a pointer to the static table entry, or NULL if 'op' does not
 * name a known operation. */
const qoperations_t *qop(const char *op) {
	assert(op);
	static const qoperations_t ops[] = {
		/* Binary Search Table: Use 'LC_ALL="C" sort -k 2 < table' to sort this */
		/* name         function                       check function        precedence arity left/right-assoc hidden */
		{  "!",         .eval.unary   =  qnot,         .check.unary   =  NULL,        5,  1,  ASSOCIATE_RIGHT,  0,  },
		{  "!=",        .eval.binary  =  qunequal,     .check.binary  =  NULL,        2,  2,  ASSOCIATE_LEFT,   0,  },
		{  "%",         .eval.binary  =  qrem,/*!*/    .check.binary  =  check_div0,  3,  2,  ASSOCIATE_LEFT,   0,  },
		{  "&",         .eval.binary  =  qand,         .check.binary  =  NULL,        2,  2,  ASSOCIATE_LEFT,   0,  },
		{  "(",         .eval.unary   =  NULL,         .check.unary   =  NULL,        0,  0,  ASSOCIATE_NONE,   0,  },
		{  ")",         .eval.unary   =  NULL,         .check.unary   =  NULL,        0,  0,  ASSOCIATE_NONE,   0,  },
		{  "*",         .eval.binary  =  qmul,         .check.binary  =  NULL,        3,  2,  ASSOCIATE_LEFT,   0,  },
		{  "+",         .eval.binary  =  qadd,         .check.binary  =  NULL,        2,  2,  ASSOCIATE_LEFT,   0,  },
		{  "-",         .eval.binary  =  qsub,         .check.binary  =  NULL,        2,  2,  ASSOCIATE_LEFT,   0,  },
		{  "/",         .eval.binary  =  qdiv,         .check.binary  =  check_div0,  3,  2,  ASSOCIATE_LEFT,   0,  },
		{  "<",         .eval.binary  =  qless,        .check.binary  =  NULL,        2,  2,  ASSOCIATE_LEFT,   0,  },
		{  "<<",        .eval.binary  =  qlls,         .check.binary  =  NULL,        4,  2,  ASSOCIATE_RIGHT,  0,  },
		{  "<=",        .eval.binary  =  qeqless,      .check.binary  =  NULL,        2,  2,  ASSOCIATE_LEFT,   0,  },
		{  "==",        .eval.binary  =  qequal,       .check.binary  =  NULL,        2,  2,  ASSOCIATE_LEFT,   0,  },
		{  ">",         .eval.binary  =  qmore,        .check.binary  =  NULL,        2,  2,  ASSOCIATE_LEFT,   0,  },
		{  ">=",        .eval.binary  =  qeqmore,      .check.binary  =  NULL,        2,  2,  ASSOCIATE_LEFT,   0,  },
		{  ">>",        .eval.binary  =  qlrs,         .check.binary  =  NULL,        4,  2,  ASSOCIATE_RIGHT,  0,  },
		{  "^",         .eval.binary  =  qxor,         .check.binary  =  NULL,        2,  2,  ASSOCIATE_LEFT,   0,  },
		{  "_div",      .eval.binary  =  qcordic_div,  .check.binary  =  NULL,        5,  2,  ASSOCIATE_RIGHT,  1,  },
		{  "_exp",      .eval.unary   =  qcordic_exp,  .check.unary   =  NULL,        5,  1,  ASSOCIATE_RIGHT,  1,  },
		{  "_ln",       .eval.unary   =  qcordic_ln,   .check.unary   =  check_nlez,  5,  1,  ASSOCIATE_RIGHT,  1,  },
		{  "_mul",      .eval.binary  =  qcordic_mul,  .check.binary  =  NULL,        5,  2,  ASSOCIATE_RIGHT,  1,  },
		{  "_sqrt",     .eval.unary   =  qcordic_sqrt, .check.unary   =  check_nlz,   5,  1,  ASSOCIATE_RIGHT,  1,  },
		{  "abs",       .eval.unary   =  qabs,         .check.unary   =  NULL,        5,  1,  ASSOCIATE_RIGHT,  0,  },
		{  "acos",      .eval.unary   =  qacos,        .check.unary   =  check_alo,   5,  1,  ASSOCIATE_RIGHT,  0,  },
		{  "acosh",     .eval.unary   =  qacosh,       .check.unary   =  check_nlo,   5,  1,  ASSOCIATE_RIGHT,  0,  },
		{  "arshift",   .eval.binary  =  qars,         .check.binary  =  NULL,        4,  2,  ASSOCIATE_RIGHT,  1,  },
		{  "asin",      .eval.unary   =  qasin,        .check.unary   =  check_alo,   5,  1,  ASSOCIATE_RIGHT,  0,  },
		{  "asinh",     .eval.unary   =  qasinh,       .check.unary   =  NULL,        5,  1,  ASSOCIATE_RIGHT,  0,  },
		{  "atan",      .eval.unary   =  qatan,        .check.unary   =  NULL,        5,  1,  ASSOCIATE_RIGHT,  0,  },
		{  "atan2",     .eval.binary  =  qatan2,       .check.binary  =  NULL,        5,  2,  ASSOCIATE_RIGHT,  1,  },
		{  "atanh",     .eval.unary   =  qatanh,       .check.unary   =  check_alo,   5,  1,  ASSOCIATE_RIGHT,  0,  },
		{  "base",      .eval.unary   =  qbase,        .check.unary   =  NULL,        2,  1,  ASSOCIATE_RIGHT,  0,  },
		{  "ceil",      .eval.unary   =  qceil,        .check.unary   =  NULL,        5,  1,  ASSOCIATE_RIGHT,  0,  },
		{  "copysign",  .eval.binary  =  qcopysign,    .check.binary  =  NULL,        4,  2,  ASSOCIATE_RIGHT,  1,  },
		{  "cos",       .eval.unary   =  qcos,         .check.unary   =  NULL,        5,  1,  ASSOCIATE_RIGHT,  0,  },
		{  "cosh",      .eval.unary   =  qcosh,        .check.unary   =  NULL,        5,  1,  ASSOCIATE_RIGHT,  0,  },
		{  "cot",       .eval.unary   =  qcot,         .check.unary   =  NULL,        5,  1,  ASSOCIATE_RIGHT,  0,  },
		{  "deg2rad",   .eval.unary   =  qdeg2rad,     .check.unary   =  NULL,        5,  1,  ASSOCIATE_RIGHT,  0,  },
		{  "even?",     .eval.unary   =  qiseven,      .check.unary   =  NULL,        5,  1,  ASSOCIATE_RIGHT,  0,  },
		{  "exp",       .eval.unary   =  qexp,         .check.unary   =  NULL,        5,  1,  ASSOCIATE_RIGHT,  0,  },
		{  "floor",     .eval.unary   =  qfloor,       .check.unary   =  NULL,        5,  1,  ASSOCIATE_RIGHT,  0,  },
		{  "hypot",     .eval.binary  =  qhypot,       .check.binary  =  NULL,        5,  2,  ASSOCIATE_RIGHT,  0,  },
		{  "int?",      .eval.unary   =  qisinteger,   .check.unary   =  NULL,        5,  1,  ASSOCIATE_RIGHT,  0,  },
		{  "log",       .eval.unary   =  qlog,         .check.unary   =  check_nlez,  5,  1,  ASSOCIATE_RIGHT,  0,  },
		{  "lshift",    .eval.binary  =  qlls,         .check.binary  =  NULL,        4,  2,  ASSOCIATE_RIGHT,  1,  },
		{  "max",       .eval.binary  =  qmax,         .check.binary  =  NULL,        5,  2,  ASSOCIATE_RIGHT,  1,  },
		{  "min",       .eval.binary  =  qmin,         .check.binary  =  NULL,        5,  2,  ASSOCIATE_RIGHT,  1,  },
		{  "mod",       .eval.binary  =  qmod,         .check.binary  =  check_div0,  3,  2,  ASSOCIATE_LEFT,   0,  },
		{  "neg?",      .eval.unary   =  qisnegative,  .check.unary   =  NULL,        5,  1,  ASSOCIATE_RIGHT,  0,  },
		{  "negate",    .eval.unary   =  qnegate,      .check.unary   =  NULL,        5,  1,  ASSOCIATE_RIGHT,  0,  },
		{  "odd?",      .eval.unary   =  qisodd,       .check.unary   =  NULL,        5,  1,  ASSOCIATE_RIGHT,  0,  },
		{  "places",    .eval.unary   =  qplaces,      .check.unary   =  NULL,        2,  1,  ASSOCIATE_RIGHT,  0,  },
		{  "pos?",      .eval.unary   =  qispositive,  .check.unary   =  NULL,        5,  1,  ASSOCIATE_RIGHT,  0,  },
		{  "pow",       .eval.binary  =  qpow,         .check.binary  =  NULL,        5,  2,  ASSOCIATE_RIGHT,  0,  },
		{  "rad2deg",   .eval.unary   =  qrad2deg,     .check.unary   =  NULL,        5,  1,  ASSOCIATE_RIGHT,  0,  },
		{  "rem",       .eval.binary  =  qrem,         .check.binary  =  check_div0,  3,  2,  ASSOCIATE_LEFT,   0,  },
		{  "round",     .eval.unary   =  qround,       .check.unary   =  NULL,        5,  1,  ASSOCIATE_RIGHT,  0,  },
		{  "rshift",    .eval.binary  =  qlrs,         .check.binary  =  NULL,        4,  2,  ASSOCIATE_RIGHT,  1,  },
		{  "sign",      .eval.unary   =  qsign,        .check.unary   =  NULL,        5,  1,  ASSOCIATE_RIGHT,  0,  },
		{  "signum",    .eval.unary   =  qsignum,      .check.unary   =  NULL,        5,  1,  ASSOCIATE_RIGHT,  0,  },
		{  "sin",       .eval.unary   =  qsin,         .check.unary   =  NULL,        5,  1,  ASSOCIATE_RIGHT,  0,  },
		{  "sinh",      .eval.unary   =  qsinh,        .check.unary   =  NULL,        5,  1,  ASSOCIATE_RIGHT,  0,  },
		{  "sqrt",      .eval.unary   =  qsqrt,        .check.unary   =  check_nlz,   5,  1,  ASSOCIATE_RIGHT,  0,  },
		{  "tan",       .eval.unary   =  qtan,         .check.unary   =  NULL,        5,  1,  ASSOCIATE_RIGHT,  0,  },
		{  "tanh",      .eval.unary   =  qtanh,        .check.unary   =  NULL,        5,  1,  ASSOCIATE_RIGHT,  0,  },
		{  "trunc",     .eval.unary   =  qtrunc,       .check.unary   =  NULL,        5,  1,  ASSOCIATE_RIGHT,  0,  },
		{  "|",         .eval.binary  =  qor,          .check.binary  =  NULL,        2,  2,  ASSOCIATE_LEFT,   0,  },
		{  "~",         .eval.unary   =  qinvert,      .check.unary   =  NULL,        5,  1,  ASSOCIATE_RIGHT,  0,  },
	};
	const size_t length = (sizeof ops / sizeof ops[0]);
	size_t lo = 0, hi = length; /* candidates live in [lo, hi) */
	while (lo < hi) { // Iterative Binary Search
		const size_t mid = lo + ((hi - lo)/2u);
		assert (mid < length);
		const int comp = strcmp(ops[mid].name, op);
		if (comp == 0)
			return &ops[mid];
		if (comp < 0)
			lo = mid + 1;
		else
			hi = mid; /* exclusive bound, never 'mid - 1' */
	}
	return NULL;
}

/* Push a value onto the evaluator's number stack.
 *
 * Nothing is pushed if an error is already pending. The capacity test is
 * written as 'count >= max' rather than 'count > max - 1' so that a
 * capacity of zero is reported as an overflow instead of wrapping, should
 * the counters be unsigned.
 *
 * Returns 0 on success, -1 on a pending error or a full stack (in which
 * case "number stack overflow" is recorded). */
static int number_push(qexpr_t *e, q_t num) {
	assert(e);
	if (e->error)
		return -1;
	if (e->numbers_count >= e->numbers_max) {
		error(e, "number stack overflow");
		return -1;
	}
	e->numbers[e->numbers_count++] = num;
	return 0;
}

/* Pop the top value of the evaluator's number stack.
 *
 * Returns -1 if an error is already pending or if the stack is empty (in
 * the latter case "number stack empty" is recorded); callers must check
 * 'e->error' as -1 is indistinguishable from a popped value. */
static q_t number_pop(qexpr_t *e) {
	assert(e);
	if (e->error)
		return -1;
	if (e->numbers_count) {
		e->numbers_count -= 1;
		return e->numbers[e->numbers_count];
	}
	error(e, "number stack empty");
	return -1; /* error handled elsewhere */
}

/* Push an operator onto the evaluator's operator stack.
 *
 * Nothing is pushed if an error is already pending. The capacity test is
 * written as 'count >= max' rather than 'count > max - 1' so that a
 * capacity of zero is reported as an overflow instead of wrapping, should
 * the counters be unsigned.
 *
 * Returns 0 on success, -1 on a pending error or a full stack (in which
 * case "operator stack overflow" is recorded). */
static int op_push(qexpr_t *e, const qoperations_t *op) {
	assert(e);
	assert(op);
	if (e->error)
		return -1;
	if (e->ops_count >= e->ops_max) {
		error(e, "operator stack overflow");
		return -1;
	}
	e->ops[e->ops_count++] = op;
	return 0;
}

/* Return the error status of the evaluator: zero if no error has been
 * recorded. The evaluator must have been initialized. */
int qexpr_error(qexpr_t *e) {
	assert(e);
	assert(e->initialized);
	const int status = e->error;
	return status;
}

/* Return the result of the last evaluation, which is the single value
 * left on the number stack. It is a programming error (asserted) to call
 * this when an error is pending or the stack does not hold exactly one
 * value. */
q_t qexpr_result(qexpr_t *e) {
	assert(e);
	assert(e->initialized);
	assert(e->error == 0);
	assert(e->numbers_count == 1);
	const q_t result = e->numbers[0];
	return result;
}

/* Pop the top entry of the evaluator's operator stack.
 *
 * Returns NULL if an error is already pending or if the stack is empty
 * (in the latter case "operator stack empty" is recorded). */
static const qoperations_t *op_pop(qexpr_t *e) {
	assert(e);
	if (e->error)
		return NULL;
	if (e->ops_count) {
		e->ops_count -= 1;
		return e->ops[e->ops_count];
	}
	error(e, "operator stack empty");
	return NULL;
}

/* Apply the operator on top of the operator stack.
 *
 * One operand is popped for unary operators and two for binary ones (the
 * first value popped is the right hand operand). The operator's optional
 * check function is run first, then the result of the evaluation function
 * is pushed back onto the number stack. An operator without an evaluation
 * function (a parenthesis) is reported as a syntax error.
 *
 * Returns 0 on success and -1 on any failure. */
static int op_eval(qexpr_t *e) {
	assert(e);
	const qoperations_t *o = op_pop(e);
	if (!o)
		return -1;
	const q_t rhs = number_pop(e);
	const int unary = (o->arity == 1);
	const int callable = unary ? BOOLIFY(o->eval.unary) : BOOLIFY(o->eval.binary);
	if (!callable) {
		error(e, "syntax error");
		return -1;
	}
	if (!unary) {
		const q_t lhs = number_pop(e);
		if (o->check.binary && o->check.binary(e, lhs, rhs)) {
			error(e, "binary check failed");
			return -1;
		}
		return number_push(e, o->eval.binary(lhs, rhs));
	}
	if (o->check.unary && o->check.unary(e, rhs) < 0) {
		error(e, "unary check failed");
		return -1;
	}
	return number_push(e, o->eval.unary(rhs));
}

/* Feed one operator to the shunting-yard parser.
 *
 * - "(" is pushed as is.
 * - ")" evaluates stacked operators until the matching "(" is on top, and
 *   then discards it; a missing "(" is an error.
 * - Any other operator first evaluates the stacked operators that bind
 *   tighter (right associative operators) or at least as tight (all
 *   others), and is then pushed itself.
 *
 * Returns 0 on success and -1 on failure. */
static int shunt(qexpr_t *e, const qoperations_t *op) {
	assert(e);
	assert(op);
	if (op == e->lpar)
		return op_push(e, op);
	if (op == e->rpar) {
		while (e->ops_count && e->ops[e->ops_count - 1] != e->lpar)
			if (op_eval(e) < 0 || e->error)
				break;
		const qoperations_t *top = op_pop(e);
		if (top && (top == e->lpar))
			return 0;
		e->error = 0; /* clear error so following error is printed */
		error(e, "expected \"(\"");
		return -1;
	}
	const int right = (op->assocativity == ASSOCIATE_RIGHT);
	for (;;) {
		if (!(e->ops_count))
			break;
		const qoperations_t *top = e->ops[e->ops_count - 1];
		const int yield = right
			? (op->precedence <  top->precedence)
			: (op->precedence <= top->precedence);
		if (!yield)
			break;
		if (op_eval(e) < 0 || e->error)
			break;
	}
	return op_push(e, op);
}

/* Check that 'n' is a valid variable name: a letter or underscore
 * followed by any number of letters, digits or underscores. The empty
 * string is not a valid name.
 *
 * Characters are converted to 'unsigned char' before being handed to the
 * <ctype.h> classifiers, passing a negative 'char' value to them is
 * undefined behaviour.
 *
 * Returns 1 if the name is valid, 0 otherwise. */
static int variable_name_is_valid(const char *n) {
	assert(n);
	if (!isalpha((unsigned char)*n) && !(*n == '_'))
		return 0;
	for (n++; *n; n++)
		if (!isalnum((unsigned char)*n) && !(*n == '_'))
			return 0;
	return 1;
}

/* Find a variable by name with a linear scan over the 'vars_max' entries
 * of 'e->vars'. Every entry visited must have a valid name (asserted).
 *
 * Returns the matching variable, or NULL if there is none. */
static qvariable_t *variable_lookup(qexpr_t *e, const char *name) {
	assert(e);
	assert(name);
	size_t idx = 0;
	while (idx < e->vars_max) {
		qvariable_t *candidate = e->vars[idx];
		assert(candidate->name);
		assert(variable_name_is_valid(candidate->name));
		if (strcmp(candidate->name, name) == 0)
			return candidate;
		idx++;
	}
	return NULL;
}

/* Read the next token from '*expr'.
 *
 * Leading white space is skipped, then one of the following is read:
 *
 * - An identifier (letter or '_' followed by letters, digits or '_'),
 *   which is resolved to a variable (LEX_NUMBER, value in 'e->number')
 *   or to a named operator (LEX_OPERATOR, entry in 'e->op').
 * - A punctuation operator of one or two characters; the two character
 *   form is preferred when it exists in the operator table.
 * - A number made of digits with at most one '.', converted with
 *   numberify() into 'e->number'.
 *
 * The token text is collected in 'e->id'. At most 'sizeof (e->id) - 1'
 * characters are stored so the zeroed buffer always stays NUL terminated
 * for the string functions that read it. Characters are converted to
 * 'unsigned char' before being passed to the <ctype.h> classifiers.
 *
 * Returns LEX_NUMBER or LEX_OPERATOR with '*expr' advanced past the
 * token, LEX_END at the end of input (with '*expr' left unchanged), or
 * -1 if the input is not recognized. */
static int lex(qexpr_t *e, const char **expr) {
	assert(e);
	assert(expr && *expr);
	int r = 0;
	const char *s = *expr;
	const size_t id_max = sizeof (e->id) - 1; /* leave room for the NUL */
	e->id_count = 0;
	e->number = 0;
	e->op = NULL;
	memset(e->id, 0, sizeof (e->id));
	for (; *s && isspace((unsigned char)*s); s++)
		;
	if (!(*s))
		return LEX_END;
	if (isalpha((unsigned char)*s) || *s == '_') {
		for (; e->id_count < id_max && *s && (isalnum((unsigned char)*s) || *s == '_');)
			e->id[e->id_count++] = *s++;
		qvariable_t *v = variable_lookup(e, e->id);
		if (v) {
			e->number = v->value;
			r = LEX_NUMBER;
		} else if ((e->op = qop(e->id))) {
			r = LEX_OPERATOR;
		} else {
			r = -1;
		}
	} else if (ispunct((unsigned char)*s)) {
		const qoperations_t *op1 = NULL, *op2 = NULL;
		int set = 0;
		e->id[e->id_count++] = *s++;
		op1 = qop(e->id);
		if (*s && ispunct((unsigned char)*s)) {
			set = 1;
			e->id[e->id_count++] = *s++;
			op2 = qop(e->id);
		}
		r = (op1 || op2) ? LEX_OPERATOR : -1;
		e->op = op2 ? op2 : op1;
		if (e->op == op1 && set) { /* second character was not part of the operator, give it back */
			s--;
			e->id_count--;
			e->id[1] = 0;
		}
	} else if (isdigit((unsigned char)*s)) {
		r = LEX_NUMBER;
		int dot = 0;
		for (; e->id_count < id_max && *s; s++) {
			const int ch = (unsigned char)*s;
			if (!(isdigit(ch) || (ch == '.' && !dot)))
				break;
			e->id[e->id_count++] = ch;
			if (ch == '.')
				dot = 1;
		}
		e->number = numberify(e->id);
	} else {
		r = -1;
	}
	/*printf("id(%d) %d => %s\n", (int)(s - *expr), r, e->id);*/
	*expr = s;
	return r;
}

/* Evaluate the infix expression in 'expr'.
 *
 * Tokens are read with lex(); numbers go onto the number stack and
 * operators are handed to shunt(), which evaluates as it goes. A "-" that
 * appears at the start of the expression or directly after an operator
 * other than ")" is treated as the unary "negate"; any other binary
 * operator in that position is rejected, with the exception of "(".
 * After the input is consumed the operators left on the stack are
 * evaluated, which must leave exactly one number behind.
 *
 * The per-evaluation state (error, error string, both stack counters) is
 * reset on every call. If 'e' has not been through qexpr_init() yet (its
 * 'initialized' flag is zero) it is initialized here, as the parser
 * relies on the cached operator pointers that qexpr_init() sets up.
 *
 * Returns 0 on success (the value is available from qexpr_result()) and
 * -1 on failure (a description is stored in 'e->error_string'). */
int qexpr(qexpr_t *e, const char *expr) {
	assert(e);
	assert(expr);
	int firstop = 1;
	const qoperations_t *previous = NULL;
	if (!(e->initialized))
		(void)qexpr_init(e);
	memset(e->error_string, 0, sizeof (e->error_string));
	e->error = 0;
	e->ops_count = 0;
	e->numbers_count = 0;
	for (int l = 0; l != LEX_END && !(e->error);) {
		switch ((l = lex(e, &expr))) {
		case LEX_NUMBER:
			number_push(e, e->number);
			previous = NULL;
			firstop = 0;
			break;
		case LEX_OPERATOR: {
			const qoperations_t *op = e->op;
			if (CONFIG_Q_HIDE_FUNCS && op->hidden) {
				error(e, "unknown operator \"%s\"", op->name);
				goto end;
			}
			if (firstop || (previous && previous != e->rpar)) {
				if (e->op == e->minus) {
					op = e->negate;
				} else if (e->op->arity == 1) {
					/* do nothing */
				} else if (e->op != e->lpar) {
					assert(e->op);
					error(e, "invalid use of \"%s\"", e->op->name);
					goto end;
				}
			}
			shunt(e, op);
			previous = op;
			firstop = 0;
			break;
		}
		case LEX_END: break;
		default:
			error(e, "invalid symbol: %s", e->id);
			l = LEX_END;
		}
	}
	while (e->ops_count)
		if (op_eval(e) < 0 || e->error)
			break;
	if (e->numbers_count != 1) {
		/* cast so the argument always matches the "%d" conversion */
		error(e, "invalid expression: %d", (int)e->numbers_count);
		return -1;
	}
	implies(e->error == 0, e->numbers_count == 1);
end:
	return e->error == 0 ? 0 : -1;
}