import sys, os, imp # Make sure autoclutter can be found even though it isn't installed yet. file, path, descr = imp.find_module("template") template = imp.load_module("template", file, path, descr) # import template """This program generates multiple c source code files It handles the tedium of all the repetitive code dealing with types and particularly combinations of types with types and types with functions. $Id: codegenerator.py,v 1.46 2004/03/04 22:34:01 jaytmiller Exp $ """ #*********************************************************************# # # # DATA SECTION # # # #*********************************************************************# # Of course, the warning below does not apply to this file! _HEADER = \ ''' /* W W AAA RRRR N N III N N GGG !!! ** W W A A R R NN N I NN N G G !!! ** W W W AAAAA RRRR N N N I N N N G ! ** W W W A A R R N NN I N NN G GG ** W W A A R R N N III N N GGG !!! ** ** WARNING: This file is program generated by codegenerator.py. ** ** DO NOT EDIT THIS FILE! Any changes made to this file will be lost! */ #include #include #include "libnumarray.h" static PyObject *_Error; ''' _TYPE_SEPARATOR = \ ''' /****************** *******************/ ''' AS_PyVALUE_TEMPLATE = \ ''' static PyObject *asPyValue(void *data) { return Py_BuildValue(, *(( *) data)); } SELF_CHECKED_CFUNC_DESCR(asPyValue, CFUNC_AS_PY_VALUE); ''' COMPLEX_AS_PyVALUE_TEMPLATE = \ ''' static PyObject *asPyValue(void *data) { return PyComplex_FromDoubles((( *) data)->r, (( *) data)->i); } SELF_CHECKED_CFUNC_DESCR(asPyValue, CFUNC_AS_PY_VALUE); ''' # From_PyVALUE uses a (relatively) backwards convention for return status. # 0 --> failure. non-zero --> success. This is actually my preferred # style as well, but *not* what the rest of numarray does. # Most ufuncs use the convention -1 for error and 0 for success. FROM_PyVALUE_TEMPLATE = \ ''' static int fromPyValue(PyObject *value, void *dataptr) { *data = ( *) dataptr; if (!PyNumber_Check(value)) return 0; else { if (PyLong_Check(value)) { *data = (PyLong_AsLongLong(value)); } else if (PyInt_Check(value)) { *data = (PyInt_AsLong(value)); } else if (PyFloat_Check(value)) { *data = (PyFloat_AsDouble(value)); } else if (PyComplex_Check(value)) { *data = (PyComplex_RealAsDouble(value)); } else { return 0; } if (PyErr_Occurred()) return 0; else return 1; } } SELF_CHECKED_CFUNC_DESCR(fromPyValue, CFUNC_FROM_PY_VALUE); ''' COMPLEX_FROM_PyVALUE_TEMPLATE = \ ''' static int fromPyValue(PyObject *value, void *dataptr) { *data = ( *) dataptr; if (!PyNumber_Check(value)) return 0; else { if (PyLong_Check(value)) { data->r = PyLong_AsLong(value); data->i = 0; } else if (PyInt_Check(value)) { data->r = PyInt_AsLong(value); data->i = 0; } else if (PyFloat_Check(value)) { data->r = PyFloat_AsDouble(value); data->i = 0; } else if (PyComplex_Check(value)) { data->r = PyComplex_RealAsDouble(value); data->i = PyComplex_ImagAsDouble(value); } else { return 0; } if (PyErr_Occurred()) return 0; else return 1; } } SELF_CHECKED_CFUNC_DESCR(fromPyValue, CFUNC_FROM_PY_VALUE); ''' CONVERSION_TEMPLATE = \ ''' static int as(long niter, long ninargs, long noutargs, void **buffers, long *bsizes) { long i; *tin = ( *) buffers[0]; *tout = ( *) buffers[1]; for (i=0; i } return 0; } UFUNC_DESCR2(as, sizeof(), sizeof()); ''' _numarray_to_numarray = { ("Complex", "Complex"): "tout->r = tin->r; tout->i = tin->i;", ("Complex", "default"): "*tout = (tin->r);", ("default", "Complex"): "tout->r = *tin; tout->i = 0;", ("default", "default"): "*tout = (*tin);" } def _complex_type(t): if t in ["Complex32", "Complex64"]: return "Complex" else: return "default" def numarray_to_numarray(t1, t2): return _numarray_to_numarray[_complex_type(t1), _complex_type(t2)] SORT_HEADER = _HEADER + \ ''' #define swap(i, j) { temp=v[i]; v[i]=v[j]; v[j]=temp; } #define wswap(i, j) { temp=v[i]; v[i]=v[j]; v[j]=temp; \ wtemp=w[i]; w[i]=w[j]; w[j]=wtemp; } ''' SORT_TEMPLATE = \ ''' #define STDC_LT(a,b) ((a) < (b)) #define STDC_LE(a,b) ((a) <= (b)) #define STDC_EQ(a,b) ((a) == (b)) void sort0( *v, long left, long right) { temp; long i, last, lastl, lastr, diff; diff = right - left; if (diff <= 0) return; /* choose the pivot randomly. */ i = left + (int) (((right-left)*1.0*rand())/(RAND_MAX+1.0)); /* Split array into values < pivot, and values > pivot. */ swap(left, i); last = left; for(i=left+1; i<=right; i++) if ((v[i], v[left])) { ++ last; swap(last, i); } swap(left, last); lastl = last-1; lastr = last+1; /* Exclude values equal to pivot from recursion */ while((left < lastl) && (v[last],v[lastl])) --lastl; while((lastr < right) && (v[last],v[lastr])) ++lastr; sort0(v, left, lastl); sort0(v, lastr, right); } static int sort(long niter, long ninargs, long noutargs, void **buffers, long *bsizes) { sort0( ( *) buffers[0], 0, niter-1); return 0; } UFUNC_DESCR1(sort, sizeof()); void asort0( *v, long *w, long left, long right) { temp; long wtemp, i, last, lastl, lastr; if (left >= right) return; /* choose the pivot randomly. */ i = left + (int) (((right-left)*1.0*rand())/(RAND_MAX+1.0)); wswap(left, i); last = left; for(i=left+1; i<=right; i++) if ((v[i], v[left])) { ++ last; wswap(last, i); } wswap(left, last); lastl = last-1; lastr = last+1; /* Exclude values equal to pivot from recursion */ while((left < lastl) && (v[last],v[lastl])) --lastl; while((lastr < right) && (v[last],v[lastr])) ++lastr; asort0(v, w, left, lastl); asort0(v, w, lastr, right); } static int asort(long niter, long ninargs, long noutargs, void **buffers, long *bsizes) { asort0( ( *) buffers[0], (long *) buffers[1], 0, niter-1); return 0; } CFUNC_DESCR(asort, CFUNC_UFUNC, CHECK_ALIGN, 0, 2, sizeof(), sizeof(long), 0, 0, 0, 0); static long search(long na, *a, v) { long i = 0; *b; while(na > 10) { long mid = na>>1; if ((v, a[mid])) na = mid; else { i += mid + 1; a += mid + 1; na = mid - 1 + (na&1); } } b = a; while(((*b, v)) && na--) ++ b; return i+(b-a); } static int searchsorted(int niter, int ninargs, int noutargs, void **buffers, long *bsizes) { maybelong nbins; *bins; *values; long *indices; maybelong i; if (NA_checkOneCBuffer("searchsorted", 1, buffers[0], bsizes[0], sizeof(maybelong))) return -1; nbins = *(maybelong *) buffers[0]; if (NA_checkOneCBuffer("searchsorted", nbins, buffers[1], bsizes[1], sizeof())) return -1; bins = ( *) buffers[1]; if (NA_checkOneCBuffer("searchsorted", niter, buffers[2], bsizes[2], sizeof())) return -1; values = ( *) buffers[2]; if (NA_checkOneCBuffer("searchsorted", niter, buffers[3], bsizes[3], sizeof(long))) return -1; indices = (long *) buffers[3]; if (NA_checkIo("searchsorted", 3, 1, ninargs, noutargs)) return -1; for(i=0; i(nbins, bins, values[i]); return 0; } SELF_CHECKED_CFUNC_DESCR(searchsorted, CFUNC_UFUNC); static int fillarray (long niter, long ninargs, long noutargs, void **buffers, long *bsizes) { long i; start, delta; *tin; *tparams; Int8 itemsizes[2] = { sizeof(), sizeof() }; Int8 iters[2] = { 0, 2 }; if (NA_checkIo("fillarray", 1, 1, ninargs, noutargs) || NA_checkNCBuffers("fillarray", 2, niter, buffers, bsizes, itemsizes, iters)) return -1; tin = ( *) buffers[0]; tparams = ( *) buffers[1]; start = tparams[0]; delta = tparams[1]; for (i=0; i } return 0; } SELF_CHECKED_CFUNC_DESCR(fillarray, CFUNC_UFUNC); static int mxmultiply( long niter, long ninargs, long noutargs, void **buffers, long *bsizes) { *a, *b; maybelong maxi, maxj, maxk; *r; maybelong i, j, k; if (NA_checkIo("mxmultiply", 3, 1, ninargs, noutargs)) return -1; if (NA_checkOneCBuffer("mxmultiply", 1, buffers[2], bsizes[2], sizeof(maybelong))) return -1; else { maxi = ((maybelong *)buffers[2])[0]; maxj = ((maybelong *)buffers[2])[1]; maxk = ((maybelong *)buffers[2])[2]; } if (NA_checkOneCBuffer("mxmultiply", maxi*maxk, buffers[0], bsizes[0], sizeof())) return -1; else a = ( *) buffers[0]; if (NA_checkOneCBuffer("mxmultiply", maxj*maxk, buffers[1], bsizes[1], sizeof())) return -1; else b = ( *) buffers[1]; if (NA_checkOneCBuffer("mxmultiply", maxi*maxj, buffers[3], bsizes[3], sizeof())) return -1; else r = ( *) buffers[3]; for(i=0; i s; *ap = a + i*maxk; *bp = b + j*maxk; for(k=0; k } *r = s; } return 0; } SELF_CHECKED_CFUNC_DESCR(mxmultiply, CFUNC_UFUNC); static int nonzeroCoords(long niter, long ninargs, long noutargs, void **buffers, long *bsizes) { *source; maybelong *sstride; long **output; long i, minbsize, next = 0; if (NA_checkIo("nonzeroCoords", 2, noutargs, ninargs, noutargs)) return -1; if (NA_checkOneCBuffer("nonzeroCoords", niter, buffers[0], bsizes[0], sizeof())) return -1; if (NA_checkOneCBuffer("nonzeroCoords", noutargs, buffers[1], bsizes[1], sizeof(maybelong))) return -1; /* Check alignment only. Storage optimization makes numarray shorter than niter likely, possibly even 0! */ for (i=0; i", 0, buffers[2+i], bsizes[2+i], sizeof(long))) return -1; source = ( *) buffers[0]; sstride = (maybelong *) buffers[1]; output = (long **) &buffers[2]; minbsize = bsizes[0]; for(i=0; i: bad stride[%%ld].\\n", i); return -1; } else if (bsizes[i+2] < minbsize) minbsize = bsizes[i+2]; next = 0; for(i=0; i) { long j, index = i; if (next >= minbsize) { PyErr_Format(_Error, "nonzeroCoords: insufficient index space.\\n"); return -1; } for(j=0; j, CFUNC_UFUNC); ''' sort_operator_td = { "lessthan" : "STDC_LT", "lessequal" : "STDC_LE", "equals" : "STDC_EQ", "clear" : "s = 0;", "dotstep" : "s += *ap * *bp;", "fillstep" : "*tin = start; start += delta;", "nonzero" : "source[i] != 0" } sort_complex_td = { "lessthan" : "NUM_CLT", "lessequal" : "NUM_CLE", "equals" : "NUM_CEQ", "clear" : "s.r = 0; s.i=0;", "dotstep" : "Complex64 t; NUM_CMUL(*ap, *bp, t); NUM_CADD(s, t, s);", "fillstep" : "NUM_CASS(*tin, start); NUM_CADD(start, delta, start);", "nonzero" : "((source[i].r !=0) || (source[i].i != 0))" } BYTES_HEADER = _HEADER + \ ''' #include #define NA_ACOPYN(i, o) memcpy(o, i, N) /* The following is used to copy nbytes of data for each element. ** ** As such it can be used to align any sort of data provided the ** ** output pointers used are aligned */ static int copyNbytes(long dim, long nbytes, maybelong *niters, void *input, long inboffset, maybelong *inbstrides, void *output, long outboffset, maybelong *outbstrides) { long i, j; char *tin = (char *) input + inboffset; char *tout = (char *) output + outboffset; if (dim == 0) { for (i=0; i=0; i--) { otemp = PySequence_GetItem(nitersObj, i); if (PyInt_Check(otemp)) ltemp = PyInt_AsLong(otemp); else if (PyLong_Check(otemp)) ltemp = PyLong_AsLong(otemp); else return PyErr_Format(_Error, "copyToString: non-integer shape element"); nelements *= ltemp; niters[nniters-i-1] = ltemp; Py_DECREF(otemp); otemp = PySequence_GetItem(inbstridesObj, i); if (PyInt_Check(otemp)) inbstrides[nniters-i-1] = PyInt_AsLong(otemp); else if (PyLong_Check(otemp)) inbstrides[nniters-i-1] = PyLong_AsLong(otemp); else return PyErr_Format(_Error, "copyToString: non-integer stride element"); Py_DECREF(otemp); } if (!nelements) return PyString_FromStringAndSize("", 0); outbstrides[0] = nbytes; for (i=1; i= max) \ i -= max; static int takeNbytes(long niter, long ninargs, long noutargs, void **buffers, long *bsizes) { maybelong i, cMode, N; maybelong *scatteredstrides, *scatteredshape, **indices; char *gathered, *scattered; maybelong nindices = ninargs-4, outi = ninargs+noutargs-1; if (NA_checkIo("takeNbytes", 4, 1, MIN(ninargs, 4), noutargs)) return -1; if (nindices == 0) return 0; if (NA_checkOneCBuffer("takeNbytes", 2, buffers[0], bsizes[0], sizeof(maybelong))) return -1; else { cMode = ((maybelong *) buffers[0])[0]; N = ((maybelong *) buffers[0])[1]; } if (NA_checkOneCBuffer("takeNbytes", nindices, buffers[2], bsizes[2], sizeof(maybelong))) return -1; else { scatteredstrides = (maybelong *) buffers[2]; } if (NA_checkOneCBuffer("takeNbytes", nindices, buffers[3], bsizes[3], sizeof(maybelong))) return -1; else { scatteredshape = (maybelong *) buffers[3]; } if (NA_checkOneStriding("takeNBytes", nindices, scatteredshape, 0, scatteredstrides, bsizes[1], N, 0)) return -1; else scattered = (char *) buffers[1]; for(i=4; i= scatteredshape[j]) k = scatteredshape[j]-1; index += scatteredstrides[j]*k; } memcpy( &gathered[i*N], scattered+index, N); } break; case RAISE: for(i=0; i= scatteredshape[j]) { PyErr_Format(PyExc_IndexError, "Index[" ML_DEC "," ML_DEC "]=" ML_DEC " out of range[" ML_DEC "]", i, j, k, scatteredshape[j]); return -1; } index += scatteredstrides[j]*k; } memcpy( &gathered[i*N], scattered+index, N); } break; } return 0; } SELF_CHECKED_CFUNC_DESCR(takeNbytes, CFUNC_UFUNC); static int putNbytes(long niter, long ninargs, long noutargs, void **buffers, long *bsizes) { maybelong i, cMode, N; maybelong *scatteredstrides, *scatteredshape, **indices; char *gathered, *scattered; long nindices = ninargs-4, outi = ninargs+noutargs-1; if (nindices == 0) return 0; if (NA_checkIo("putNbytes", 4, 1, MIN(ninargs, 4), noutargs)) return -1; if (NA_checkOneCBuffer("putNbytes", 2, buffers[0], bsizes[0], sizeof(maybelong))) return -1; else { cMode = ((maybelong *) buffers[0])[0]; N = ((maybelong *) buffers[0])[1]; } if (NA_checkOneCBuffer("putNbytes", niter*N, buffers[1], bsizes[1], 1)) return -1; else gathered = (char *) buffers[1]; if (NA_checkOneCBuffer("putNbytes", nindices, buffers[2], bsizes[2], sizeof(maybelong))) return -1; else { scatteredstrides = (maybelong *) buffers[2]; } if (NA_checkOneCBuffer("putNbytes", nindices, buffers[3], bsizes[3], sizeof(maybelong))) return -1; else { scatteredshape = (maybelong *) buffers[3]; } for(i=4; i= scatteredshape[j]) k = scatteredshape[j]-1; index += scatteredstrides[j]*k; } memcpy( scattered+index, &gathered[i*N], N); } break; case RAISE: for(i=0; i= scatteredshape[j]) { PyErr_Format(PyExc_IndexError, "Index[" ML_DEC "," ML_DEC "]=" ML_DEC " out of range[" ML_DEC "]", i, j, k, scatteredshape[j]); return -1; } index += scatteredstrides[j]*k; } memcpy( scattered+index, &gathered[i*N], N); } break; } return 0; } SELF_CHECKED_CFUNC_DESCR(putNbytes, CFUNC_UFUNC); ''' COPY_TEMPLATE = \ ''' /******************************************* * * * These copy data to a contiguous buffer. * * They do not handle non-aligned data. * * Offsets and Strides are in byte units * * * *******************************************/ static int copybytes(long dim, long dummy, maybelong *niters, void *input, long inboffset, maybelong *inbstrides, void *output, long outboffset, maybelong *outbstrides) { long i; char *tin = (char *) input + inboffset; char *tout = (char *) output + outboffset; if (dim == 0) { for (i=0; i(tin, tout); tin += inbstrides[dim]; tout += outbstrides[dim]; } } else { for (i=0; ibytes(dim-1, dummy, niters, input, inboffset + i*inbstrides[dim], inbstrides, output, outboffset + i*outbstrides[dim], outbstrides); } } return 0; } STRIDING_DESCR2(copybytes, CHECK_ALIGN, , ); ''' ALIGN_TEMPLATE = \ ''' static int alignbytes(long dim, long dummy, maybelong *niters, void *input, long inboffset, maybelong *inbstrides, void *output, long outboffset, maybelong *outbstrides) { return copyNbytes(dim, , niters, input, inboffset, inbstrides, output, outboffset, outbstrides); } STRIDING_DESCR2(alignbytes, !CHECK_ALIGN, , ); ''' BYTESWAP_TEMPLATE = \ ''' /******* byteswap *****/ static int byteswap(long dim, long dummy, maybelong *niters, void *input, long inboffset, maybelong *inbstrides, void *output, long outboffset, maybelong *outbstrides) { long i; char *tin = (char *) input + inboffset; char *tout = (char *) output + outboffset; if (dim == 0) { for (i=0; i]; NA_COPY(tin, t); (t, tout); tin += inbstrides[dim]; tout += outbstrides[dim]; } } else { for (i=0; i(dim-1, dummy, niters, input, inboffset + i*inbstrides[dim], inbstrides, output, outboffset + i*outbstrides[dim], outbstrides); } } return 0; } STRIDING_DESCR2(byteswap, !CHECK_ALIGN, , ); ''' CHOOSE_TEMPLATE = \ ''' static int choosebytes(long niter, long ninargs, long noutargs, void **buffers, long *bsizes) { maybelong i, cMode, maxP, N, *selector; char **population, *output; int outi = ninargs + noutargs - 1; if (NA_checkIo("choosebytes", 2, 1, MIN(ninargs,2), noutargs)) return -1; if (NA_checkOneCBuffer("choosebytes", 2, buffers[0], bsizes[0], sizeof(maybelong))) return -1; else { cMode = ((maybelong *) buffers[0])[0]; N = ((maybelong *) buffers[0])[1]; } if (NA_checkOneCBuffer("choosebytes", niter, buffers[1], bsizes[1], sizeof(maybelong))) return -1; else selector = (maybelong *) buffers[1]; if (ninargs-2 == 0) return 0; else maxP = ninargs-2; for(i=2; ibytes", niter, buffers[i], bsizes[i], )) return -1; population = (char **) &buffers[2]; if (NA_checkOneCBuffer("choosebytes", niter, buffers[outi], bsizes[outi], )) return -1; else output = (char *) buffers[outi]; if (maxP == 0) return 0; switch(cMode) { case WRAPPED: for(i=0; i(&population[j][i*], &output[i*]); } break; default: case CLIPPED: for(i=0; i= maxP) j = maxP-1; NA_ACOPY(&population[j][i*], &output[i*]); } break; } return 0; } SELF_CHECKED_CFUNC_DESCR(choosebytes, CFUNC_UFUNC); ''' BYTES_TEMPLATE = ( COPY_TEMPLATE + ALIGN_TEMPLATE + BYTESWAP_TEMPLATE + CHOOSE_TEMPLATE ) _METHODS_DEF = \ ''' static PyMethodDef _Methods[] = { \t{NULL, NULL} /* Sentinel */ }; ''' ADDMETHOD_TEMPLATE = \ '''\t{ "%s", %s, METH_VARARGS}, ''' _TAIL = \ ''' /* platform independent*/ #ifdef MS_WIN32 __declspec(dllexport) #endif void init_(void) { PyObject *m, *d; m = Py_InitModule("_", _Methods); d = PyModule_GetDict(m); _Error = PyErr_NewException("_.error", NULL, NULL); PyDict_SetItemString(d, "error", _Error); import_libnumarray(); PyDict_SetItemString(d, "functionDict", init_funcDict()); } ''' #*********************************************************************# # data for _ufuncmodule.c # #*********************************************************************# UFUNC_HEADER = \ ''' #include #include #include #include "libnumarray.h" #ifdef MS_WIN32 #pragma warning(once : 4244) #endif #define logical_and(arg1, arg2) (arg1 != 0) & (arg2 != 0) #define logical_or(arg1, arg2) (arg1 != 0) | (arg2 != 0) #define logical_xor(arg1, arg2) ((arg1 != 0) ^ (arg2 != 0)) & 1 #define ufmaximum(arg1, arg2) (((temp1=arg1) > (temp2=arg2)) ? temp1 : temp2) #define ufminimum(arg1, arg2) (((temp1=arg1) < (temp2=arg2)) ? temp1 : temp2) static PyObject *_Error; ''' UFUNC_UNARY_TEMPLATE = \ ''' static int __vector(long niter, long ninargs, long noutargs, void **buffers, long *bsizes) { long i; *tin = ( *) buffers[0]; *tout = ( *) buffers[1]; for (i=0; i } return 0; } UFUNC_DESCR2(__vector, sizeof(), sizeof()); ''' UFUNC_VECTOR_VECTOR = \ ''' static int __vector_vector(long niter, long ninargs, long noutargs, void **buffers, long *bsizes) { long i; *tin1 = ( *) buffers[0]; *tin2 = ( *) buffers[1]; *tout = ( *) buffers[2]; for (i=0; i } return 0; } UFUNC_DESCR3(__vector_vector, sizeof(), sizeof(), sizeof()); ''' UFUNC_VECTOR_SCALAR = \ ''' static int __vector_scalar(long niter, long ninargs, long noutargs, void **buffers, long *bsizes) { long i; *tin1 = ( *) buffers[0]; tscalar = *( *) buffers[1]; *tout = ( *) buffers[2]; for (i=0; i } return 0; } UFUNC_DESCR3vs(__vector_scalar, sizeof(), sizeof(), sizeof()); ''' UFUNC_SCALAR_VECTOR = \ ''' static int __scalar_vector(long niter, long ninargs, long noutargs, void **buffers, long *bsizes) { long i; tscalar = *( *) buffers[0]; *tin2 = ( *) buffers[1]; *tout = ( *) buffers[2]; for (i=0; i } return 0; } UFUNC_DESCR3sv(__scalar_vector, sizeof(), sizeof(), sizeof()); ''' UFUNC_REDUCE = \ ''' static int __reduce(long dim, long dummy, maybelong *niters, void *input, long inboffset, maybelong *inbstrides, void *output, long outboffset, maybelong *outbstrides) { long i; *tin = ( *) ((char *) input + inboffset); *tout = ( *) ((char *) output + outboffset); net; if (dim == 0) { net = *tout; for (i=1; i *) ((char *) tin + inbstrides[dim]); } *tout = net; } else { for (i=0; i__reduce(dim-1, dummy, niters, input, inboffset + i*inbstrides[dim], inbstrides, output, outboffset + i*outbstrides[dim], outbstrides); } } return 0; } STRIDING_DESCR2(__reduce, CHECK_ALIGN, sizeof(), sizeof()); ''' UFUNC_ACCUMULATE = \ ''' static int __accumulate( long dim, long dummy, maybelong *niters, void *input, long inboffset, maybelong *inbstrides, void *output, long outboffset, maybelong *outbstrides) { long i; *tin = ( *) ((char *) input + inboffset); *tout = ( *) ((char *) output + outboffset); lastval; if (dim == 0) { for (i=1; i *) ((char *) tin + inbstrides[dim]); tout = ( *) ((char *) tout + outbstrides[dim]); } } else { for (i=0; i__accumulate(dim-1, dummy, niters, input, inboffset + i*inbstrides[dim], inbstrides, output, outboffset + i*outbstrides[dim], outbstrides); } } return 0; } STRIDING_DESCR2(__accumulate, CHECK_ALIGN, sizeof(), sizeof()); ''' UFUNC_PVECTOR_PVECTOR = \ ''' static int __vector_vector(long niter, long ninargs, long noutargs, void **buffers, long *bsizes) { long i; *tin1 = ( *) buffers[0]; *tin2 = ( *) buffers[1]; *tout = ( *) buffers[2]; for (i=0; i } return 0; } UFUNC_DESCR3(__vector_vector, sizeof(), sizeof(), sizeof()); ''' UFUNC_COMPARE_TEMPLATE = ( UFUNC_VECTOR_VECTOR + UFUNC_VECTOR_SCALAR + UFUNC_SCALAR_VECTOR ) UFUNC_BINARY_TEMPLATE = ( UFUNC_COMPARE_TEMPLATE + UFUNC_ACCUMULATE + UFUNC_REDUCE ) #*********************************************************************# # data for filling function table # #*********************************************************************# _CFUNCDICT_HEADER = \ ''' static PyObject *init_funcDict(void) { PyObject *dict; dict = PyDict_New(); ''' _ADDCFUNC_TEMPLATE = \ ''' NA_add_cfunc(dict, "%s", (void *) &%s_descr); ''' _CFUNCDICT_TAIL = \ ''' return dict; } ''' # The following templates are the most complex. There are a number of # different forms of templates, for unary and binary functions, and then # different forms for the computation line (operator, function plus # special versions for integer multiply and divide for overflow and # divide by zero checking. More may be necesary in the future. These # are defined here since most are used multiple times in the ufunc # definition table. # td stands for 'template dict' macro_td = { "operator1" :"(*tin, *tout);", "operator_vv" :"(*tin1, *tin2, *tout);", "operator_vs" :"(*tin1, tscalar, *tout);", "operator_sv" :"(tscalar, *tin2, *tout);", "operator_reduce" :"(net, *tin, net);", "operator_accumulate":"(lastval ,*tin, *tout);" } function_td = { "operator1" :"*tout = (*tin);", "operator_vv" :"*tout = (*tin1, *tin2);", "operator_vs" :"*tout = (*tin1, tscalar);", "operator_sv" :"*tout = (tscalar, *tin2);", "operator_reduce" :"net = (net, *tin);", "operator_accumulate":"*tout = (lastval ,*tin);" } mask_td = { "operator_pp" :"*tout = (tin1, tin2);", } operator_td = { "operator1" :"*tout = *tin;", "operator_vv" :"*tout = *tin1 *tin2;", "operator_vs" :"*tout = *tin1 tscalar;", "operator_sv" :"*tout = tscalar *tin2;", "operator_reduce" :"net = net *tin;", "operator_accumulate":"*tout = lastval *tin;" } int_divide_td = { "operator_vv":"*tout = ((*tin2==0) ? int_dividebyzero_error(*tin2, *tin1) : *tin1 *tin2);", "operator_vs":"*tout = ((tscalar==0) ? int_dividebyzero_error(tscalar, *tin1) : *tin1 tscalar);", "operator_sv":"*tout = ((*tin2==0) ? int_dividebyzero_error(*tin2, 0) : tscalar *tin2);", "operator_reduce":"net = ((*tin==0) ? int_dividebyzero_error(*tin, 0) : net *tin);", "operator_accumulate":"*tout = ((*tin==0) ? int_dividebyzero_error(*tin, 0) : lastval *tin);" } int_truedivide_td = { "operator_vv":"*tout = ((*tin2==0) ? int_dividebyzero_error(*tin2, *tin1) : *tin1 (double) *tin2);", "operator_vs":"*tout = ((tscalar==0) ? int_dividebyzero_error(tscalar, *tin1) : *tin1 (double) tscalar);", "operator_sv":"*tout = ((*tin2==0) ? int_dividebyzero_error(*tin2, 0) : tscalar (double) *tin2);", "operator_reduce":"net = ((*tin==0) ? int_dividebyzero_error(*tin, 0) : net (double) *tin);", "operator_accumulate":"*tout = ((*tin==0) ? int_dividebyzero_error(*tin, 0) : lastval (double) *tin);" } int_floordivide_td = { "operator_vv":"*tout = ((*tin2==0) ? int_dividebyzero_error(*tin2, *tin1) : floor(*tin1 (double) *tin2));", "operator_vs":"*tout = ((tscalar==0) ? int_dividebyzero_error(tscalar, *tin1) : floor(*tin1 (double) tscalar));", "operator_sv":"*tout = ((*tin2==0) ? int_dividebyzero_error(*tin2, 0) : floor(tscalar (double) *tin2));", "operator_reduce":"net = ((*tin==0) ? int_dividebyzero_error(*tin, 0) : floor(net (double) *tin));", "operator_accumulate":"*tout = ((*tin==0) ? int_dividebyzero_error(*tin, 0) : floor(lastval (double) *tin));" } int8_check = \ """if (temp > 127) temp = int_overflow_error(127.); if (temp < -128) temp = int_overflow_error(-128.);""" uint8_check = \ """if (temp > 255) temp = int_overflow_error(255.);""" int16_check = \ """if (temp > 32767) temp = int_overflow_error(32767.); if (temp < -32768) temp = int_overflow_error(-32768);""" uint16_check = \ """if (temp > 65535) temp = int_overflow_error(65535.);""" int32_check = \ """if (temp > 2147483647) temp = (Float64) int_overflow_error(2147483647.); if (temp < (-2147483648.)) temp = (Float64) int_overflow_error(-2147483648.);""" uint32_check = \ """if (temp > 4294967295U) temp = (Float64) int_overflow_error(4294967295.);""" int64_check = \ """if (smult64_overflow(, )) temp = (Float64) int_overflow_error(4611686018427387903.);""" uint64_check = \ """if (umult64_overflow(, )) temp = (Float64) int_overflow_error(9223372036854775807.);""" # A template used below to generate multiple templates! (since they # are all so similar. These are used by make_int_template_dict just below. intX_td = { "operator_vv": ("*tin1", "*tin2", "*tout"), "operator_vs": ("*tin1", "tscalar", "*tout"), "operator_sv": ("tscalar", "*tin2", "*tout"), "operator_reduce": ("net", "*tin", "net"), "operator_accumulate": ("lastval", "*tin", "*tout"), } intX_mult_template = """temp = (() ) % (() ); = () temp;""" def make_int_template_dict(uptype, sizestr, checkstr): td = {} for key in intX_td.keys(): td[key] = intX_mult_template % \ {"type": sizestr, "checkstr": (checkstr % { "p1":intX_td[key][0], "p2":intX_td[key][1] }), "uptype":uptype, "p1":intX_td[key][0], "p2":intX_td[key][1], "p3":intX_td[key][2], } return td #*********************************************************************# # data lists for type conversion # #*********************************************************************# # These are used by the code to generate dictionaries with the keys # defined in tdictfields and the corresponding values in typeconfig # list items. There will be one dictionary for each element in # typeconfig. It is done this way to make the table more readable # and easier to edit. def hasUInt64(): return "--hasUInt64" in sys.argv def hasFloat128(): return "--hasFloat128" in sys.argv typeconfig = [ ["Bool", "(Bool) isNonZERO", "PY_BOOL_CHAR", ""], ["Int8", "(Int8)", "PY_INT8_CHAR", ""], ["Int16", "(Int16)", "PY_INT16_CHAR", ""], ["Int32", "(Int32)", "PY_INT32_CHAR", ""], ["UInt32", "(UInt32)", "PY_UINT32_CHAR", ""], ["UInt8", "(UInt8)", "PY_UINT8_CHAR", "(Int16)"], ["UInt16", "(UInt16)", "PY_UINT16_CHAR", "(Int32)"], ["Float32","(Float32)", "PY_FLOAT32_CHAR",""], ["Float64","(Float64)", "PY_FLOAT64_CHAR",""], ["Complex32", "NUM_TO_COMPLEX", "PY_COMPLEX32_CHAR",""], ["Complex64", "NUM_TO_COMPLEX", "PY_COMPLEX64_CHAR",""], ] typeconfig.append(["Int64", "(Int64)", "PY_LONG_CHAR", ""]) if hasUInt64(): typeconfig.append(["UInt64", "(UInt64)", "PY_LONG_CHAR", ""]) if hasFloat128(): typeconfig.append(["Float128", "(Float128)", "PY_FLOAT128_CHAR", ""]) typeconfig.append(["Complex128", "NUM_TO_COMPLEX", "PY_COMPLEX128_CHAR", ""]) class ConvParams: def __init__(self, typename, typecast, pybuildchar, pycast): self.typename = typename self.typecast = typecast self.pybuildchar = pybuildchar self.pycast = pycast bytesconfig = [ ["1", "Int8"], ["2", "Int16"], ["4", "Int32"], ["8", "Float64"], ["16", "Complex64"], ]; class BytesParams: def __init__(self, size, type): self.size = size self.sizename = str(size) + "bytes" self.typename = type self.swapkind = "NA_SWAP" NBytesParams = BytesParams("N","AnyType") class ComplexBytesParams: def __init__(self, size, type): self.size = size self.sizename = type self.typename = type self.swapkind = "NA_COMPLEX_SWAP" Complex32BytesCfg = ComplexBytesParams(8, "Complex32") Complex64BytesCfg = ComplexBytesParams(16, "Complex64") #*********************************************************************# # data lists for ufunc generation # #*********************************************************************# # Some implicit rules: # Bool never returned by math functions # Bool always returned by comparison functions # Math operators (+-*/**) generally return all types, double math functions # only return float types, special purpose functions (floor, ceil, etc) # only return one kind (int or float) # Define various forms for signatures. New ufuncs may require new # signatures lists. These are used in the ufunc definition table # repeatedly. generic_operator_sigs = [ ('Bool', 'Int8'), ('Int8', 'Int8'), ('Int16', 'Int16'), ('Int32', 'Int32'), ('UInt8', 'UInt8'), ('UInt16', 'UInt16'), ('UInt32', 'UInt32'), ('Float32', 'Float32'), ('Float64', 'Float64') ] generic_mathfunction_sigs = [ ('Bool', 'Float32'), ('Int8', 'Float32'), ('Int16', 'Float32'), ('Int32', 'Float32'), ('UInt8', 'Float32'), ('UInt16', 'Float32'), ('UInt32', 'Float32'), ('Float32', 'Float32'), ('Float64', 'Float64') ] generic_comparisonfunction_sigs = [ ('Bool', 'Bool'), ('Int8', 'Bool'), ('Int16', 'Bool'), ('Int32', 'Bool'), ('UInt8', 'Bool'), ('UInt16', 'Bool'), ('UInt32', 'Bool'), ('Float32', 'Bool'), ('Float64', 'Bool') ] generic_int_sigs = [ ('Bool', 'Bool'), ('Int8', 'Int8'), ('Int16', 'Int16'), ('Int32', 'Int32'), ('UInt8', 'UInt8'), ('UInt16', 'UInt16'), ('UInt32', 'UInt32') ] truedivide_int_sigs = [ ('Bool', 'Float32'), ('Int8', 'Float32'), ('Int16', 'Float32'), ('Int32', 'Float32'), ('UInt8', 'Float32'), ('UInt16', 'Float32'), ('UInt32', 'Float32') ] generic_operator_sigs.append(('Int64', 'Int64')) generic_mathfunction_sigs.append(('Int64', 'Float64')) generic_comparisonfunction_sigs.append(('Int64', 'Bool')) generic_int_sigs.append(('Int64', 'Int64')) truedivide_int_sigs.append(('Int64', 'Float64')) if hasUInt64(): generic_operator_sigs.append(('UInt64', 'UInt64')) generic_mathfunction_sigs.append(('UInt64', 'Float64')) generic_comparisonfunction_sigs.append(('UInt64', 'Bool')) generic_int_sigs.append(('UInt64', 'UInt64')) truedivide_int_sigs.append(('UInt64', 'Float64')) generic_float_sigs = [ ('Float32', 'Float32'), ('Float64', 'Float64') ] complex_complex_sigs = [ ('Complex32', 'Complex32'), ('Complex64', 'Complex64') ] complex_real_sigs = [ ('Complex32', 'Float32'), ('Complex64', 'Float64') ] complex_bool_sigs = [ ('Complex32', 'Bool'), ('Complex64', 'Bool') ] opt_mult_decl = "Int32 temp;" opt_mult32_decl = "Float64 temp;" opt_mult64_decl = "Int64 temp;" opt_minmax_decl = " temp1, temp2;" # ============================================================================ # IMPORTANT: no <>-sugared strings below this point # translate --> %(var)s in templates seen *so far* template.sugar_dict(globals()) # ============================================================================ # Use function to define all variants of integer multiply. multiply_int8_td = make_int_template_dict("Int32", "Int8", int8_check) multiply_uint8_td = make_int_template_dict("Int32", "UInt8", uint8_check) multiply_int16_td = make_int_template_dict("Int32", "Int16", int16_check) multiply_uint16_td = make_int_template_dict("Int32", "UInt16", uint16_check) multiply_uint32_td = make_int_template_dict("Float64", "UInt32", uint32_check) multiply_int32_td = make_int_template_dict("Float64", "Int32", int32_check) multiply_int64_td = make_int_template_dict("Int64", "Int64", int64_check) multiply_uint64_td = make_int_template_dict("UInt64", "UInt64", uint64_check) # These are used by the code to generate dictionaries with the keys # defined in ufdictfields and the corresponding values in ufuncconfigs # list items. There will be one dictionary for each element in # ufuncconfigs. It is done this way to make the table more readable # and easier to edit. # Multiple entries for function names are permitted as long as the # signatures have no overlaps. # pyname ins outs form sigs optional_decls ufuncconfigs = [ ["minus", 1, 1, (operator_td, "-"), generic_operator_sigs, ""], ["add", 2, 1, (operator_td, "+"), generic_operator_sigs,""], ["subtract", 2, 1, (operator_td, "-"), generic_operator_sigs, ""], ["multiply", 2, 1, (multiply_int8_td, "*"), [('Int8', 'Int8')], opt_mult_decl], ["multiply", 2, 1, (multiply_uint8_td, "*"), [('UInt8', 'UInt8')], opt_mult_decl], ["multiply", 2, 1, (multiply_int16_td, "*"), [('Int16', 'Int16')], opt_mult_decl], ["multiply", 2, 1, (multiply_uint16_td, "*"), [('UInt16', 'UInt16')], opt_mult_decl], ["multiply", 2, 1, (multiply_int32_td, "*"), [('Int32', 'Int32')], opt_mult32_decl], ["multiply", 2, 1, (multiply_uint32_td, "*"), [('UInt32', 'UInt32')], opt_mult32_decl], ["multiply", 2, 1, (multiply_int64_td, "*"), [('Int64', 'Int64')], opt_mult64_decl], ["multiply", 2, 1, (multiply_uint64_td, "*"), [('UInt64', 'UInt64')], opt_mult64_decl], ["multiply", 2, 1, (operator_td, "*"), generic_float_sigs, ""], ["divide", 2, 1, (int_divide_td,"/"), generic_int_sigs, ""], ["divide", 2, 1, (operator_td, "/"), generic_float_sigs, ""], ["floor_divide", 2, 1, (int_floordivide_td,"/"), generic_int_sigs, ""], ["floor_divide", 2, 1, (macro_td, "NUM_FLOORDIVIDE"), generic_float_sigs, ""], ["true_divide", 2, 1, (int_truedivide_td,"/"), truedivide_int_sigs, ""], ["true_divide", 2, 1, (operator_td, "/"), generic_float_sigs, ""], ["remainder",2, 1, (int_divide_td, " % "), generic_int_sigs, ""], ["remainder",2, 1, (function_td, "fmod"), generic_float_sigs, ""], ["power", 2, 1, (function_td, "num_pow"), generic_operator_sigs, ""], ["abs", 1, 1, (function_td, "fabs"), generic_operator_sigs, ""], ["sin", 1, 1, (function_td, "sin"), generic_mathfunction_sigs, ""], ["cos", 1, 1, (function_td, "cos"), generic_mathfunction_sigs, ""], ["tan", 1, 1, (function_td, "tan"), generic_mathfunction_sigs, ""], ["arcsin", 1, 1, (function_td, "asin"), generic_mathfunction_sigs, ""], ["arccos", 1, 1, (function_td, "acos"), generic_mathfunction_sigs, ""], ["arctan", 1, 1, (function_td, "atan"), generic_mathfunction_sigs, ""], ["arctan2",2, 1, (function_td, "atan2"), generic_mathfunction_sigs, ""], ["log", 1, 1, (function_td, "num_log"), generic_mathfunction_sigs, ""], ["log10", 1, 1, (function_td, "num_log10"),generic_mathfunction_sigs, ""], ["exp", 1, 1, (function_td, "exp"), generic_mathfunction_sigs, ""], ["sinh", 1, 1, (function_td, "sinh"), generic_mathfunction_sigs, ""], ["cosh", 1, 1, (function_td, "cosh"), generic_mathfunction_sigs, ""], ["tanh", 1, 1, (function_td, "tanh"), generic_mathfunction_sigs, ""], ["arcsinh", 1, 1, (function_td, "num_asinh"), generic_mathfunction_sigs, ""], ["arccosh", 1, 1, (function_td, "num_acosh"), generic_mathfunction_sigs, ""], ["arctanh", 1, 1, (function_td, "num_atanh"), generic_mathfunction_sigs, ""], ["ieeemask", 2, 1, (mask_td, "NA_IeeeSpecial32"), [('Float32', 'Int32', 'Bool')], "", UFUNC_PVECTOR_PVECTOR, ['vector_vector'] ], ["ieeemask", 2, 1, (mask_td, "NA_IeeeSpecial64"), [('Float64', 'Int32', 'Bool')], "", UFUNC_PVECTOR_PVECTOR, ['vector_vector'] ], ["sqrt", 1, 1, (function_td, "sqrt"), generic_mathfunction_sigs, ""], ["equal", 2, 1, (operator_td, "=="), generic_comparisonfunction_sigs, ""], ["not_equal", 2, 1, (operator_td, "!="), generic_comparisonfunction_sigs, ""], ["greater", 2, 1, (operator_td, ">"), generic_comparisonfunction_sigs, ""], ["greater_equal", 2, 1, (operator_td, ">="), generic_comparisonfunction_sigs, ""], ["less", 2, 1, (operator_td, "<"), generic_comparisonfunction_sigs, ""], ["less_equal", 2, 1, (operator_td, "<="), generic_comparisonfunction_sigs, ""], ["logical_and", 2, 1, (function_td, "logical_and"), generic_comparisonfunction_sigs, ""], ["logical_or", 2, 1, (function_td, "logical_or"), generic_comparisonfunction_sigs, ""], ["logical_xor", 2, 1, (function_td, "logical_xor"), generic_comparisonfunction_sigs, ""], ["logical_not", 1, 1, (operator_td, "!"), generic_comparisonfunction_sigs, ""], ["bitwise_and", 2, 1, (operator_td, "&"), generic_int_sigs, ""], ["bitwise_or", 2, 1, (operator_td, "|"), generic_int_sigs, ""], ["bitwise_xor", 2, 1, (operator_td, "^"), generic_int_sigs, ""], ["bitwise_not", 1, 1, (operator_td, "~"), generic_int_sigs, ""], ["rshift", 2, 1, (operator_td, ">>"), generic_int_sigs, ""], ["lshift", 2, 1, (operator_td, "<<"), generic_int_sigs, ""], ["floor", 1, 1, (function_td, ""), generic_int_sigs, ""], ["floor", 1, 1, (function_td, "floor"), generic_float_sigs, ""], ["ceil", 1, 1, (function_td, ""), generic_int_sigs, ""], ["ceil", 1, 1, (function_td, "ceil"), generic_float_sigs, ""], ["maximum", 2, 1, (function_td, "ufmaximum"), generic_operator_sigs, opt_minmax_decl], ["minimum", 2, 1, (function_td, "ufminimum"), generic_operator_sigs, opt_minmax_decl], ["fabs", 1, 1, (function_td, "fabs"), generic_mathfunction_sigs, ""], ["_round", 1, 1, (function_td, "num_round"), generic_mathfunction_sigs, ""], ["hypot", 2, 1, (function_td, "hypot"), generic_mathfunction_sigs, ""], # Complex ufuncs ["minus", 1, 1, (macro_td, "NUM_CMINUS"), complex_complex_sigs, ""], ["add", 2, 1, (macro_td, "NUM_CADD"), complex_complex_sigs, ""], ["subtract", 2, 1, (macro_td, "NUM_CSUB"), complex_complex_sigs, ""], ["multiply", 2, 1, (macro_td, "NUM_CMUL"), complex_complex_sigs, ""], ["divide", 2, 1, (macro_td, "NUM_CDIV"), complex_complex_sigs, ""], ["true_divide", 2, 1, (macro_td, "NUM_CDIV"), complex_complex_sigs, ""], ["remainder", 2, 1, (macro_td, "NUM_CREM"), complex_complex_sigs, ""], ["power", 2, 1, (macro_td, "NUM_CPOW"), complex_complex_sigs, ""], ["abs", 1, 1, (function_td, "NUM_CABS"), complex_real_sigs, ""], ["sin", 1, 1, (macro_td, "NUM_CSIN"), complex_complex_sigs, ""], ["cos", 1, 1, (macro_td, "NUM_CCOS"), complex_complex_sigs, ""], ["tan", 1, 1, (macro_td, "NUM_CTAN"), complex_complex_sigs, ""], ["arcsin", 1, 1, (macro_td, "NUM_CASIN"), complex_complex_sigs, ""], ["arccos", 1, 1, (macro_td, "NUM_CACOS"), complex_complex_sigs, ""], ["arctan", 1, 1, (macro_td, "NUM_CATAN"), complex_complex_sigs, ""], ["arcsinh", 1, 1, (macro_td, "NUM_CASINH"), complex_complex_sigs, ""], ["arccosh", 1, 1, (macro_td, "NUM_CACOSH"), complex_complex_sigs, ""], ["arctanh", 1, 1, (macro_td, "NUM_CATANH"), complex_complex_sigs, ""], # ["arctan2",2, 1, (function_td, "atan2"), generic_mathfunction_sigs, ""], ["log", 1, 1, (macro_td, "NUM_CLOG"), complex_complex_sigs, ""], ["log10", 1, 1, (macro_td, "NUM_CLOG10"), complex_complex_sigs, ""], ["exp", 1, 1, (macro_td, "NUM_CEXP"), complex_complex_sigs, ""], ["sinh", 1, 1, (macro_td, "NUM_CSINH"), complex_complex_sigs, ""], ["cosh", 1, 1, (macro_td, "NUM_CCOSH"), complex_complex_sigs, ""], ["tanh", 1, 1, (macro_td, "NUM_CTANH"), complex_complex_sigs, ""], ["sqrt", 1, 1, (macro_td, "NUM_CSQRT"), complex_complex_sigs, ""], # Strictly speaking, these are implemented as macros as well, but they # return real valued (Bool) expressions rather than fill in a 3rd # Complex parameter. ["equal", 2, 1, (function_td, "NUM_CEQ"), complex_bool_sigs, ""], ["not_equal", 2, 1, (function_td, "NUM_CNE"), complex_bool_sigs, ""], ["logical_and", 2, 1, (function_td, "NUM_CLAND"), complex_bool_sigs, ""], ["logical_or", 2, 1, (function_td, "NUM_CLOR"), complex_bool_sigs, ""], ["logical_xor", 2, 1, (function_td, "NUM_CLXOR"), complex_bool_sigs, ""], ["logical_not", 1, 1, (function_td, "NUM_CLNOT"), complex_bool_sigs, ""], # ["bitwise_and", 2, 1, (operator_td, "&"), generic_int_sigs, ""], # ["bitwise_or", 2, 1, (operator_td, "|"), generic_int_sigs, ""], # ["bitwise_xor", 2, 1, (operator_td, "^"), generic_int_sigs, ""], # ["bitwise_not", 1, 1, (operator_td, "~"), generic_int_sigs, ""], # ["rshift", 2, 1, (operator_td, ">>"), generic_int_sigs, ""], # ["lshift", 2, 1, (operator_td, "<<"), generic_int_sigs, ""], ["floor", 1, 1, (macro_td, "NUM_CFLOOR"), complex_complex_sigs, ""], ["ceil", 1, 1, (macro_td, "NUM_CCEIL"), complex_complex_sigs, ""], ["maximum", 2, 1, (function_td, "NUM_CMAX"), complex_complex_sigs, ""], ["minimum", 2, 1, (function_td, "NUM_CMIN"), complex_complex_sigs, ""], ["fabs", 1, 1, (macro_td, "NUM_CFABS"), complex_complex_sigs, ""], ["_round", 1, 1, (macro_td, "NUM_CROUND"), complex_complex_sigs, ""], ["hypot", 2, 1, (macro_td, "NUM_CHYPOT"), complex_complex_sigs, ""], ] class UFuncParams: def __init__(self, pyname, ninputs, noutputs, form, sigs, opt_declarations, template = None, vslist=None): self.pyname = pyname self.ninputs = ninputs self.noutputs = noutputs self.form = form self.sigs = sigs self.opt_decls = opt_declarations # Select appropriate base template form. self.template = template self.vslist = vslist # select appropriate computation form (operator vs function) # opdict = ufo.form[0].copy() self.operator = self.form[1] # for operator1, operator_sv, operator_vs, operator_vv...: # Substitute actual operator/function for for key in self.form[0].keys(): self.__dict__[key] = self.form[0][key] % self.__dict__ #*********************************************************************# # # # PROGRAM SECTION # # # #*********************************************************************# """ The classes below assemble the various elements defined in the previous part of the module into the final C modules. Each subclass of CodeGenerator works basically the same way: It is constructed by supplying optional module unique header, tail, and function separator. When called, a CodeGenerator builds up two lists of strings by calling its "bodygenerator()" method. Looping over a parameter table, the bodygenerator builds: 1. A code list containing the instantiated header and emitted function bodies. This is the bulk of the code. 2. A function list containing the C struct initializers which are used to register the function bodies with python. These are necessarily in a seperate textual segment so that they may be joined in an array and looped over at initialization time. In general, templates are instantiated by formatting them either using a CodeGenerator instance dict, or a Params instance dict. After generating its two lists, a CodeGenerator combines them into the complete C code for a python module and writes the code out to the specified file. CodeGenerator subclasses customize behavior by overriding the "bodygenerator" and "addcfunc" methods. Each "bodygenerator" tends to be tailored to the parameter table used to specify the cfuncs for the module. Several of the codegenerators (cconv, ufunc, bytes) are supported by a "Params" class, instances of which act as table records. As the body generator loops over the parameter table, it creates a Params instance from each record. The Params instance dictionary then provides a source of keyword values to instantiate the code template. See ConvParams, ByteParams, and UfuncParams. Each is essentially a struct. In general, template instantiation is performed by string substitution using the python %(identifier)s syntax. The %(indentifer)s syntax permits a string to be formatted using a dictionary to supply identifier values. """ class CodeGenerator: """Generates source code using supplied functions and code templates""" def __init__(self, header=_HEADER, tail=_TAIL, separator=_TYPE_SEPARATOR): self.header = header self.tail = tail self.separator = separator self.module_methods = "" def __call__(self, file=None, Type=None): self.codelist = [ self.header % self.__dict__] self.funclist = [ _CFUNCDICT_HEADER ] if Type is None: self.bodygenerator() else: self.bodygenerator(Type) self.funclist.append(_CFUNCDICT_TAIL) self.codelist.append(_METHODS_DEF % self.__dict__) self.codelist.extend(self.funclist) self.codelist.append(self.tail % self.__dict__) sourcecode = "".join(self.codelist) if file: f = open(file,"w") f.write(sourcecode) f.close() else: return sourcecode def addcfunc(self, name, key=None): if key is None: key = name self.funclist.append(_ADDCFUNC_TEMPLATE % (key, name)) def addmethod(self, name, key=None): if key is None: key = name self.module_methods += (ADDMETHOD_TEMPLATE % (key, name)) class ConvCodeGenerator(CodeGenerator): def __init__(self, *components): CodeGenerator.__init__(self, *components) self.module = "conv" def addcfunc(self, type, name): CodeGenerator.addcfunc(self, type+name, key=repr((type, name))) def bodygenerator(self): """Generates the repetitive sections of code for conversions""" # Iterate over the "from" datatype. for cfg1 in typeconfig: t1 = apply(ConvParams, cfg1) if t1.typename in ["Complex32","Complex64"]: frompy = COMPLEX_FROM_PyVALUE_TEMPLATE aspy = COMPLEX_AS_PyVALUE_TEMPLATE else: frompy = FROM_PyVALUE_TEMPLATE aspy = AS_PyVALUE_TEMPLATE self.codelist.append((self.separator + aspy + frompy) % \ t1.__dict__) self.addcfunc(t1.typename, "asPyValue") self.addcfunc(t1.typename, "fromPyValue") # Iterate over the "to" datatype for cfg2 in typeconfig: t2 = apply(ConvParams, cfg2) if cfg1 == cfg2: continue t1.desttypename = t2.typename t1.desttypecast = t2.typecast t1.numarray_to_numarray = numarray_to_numarray(t1.typename, t2.typename) % t1.__dict__ self.codelist.append(CONVERSION_TEMPLATE % t1.__dict__) typetup = repr((t1.typename, t2.typename)) name = t1.typename + "as" + t2.typename self.funclist.append(_ADDCFUNC_TEMPLATE % (typetup, name)) class SortCodeGenerator(CodeGenerator): def __init__(self, *components): CodeGenerator.__init__(self, *components) self.module = "sort" def addcfunc(self, type, name): CodeGenerator.addcfunc(self, name+type, key=repr((type, name))) def bodygenerator(self): for cfg in typeconfig: t = apply(ConvParams, cfg) if t.typename in ["Complex32","Complex64"]: t.__dict__.update(sort_complex_td) else: t.__dict__.update(sort_operator_td) self.codelist.append((self.separator + SORT_TEMPLATE) % t.__dict__) self.addcfunc(t.typename, "sort") self.addcfunc(t.typename, "asort") self.addcfunc(t.typename, "searchsorted") self.addcfunc(t.typename, "fillarray") self.addcfunc(t.typename, "mxmultiply") self.addcfunc(t.typename, "nonzeroCoords") class BytesCodeGenerator(CodeGenerator): def __init__(self, *components): CodeGenerator.__init__(self, *components) self.module = "bytes" def bodygenerator(self): for cfg in bytesconfig: t = apply(BytesParams, cfg) self.codelist.append((self.separator + BYTES_TEMPLATE) % t.__dict__) self.addcfunc("copy"+ t.sizename) self.addcfunc("byteswap"+t.sizename) self.addcfunc("align"+t.sizename) self.addcfunc("choose"+t.sizename) self.codelist.append((self.separator + CHOOSE_TEMPLATE) % NBytesParams.__dict__) self.addcfunc("chooseNbytes") self.addcfunc("copyNbytes") self.addcfunc("putNbytes") self.addcfunc("takeNbytes") # Hack in the type based (not size based) methods for complex self.codelist.append((self.separator + BYTESWAP_TEMPLATE) % Complex32BytesCfg.__dict__) self.addcfunc("byteswapComplex32" ) self.codelist.append((self.separator + BYTESWAP_TEMPLATE) % Complex64BytesCfg.__dict__) self.addcfunc("byteswapComplex64" ) self.addmethod("copyToString") class UFuncCodeGenerator(CodeGenerator): def __init__(self, *components): CodeGenerator.__init__(self, *components) def bodygenerator(self, Type): """Generates the repetitive sections of code.""" self.module = "ufunc" + Type # Loop over ufunc table for cfg in ufuncconfigs: ufo = apply(UFuncParams, cfg) self.codelist.append(self.separator % ufo.pyname) # Loop over signatures for given ufunc for sig in ufo.sigs: if ufo.ninputs + ufo.noutputs != len(sig): # populate default signatures sig = (sig[0],)*ufo.ninputs + (sig[1],)*ufo.noutputs for i in range(ufo.ninputs): setattr(ufo, "intype%d" % i, sig[i]); for i in range(ufo.noutputs): setattr(ufo, "outtype%d" % i, sig[i+ufo.ninputs]); if ufo.intype0 != Type: continue if ufo.template is None: if ufo.ninputs == 1: ufo.template = UFUNC_UNARY_TEMPLATE ufo.vslist = ['vector'] elif ufo.ninputs == 2: if sig[0] == sig[-1]: ufo.template = UFUNC_BINARY_TEMPLATE ufo.vslist = ['vector_vector','vector_scalar','scalar_vector', 'reduce', 'accumulate'] else: ufo.template = UFUNC_COMPARE_TEMPLATE ufo.vslist = ['vector_vector','vector_scalar','scalar_vector'] else: raise ValueError("Can't handle ufuncs with > 2 inputs") # Expand opt_decls in terms of ufo vars ufo.optional_declarations = ufo.opt_decls % ufo.__dict__ # Expand template in terms of ufo vars self.codelist.append(ufo.template % ufo.__dict__) # for each form, add for form in ufo.vslist: if form in ["accumulate","reduce"]: sig2 = ((sig[0],),(sig[1],)) else: sig2 = (sig[:ufo.ninputs],sig[-ufo.noutputs:],) self.addcfunc(name=ufo.pyname+"_"+ufo.intype0+"_"+form, key=repr((ufo.pyname, form, sig2))) #*********************************************************************# generate_conv_code = ConvCodeGenerator() generate_sort_code = SortCodeGenerator(SORT_HEADER) generate_bytes_code = BytesCodeGenerator(BYTES_HEADER) generate_ufunc_code = UFuncCodeGenerator(UFUNC_HEADER, _TAIL, "/********************* %s *********************/\n") def generate(Name, Type=None): if Type is None: s = "generate_%s_code('Src/_%smodule.c')" % (Name, Name) else: s = "generate_%s_code('Src/_%smodule.c', '%s')" % \ (Name, Name+Type, Type) eval(s) # # PseudoMake compares the modification date of Lib/codegenerator.py # to the source code module implied by Name. If the codegenerator is # newer, the specified module is regenerated. # # # This code is written to be executed from the parent directory of Lib, # where setup.py resides. # def PseudoMake(Name, Type=None): if Type is None: Source = "Src/_%smodule.c" % Name else: Source = "Src/_%smodule.c" % (Name+Type) timemodgen = os.path.getmtime("Lib/codegenerator.py") # If codegenerator module more recent, regenerate Source if os.path.exists(Source): timemod = os.path.getmtime(Source) else: timemod = -1 if timemodgen > timemod or "--check-dates" not in sys.argv: print "generating new version of", Source generate(Name, Type) def GenAll(): PseudoMake("conv") PseudoMake("sort") PseudoMake("bytes") types = ["Bool", "Int8", "UInt8", "Int16", "UInt16", "Int32", "UInt32", "Float32", "Float64", "Complex32","Complex64"] types.append("Int64") if hasUInt64(): types.append("UInt64") for T in types: PseudoMake("ufunc",T) main = GenAll if __name__ == "__main__": GenAll()