|
@@ -0,0 +1,1474 @@
|
|
|
|
|
+#include <stdio.h>
|
|
|
|
|
+#include "squirrel.h"
|
|
|
|
|
+#include <string.h>
|
|
|
|
|
+#include <inttypes.h>
|
|
|
|
|
+#include <math.h>
|
|
|
|
|
+#include <stdlib.h>
|
|
|
|
|
+#include <sys/time.h>
|
|
|
|
|
+//#include <pthread.h>
|
|
|
|
|
+
|
|
|
|
|
+SQ_OPT_STRING_STRLEN();
|
|
|
|
|
+
|
|
|
|
|
+extern "C" {
|
|
|
|
|
+#include "nn.h"
|
|
|
|
|
+
|
|
|
|
|
+void *ann_malloc(size_t sz)
|
|
|
|
|
+{
|
|
|
|
|
+ return sq_malloc(sz);
|
|
|
|
|
+}
|
|
|
|
|
+void ann_free(void *p)
|
|
|
|
|
+{
|
|
|
|
|
+ sq_free(p, 0);
|
|
|
|
|
+}
|
|
|
|
|
+}
|
|
|
|
|
+
|
|
|
|
|
+#define NR_FLAG_NONE 0
|
|
|
|
|
+#define NR_FLAG_TRAINING (1<<0) /* NN is training in a thread. */
|
|
|
|
|
+#define NR_FLAG_REGRESSOR (1<<1) /* NN will be used for regression. */
|
|
|
|
|
+#define NR_FLAG_CLASSIFIER (1<<2) /* NN will be used for classification.*/
|
|
|
|
|
+#define NR_FLAG_NORMALIZE (1<<3) /* Perform input/output normalization.*/
|
|
|
|
|
+#define NR_FLAG_AUTO_STOP (1<<4) /* Auto stop on training. */
|
|
|
|
|
+#define NR_FLAG_OF_DETECTED (1<<5) /* Auto stopped on overfitting. */
|
|
|
|
|
+#define NR_FLAG_BACKTRACK (1<<6) /* Auto stop with backtracking. */
|
|
|
|
|
+
|
|
|
|
|
+/* Flags to persist when saving the NN. */
|
|
|
|
|
+#define NR_FLAG_TO_PERSIST (NR_FLAG_REGRESSOR| \
|
|
|
|
|
+ NR_FLAG_CLASSIFIER| \
|
|
|
|
|
+ NR_FLAG_NORMALIZE| \
|
|
|
|
|
+ NR_FLAG_OF_DETECTED)
|
|
|
|
|
+
|
|
|
|
|
+/* Flags to transfer after training. */
|
|
|
|
|
+#define NR_FLAG_TO_TRANSFER (NR_FLAG_OF_DETECTED)
|
|
|
|
|
+
|
|
|
|
|
+#define NR_MAX_LAYERS 32
|
|
|
|
|
+#define NR_RDB_ENC_VER 2
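+
+/* A minimal sketch of a typical flags combination (illustrative only, not
+ * mandated by the API): a classifier that normalizes its inputs and stops
+ * automatically when overfitting is detected could be created with
+ * NR_FLAG_CLASSIFIER|NR_FLAG_NORMALIZE|NR_FLAG_AUTO_STOP|NR_FLAG_BACKTRACK. */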
|
|
|
|
|
+
|
|
|
|
|
+typedef struct {
|
|
|
|
|
+ uint32_t len, maxlen;
|
|
|
|
|
+ float *inputs, *outputs;
|
|
|
|
|
+} NRDataset;
|
|
|
|
|
+
|
|
|
|
|
+typedef struct {
|
|
|
|
|
+ uint64_t id; /* Neural network unique ID. */
|
|
|
|
|
+ uint64_t training_total_steps; /* How many steps of training the network
|
|
|
|
|
+ received. A step is a single input/output
|
|
|
|
|
+ pattern presented to the net (counting
|
|
|
|
|
+ the same pattern multiple times) */
|
|
|
|
|
+ uint64_t training_total_ms; /* Total milliseconds time of training. */
|
|
|
|
|
+ uint64_t training_max_cycles; /* Max cycles of a single training. */
|
|
|
|
|
+ uint64_t training_max_ms; /* Max time of a single training. */
|
|
|
|
|
+ uint32_t flags; /* NR_FLAG_... */
|
|
|
|
|
+ uint32_t epochs; /* Number of training epochs so far. */
|
|
|
|
|
+ AnnRprop *nn; /* Neural network structure. */
|
|
|
|
|
+ NRDataset dataset; /* Training dataset. */
|
|
|
|
|
+ NRDataset test; /* Testing dataset. */
|
|
|
|
|
+ float dataset_error; /* Average error in the training dataset. */
|
|
|
|
|
+ float test_error; /* Average error in the test dataset. */
|
|
|
|
|
+ float test_class_error; /* Percentage of wrong classifications in test
|
|
|
|
|
+ dataset. Only applicable to nets flagged with
|
|
|
|
|
+ NR_FLAG_CLASSIFIER. */
|
|
|
|
|
+ /* For normalized (NR_FLAG_NORMALIZE) networks. */
|
|
|
|
|
+ float *inorm; /* Inputs normalization factors. */
|
|
|
|
|
+ float *onorm; /* Outputs normalization factors. */
|
|
|
|
|
+} NRTypeObject;
|
|
|
|
|
+#if 0
|
|
|
|
|
+typedef struct {
|
|
|
|
|
+ //RedisModuleString *key; /* Key name of the NN we are training.
|
|
|
|
|
+ // Set to NULL for unused slots. */
|
|
|
|
|
+ int db_id; /* DB ID where the key is. */
|
|
|
|
|
+ pthread_t tid; /* Thread ID of the trainer. */
|
|
|
|
|
+ int in_progress; /* 0 if training terminated. */
|
|
|
|
|
+ NRTypeObject *nr; /* A copy of the NN we are training. */
|
|
|
|
|
+ float dataset_error; /* Dataset error in the last cycle. */
|
|
|
|
|
+ float test_error; /* Test error in the last cycle. */
|
|
|
|
|
+ float class_error; /* Percentage of wrong classifications. */
|
|
|
|
|
+ int curcycle; /* Current cycle. */
|
|
|
|
|
+} NRPendingTraining;
|
|
|
|
|
+#endif
|
|
|
|
|
+/* We keep an array of NNs currently training in other threads.
|
|
|
|
|
+ * Every time an NN command is called, we try to see if there are
|
|
|
|
|
+ * finished trainings, in order to update weights of the original
|
|
|
|
|
+ * NN stored into the key (we work on a copy on the other thread).*/
|
|
|
|
|
+#define NR_PENDING_TRAINING_MAX_LEN 32
|
|
|
|
|
+
|
|
|
|
|
+#if 0
|
|
|
|
|
+#define REDISMODULE_ERR -1
|
|
|
|
|
+#define REDISMODULE_OK 0
|
|
|
|
|
+
|
|
|
|
|
+#define RedisModuleCtx void
|
|
|
|
|
+
|
|
|
|
|
+#define RedisModule_Log(ctx, log_level, msg)
|
|
|
|
|
+
|
|
|
|
|
+#define UNUSED(V) ((void) V)
|
|
|
|
|
+typedef SQString RedisModuleString;
|
|
|
|
|
+
|
|
|
|
|
+static uint64_t NRNextId = 1; /* Next neural network unique ID. */
|
|
|
|
|
+
|
|
|
|
|
+#define RedisModule_Alloc(x) sq_malloc(x)
|
|
|
|
|
+
|
|
|
|
|
+static void *RedisModule_Calloc(size_t nelm, size_t sz)
|
|
|
|
|
+{
|
|
|
|
|
+ size_t malloc_size = nelm * sz;
|
|
|
|
|
+ void *ptr = sq_malloc(malloc_size);
|
|
|
|
|
+ if(ptr) memset(ptr, 0, malloc_size);
|
|
|
|
|
+ return ptr;
|
|
|
|
|
+}
|
|
|
|
|
+
|
|
|
|
|
+static void *RedisModule_Realloc(void *oldPtr, size_t sz)
|
|
|
|
|
+{
|
|
|
|
|
+ void *ptr = sq_realloc(oldPtr, 0, sz);
|
|
|
|
|
+ return ptr;
|
|
|
|
|
+}
|
|
|
|
|
+#define RedisModule_Free(x) sq_free(x, 0)
|
|
|
|
|
+
|
|
|
|
|
+static pthread_mutex_t NRPendingTrainingMutex = PTHREAD_MUTEX_INITIALIZER;
|
|
|
|
|
+/* All the followings must be accessed after acquiring the mutex. */
|
|
|
|
|
+static NRPendingTraining NRTrainings[NR_PENDING_TRAINING_MAX_LEN];
|
|
|
|
|
+static int NRPendingTrainingCount = 0; /* Number of pending trainings. */
|
|
|
|
|
+
|
|
|
|
|
+/* ========================== Low level object API ========================== */
|
|
|
|
|
+
|
|
|
|
|
+long long NRMilliseconds(void) {
|
|
|
|
|
+ struct timeval tv;
|
|
|
|
|
+ long long ust;
|
|
|
|
|
+
|
|
|
|
|
+ gettimeofday(&tv, NULL);
|
|
|
|
|
+ ust = ((long long)tv.tv_sec)*1000000;
|
|
|
|
|
+ ust += tv.tv_usec;
|
|
|
|
|
+ return ust/1000;
|
|
|
|
|
+}
|
|
|
|
|
+
|
|
|
|
|
+/* Create a network with the specified parameters. Note that the layers
|
|
|
|
|
+ * must be specified from the output layer[0] to the input
|
|
|
|
|
+ * layer[N]. Each element in the integer array 'layer' specifies how many
|
|
|
|
|
+ * units there are in the corresponding layer. */
|
|
|
|
|
+static NRTypeObject *createNRTypeObject(int flags, int *layers, int numlayers, int dset_len, int test_len) {
|
|
|
|
|
+ NRTypeObject *o;
|
|
|
|
|
+ o = (NRTypeObject*)RedisModule_Calloc(1,sizeof(*o));
|
|
|
|
|
+ o->id = NRNextId++;
|
|
|
|
|
+ o->flags = flags;
|
|
|
|
|
+ o->nn = AnnCreateNet(numlayers,layers);
|
|
|
|
|
+ o->dataset.maxlen = dset_len;
|
|
|
|
|
+ o->test.maxlen = test_len;
|
|
|
|
|
+ int ilen = ANN_INPUT_UNITS(o->nn);
|
|
|
|
|
+ int olen = ANN_OUTPUT_UNITS(o->nn);
|
|
|
|
|
+ o->inorm = (float*)RedisModule_Calloc(1,sizeof(float)*ilen);
|
|
|
|
|
+ o->onorm = (float*)RedisModule_Calloc(1,sizeof(float)*olen);
|
|
|
|
|
+ for (int j = 0; j < ilen; j++) o->inorm[j] = 1;
|
|
|
|
|
+ for (int j = 0; j < olen; j++) o->onorm[j] = 1;
|
|
|
|
|
+ return o;
|
|
|
|
|
+}
|
|
|
|
|
+
|
|
|
|
|
+/* Insert data (observations needed to train and test the NN) into the
|
|
|
|
|
+ * NN object. While the learning and testing datasets are not yet full
|
|
|
|
|
+ * the observed pattern is inserted into one or the other in
|
|
|
|
|
+ * order to make sure the two datasets are populated evenly. When both
|
|
|
|
|
+ * are already full, a random element from one or the other (doing
|
|
|
|
|
+ * a random weighted choice depending on the length) is substituted with
|
|
|
|
|
+ * the new item. */
|
|
|
|
|
+#define NR_INSERT_NO_TARGET 0 /* Auto select where to insert. */
|
|
|
|
|
+#define NR_INSERT_TRAIN 1 /* Insert in training dataset. */
|
|
|
|
|
+#define NR_INSERT_TEST 2 /* Insert in testing dataset. */
|
|
|
|
|
+static void NRTypeInsertData(NRTypeObject *o, float *inputs, float *outputs,
|
|
|
|
|
+ int target_ds) {
|
|
|
|
|
+ NRDataset *target = NULL;
|
|
|
|
|
+
|
|
|
|
|
+ /* Check if there is no dataset at all. This may be a valid setup
|
|
|
|
|
+ * with online learning, sample by sample. */
|
|
|
|
|
+ if (o->dataset.maxlen == 0 && o->test.maxlen == 0) return;
|
|
|
|
|
+
|
|
|
|
|
+ /* If the user specified a target, select it. */
|
|
|
|
|
+ if (target_ds == NR_INSERT_TRAIN) target = &o->dataset;
|
|
|
|
|
+ else if (target_ds == NR_INSERT_TEST) target = &o->test;
|
|
|
|
|
+
|
|
|
|
|
+ /* If no target is specified, but there is only one possible
|
|
|
|
|
+ * target, select it ASAP. */
|
|
|
|
|
+ if (o->dataset.maxlen == 0) {
|
|
|
|
|
+ target = &o->test;
|
|
|
|
|
+ } else if (o->test.maxlen == 0) {
|
|
|
|
|
+ target = &o->dataset;
|
|
|
|
|
+ }
|
|
|
|
|
+
|
|
|
|
|
+ /* Otherwise choose as the target to populate the dataset with less data
|
|
|
|
|
+ * relative to its size. */
|
|
|
|
|
+ if (target == NULL) {
|
|
|
|
|
+ /* If one of the two datasets is still not full, pick
|
|
|
|
|
+ * based on fill percentage. Otherwise pick a random
|
|
|
|
|
+ * target relatively to their size. */
|
|
|
|
|
+ if (o->dataset.len != o->dataset.maxlen ||
|
|
|
|
|
+ o->test.len != o->test.maxlen)
|
|
|
|
|
+ {
|
|
|
|
|
+ float fill_a = (float)o->dataset.len / o->dataset.maxlen;
|
|
|
|
|
+ float fill_b = (float)o->test.len / o->test.maxlen;
|
|
|
|
|
+ target = (fill_a <= fill_b) ? &o->dataset : &o->test;
|
|
|
|
|
+ } else {
|
|
|
|
|
+ double r = (double)rand()/RAND_MAX;
|
|
|
|
|
+ double sumlen = o->dataset.maxlen + o->test.maxlen;
|
|
|
|
|
+ if (r < (double)o->dataset.maxlen/sumlen) {
|
|
|
|
|
+ target = &o->dataset;
|
|
|
|
|
+ } else {
|
|
|
|
|
+ target = &o->test;
|
|
|
|
|
+ }
|
|
|
|
|
+ }
|
|
|
|
|
+ }
|
|
|
|
|
+
|
|
|
|
|
+ /* Append if there is room or substitute with a random entry. */
|
|
|
|
|
+ size_t idx;
|
|
|
|
|
+ int j, numin = ANN_INPUT_UNITS(o->nn),
|
|
|
|
|
+ numout = ANN_OUTPUT_UNITS(o->nn);
|
|
|
|
|
+
|
|
|
|
|
+ if (target->maxlen == target->len) {
|
|
|
|
|
+ idx = rand() % target->maxlen;
|
|
|
|
|
+ } else {
|
|
|
|
|
+ idx = target->len;
|
|
|
|
|
+ target->len++;
|
|
|
|
|
+ target->inputs = (float*)RedisModule_Realloc(target->inputs,
|
|
|
|
|
+ sizeof(float)*numin*target->len);
|
|
|
|
|
+ target->outputs = (float*)RedisModule_Realloc(target->outputs,
|
|
|
|
|
+ sizeof(float)*numout*target->len);
|
|
|
|
|
+ }
|
|
|
|
|
+
|
|
|
|
|
+ /* Finally store the values at position. */
|
|
|
|
|
+ for (j = 0; j < numin; j++)
|
|
|
|
|
+ target->inputs[idx*numin+j] = inputs[j];
|
|
|
|
|
+ for (j = 0; j < numout; j++)
|
|
|
|
|
+ target->outputs[idx*numout+j] = outputs[j];
|
|
|
|
|
+}
|
|
|
|
|
+
|
|
|
|
|
+/* Free the specified dataset. */
|
|
|
|
|
+void NRDatasetFree(NRDataset *dset) {
|
|
|
|
|
+ RedisModule_Free(dset->inputs);
|
|
|
|
|
+ RedisModule_Free(dset->outputs);
|
|
|
|
|
+}
|
|
|
|
|
+
|
|
|
|
|
+/* Free a whole NN object. */
|
|
|
|
|
+void NRTypeReleaseObject(NRTypeObject *o) {
|
|
|
|
|
+ AnnFree(o->nn);
|
|
|
|
|
+ NRDatasetFree(&o->dataset);
|
|
|
|
|
+ NRDatasetFree(&o->test);
|
|
|
|
|
+ RedisModule_Free(o->inorm);
|
|
|
|
|
+ RedisModule_Free(o->onorm);
|
|
|
|
|
+ RedisModule_Free(o);
|
|
|
|
|
+}
|
|
|
|
|
+
|
|
|
|
|
+/* ================================ Training =============================== */
|
|
|
|
|
+
|
|
|
|
|
+/* Clone a neural network object, including the training and test dataset.
|
|
|
|
|
+ * We use cloning in order to train in a different thread, and later
|
|
|
|
|
+ * copy the weights back into the original NN.
|
|
|
|
|
+ *
|
|
|
|
|
+ * Note when 'newid' is 0, the copied object NN unique ID is the same as the
|
|
|
|
|
+ * original as normally this is what we want, in order to later match the
|
|
|
|
|
+ * trained network with the object stored at the specified key
|
|
|
|
|
+ * in the pending training structure.
|
|
|
|
|
+ *
|
|
|
|
|
+ * However if the copy is performed with other goals, 'newid' should
|
|
|
|
|
+ * be set to non-zero in order to create a net with a different ID. */
|
|
|
|
|
+NRTypeObject *NRClone(NRTypeObject *o, int newid) {
|
|
|
|
|
+ NRTypeObject *copy;
|
|
|
|
|
+ copy = (NRTypeObject*)RedisModule_Calloc(1,sizeof(*o));
|
|
|
|
|
+ *copy = *o;
|
|
|
|
|
+ if (newid) copy->id = NRNextId++;
|
|
|
|
|
+ copy->nn = AnnClone(o->nn);
|
|
|
|
|
+ copy->dataset = o->dataset;
|
|
|
|
|
+ copy->test = o->test;
|
|
|
|
|
+
|
|
|
|
|
+ int ilen = ANN_INPUT_UNITS(o->nn);
|
|
|
|
|
+ int olen = ANN_OUTPUT_UNITS(o->nn);
|
|
|
|
|
+ copy->dataset.inputs = (float*)RedisModule_Alloc(sizeof(float)*ilen*o->dataset.len);
|
|
|
|
|
+ copy->dataset.outputs = (float*)RedisModule_Alloc(sizeof(float)*olen*o->dataset.len);
|
|
|
|
|
+ copy->test.inputs = (float*)RedisModule_Alloc(sizeof(float)*ilen*o->test.len);
|
|
|
|
|
+ copy->test.outputs = (float*)RedisModule_Alloc(sizeof(float)*olen*o->test.len);
|
|
|
|
|
+ memcpy(copy->dataset.inputs,o->dataset.inputs,sizeof(float)*ilen*o->dataset.len);
|
|
|
|
|
+ memcpy(copy->dataset.outputs,o->dataset.outputs,sizeof(float)*olen*o->dataset.len);
|
|
|
|
|
+ memcpy(copy->test.inputs,o->test.inputs,sizeof(float)*ilen*o->test.len);
|
|
|
|
|
+ memcpy(copy->test.outputs,o->test.outputs,sizeof(float)*olen*o->test.len);
|
|
|
|
|
+
|
|
|
|
|
+ copy->inorm = (float*)RedisModule_Alloc(sizeof(float)*ilen);
|
|
|
|
|
+ copy->onorm = (float*)RedisModule_Alloc(sizeof(float)*olen);
|
|
|
|
|
+ memcpy(copy->inorm,o->inorm,sizeof(float)*ilen);
|
|
|
|
|
+ memcpy(copy->onorm,o->onorm,sizeof(float)*olen);
|
|
|
|
|
+ return copy;
|
|
|
|
|
+}
|
|
|
|
|
+
|
|
|
|
|
+/* Transfer the weights from the source to the destination NN.
|
|
|
|
|
+ * This is used after the learning process finished in a different
|
|
|
|
|
+ * thread in order to transfer the learning back to the original
|
|
|
|
|
+ * NN. */
|
|
|
|
|
+static void NRTransferWeights(RedisModuleCtx *ctx, NRTypeObject *dst, NRTypeObject *src) {
|
|
|
|
|
+ if (dst->id != src->id) {
|
|
|
|
|
+ RedisModule_Log(ctx,"warning",
|
|
|
|
|
+ "NSTransferWeight(): source and destination neural network IDs "
|
|
|
|
|
+ "don't match. This is unexpected, probably a bug inside the "
|
|
|
|
|
+ "module. Weights not transferred back to the origina NN.");
|
|
|
|
|
+ return;
|
|
|
|
|
+ }
|
|
|
|
|
+
|
|
|
|
|
+ /* It would be faster to memcpy just the weight array for each layer,
|
|
|
|
|
+ * however this way we access the NN in a more abstract way, and should
|
|
|
|
|
+ * be fast enough in most cases. We can always optimize it later. */
|
|
|
|
|
+ AnnFree(dst->nn);
|
|
|
|
|
+ dst->nn = AnnClone(src->nn);
|
|
|
|
|
+ dst->training_total_steps = src->training_total_steps;
|
|
|
|
|
+ dst->training_total_ms = src->training_total_ms;
|
|
|
|
|
+ dst->dataset_error = src->dataset_error;
|
|
|
|
|
+ dst->test_error = src->test_error;
|
|
|
|
|
+ dst->test_class_error = src->test_class_error;
|
|
|
|
|
+ dst->flags |= src->flags & NR_FLAG_TO_TRANSFER;
|
|
|
|
|
+
|
|
|
|
|
+ int ilen = ANN_INPUT_UNITS(src->nn);
|
|
|
|
|
+ int olen = ANN_OUTPUT_UNITS(src->nn);
|
|
|
|
|
+ memcpy(dst->inorm,src->inorm,sizeof(float)*ilen);
|
|
|
|
|
+ memcpy(dst->onorm,src->onorm,sizeof(float)*olen);
|
|
|
|
|
+}
|
|
|
|
|
+
|
|
|
|
|
+/* Threaded training entry point.
|
|
|
|
|
+ *
|
|
|
|
|
+ * To get some clue about overfitting algorithm behavior:
|
|
|
|
|
+ * #define NR_TRAINING_DEBUG 1
|
|
|
|
|
+ */
|
|
|
|
|
+void *NRTrainingThreadMain(void *arg) {
|
|
|
|
|
+ NRPendingTraining *pt = (NRPendingTraining*)arg;
|
|
|
|
|
+ NRTypeObject *nr = pt->nr;
|
|
|
|
|
+ int training_iterations = 1;
|
|
|
|
|
+ float train_error = 0;
|
|
|
|
|
+ float test_error = 0;
|
|
|
|
|
+ float class_error = 0;
|
|
|
|
|
+ float past_train_error = 1.0/0.0;
|
|
|
|
|
+ float past_test_error = 1.0/0.0;
|
|
|
|
|
+ int auto_stop = nr->flags & NR_FLAG_AUTO_STOP;
|
|
|
|
|
+ int backtrack = nr->flags & NR_FLAG_BACKTRACK;
|
|
|
|
|
+
|
|
|
|
|
+ uint64_t cycles = 0;
|
|
|
|
|
+ long long start = NRMilliseconds();
|
|
|
|
|
+ long long cycle_time;
|
|
|
|
|
+ int overfitting_count = 0;
|
|
|
|
|
+ int overfitting_limit = 5;
|
|
|
|
|
+ float best_test_error = 1.0/0.0;
|
|
|
|
|
+
|
|
|
|
|
+ nr->flags &= ~NR_FLAG_TO_TRANSFER;
|
|
|
|
|
+
|
|
|
|
|
+ /* If the network is auto normalized, we need to transform the inputs
|
|
|
|
|
+ * in a way that's acceptable for the NN. We just find the maximum
|
|
|
|
|
+ * absolute value, and divide by it, to get a -1,1 range. There
|
|
|
|
|
+ * are more advanced transformations that are usually performed that
|
|
|
|
|
+ * could be implemented in the future.
|
|
|
|
|
+ *
|
|
|
|
|
+ * Note that we compute the normalization vectors for all the inputs
|
|
|
|
|
+ * and outputs, however if the network is a classifier, flagged with
|
|
|
|
|
+ * (NR_FLAG_CLASSIFIER), no output normalization will be done since
|
|
|
|
|
+ * the data is already in 0/1 format. */
|
|
|
|
|
+ if ((nr->flags & NR_FLAG_NORMALIZE) && nr->dataset.len) {
|
|
|
|
|
+ int ilen = ANN_INPUT_UNITS(nr->nn);
|
|
|
|
|
+ int olen = ANN_OUTPUT_UNITS(nr->nn);
|
|
|
|
|
+ float *imax = nr->inorm;
|
|
|
|
|
+ float *omax = nr->onorm;
|
|
|
|
|
+ float *inputs = nr->dataset.inputs;
|
|
|
|
|
+ float *outputs = nr->dataset.outputs;
|
|
|
|
|
+ for (int i = 0; i < ilen; i++) imax[i] = 1;
|
|
|
|
|
+ for (int i = 0; i < olen; i++) omax[i] = 1;
|
|
|
|
|
+
|
|
|
|
|
+ /* Compute the max values vectors. */
|
|
|
|
|
+ for (uint32_t j = 0; j < nr->dataset.len; j++) {
|
|
|
|
|
+ for (int i = 0; i < ilen; i++)
|
|
|
|
|
+ if (fabs(inputs[i]) > imax[i]) imax[i] = fabs(inputs[i]);
|
|
|
|
|
+ for (int i = 0; i < olen; i++)
|
|
|
|
|
+ if (fabs(outputs[i]) > omax[i]) omax[i] = fabs(outputs[i]);
|
|
|
|
|
+ inputs += ilen;
|
|
|
|
|
+ outputs += olen;
|
|
|
|
|
+ }
|
|
|
|
|
+
|
|
|
|
|
+ /* Likely we are not seeing what will really be the true input/output
|
|
|
|
|
+ * maximum value, so we multiply the maximum values found by a constant.
|
|
|
|
|
+ * However if the max is exactly "1" we assume it's a classification
|
|
|
|
|
+ * input and don't alter it. */
|
|
|
|
|
+ for (int i = 0; i < ilen; i++) if (imax[i] != 1) imax[i] *= 1.2;
|
|
|
|
|
+ for (int i = 0; i < olen; i++) if (omax[i] != 1) omax[i] *= 1.2;
|
|
|
|
|
+
|
|
|
|
|
+ /* We can normalize the dataset directly: after the training it will
|
|
|
|
|
+ * be discarded anyway. */
|
|
|
|
|
+ inputs = nr->dataset.inputs;
|
|
|
|
|
+ outputs = nr->dataset.outputs;
|
|
|
|
|
+ for (uint32_t j = 0; j < nr->dataset.len; j++) {
|
|
|
|
|
+ for (int i = 0; i < ilen; i++) inputs[i] /= nr->inorm[i];
|
|
|
|
|
+ if (!(nr->flags & NR_FLAG_CLASSIFIER))
|
|
|
|
|
+ for (int i = 0; i < olen; i++) outputs[i] /= nr->onorm[i];
|
|
|
|
|
+ inputs += ilen;
|
|
|
|
|
+ outputs += olen;
|
|
|
|
|
+ }
|
|
|
|
|
+
|
|
|
|
|
+ inputs = nr->test.inputs;
|
|
|
|
|
+ outputs = nr->test.outputs;
|
|
|
|
|
+ for (uint32_t j = 0; j < nr->test.len; j++) {
|
|
|
|
|
+ for (int i = 0; i < ilen; i++) inputs[i] /= nr->inorm[i];
|
|
|
|
|
+ if (!(nr->flags & NR_FLAG_CLASSIFIER))
|
|
|
|
|
+ for (int i = 0; i < olen; i++) outputs[i] /= nr->onorm[i];
|
|
|
|
|
+ inputs += ilen;
|
|
|
|
|
+ outputs += olen;
|
|
|
|
|
+ }
|
|
|
|
|
+ }
|
|
|
|
|
+
|
|
|
|
|
+ AnnRprop *saved = NULL; /* Saved to recover on overfitting. */
|
|
|
|
|
+ float saved_error; /* The test error of the saved NN. */
|
|
|
|
|
+ float saved_train_error; /* The training dataset error of the saved NN */
|
|
|
|
|
+ float saved_class_error; /* The % of classification errors of saved NN */
|
|
|
|
|
+
|
|
|
|
|
+ while(1) {
|
|
|
|
|
+ long long cycle_start = NRMilliseconds();
|
|
|
|
|
+
|
|
|
|
|
+ train_error = AnnTrain(nr->nn,
|
|
|
|
|
+ nr->dataset.inputs,
|
|
|
|
|
+ nr->dataset.outputs,
|
|
|
|
|
+ 0,
|
|
|
|
|
+ training_iterations,
|
|
|
|
|
+ nr->dataset.len,
|
|
|
|
|
+ ANN_ALGO_BPROP);
|
|
|
|
|
+ cycle_time = NRMilliseconds() - cycle_start;
|
|
|
|
|
+ nr->training_total_steps += nr->dataset.len*training_iterations;
|
|
|
|
|
+
|
|
|
|
|
+ /* Evaluate the error in the case of auto training, stop it
|
|
|
|
|
+ * once we see that the error in the training set is decreasing
|
|
|
|
|
+ * while the one in the test set is not. */
|
|
|
|
|
+ if (auto_stop) {
|
|
|
|
|
+ AnnTestError(nr->nn,
|
|
|
|
|
+ nr->test.inputs,
|
|
|
|
|
+ nr->test.outputs,
|
|
|
|
|
+ nr->test.len, &test_error, &class_error);
|
|
|
|
|
+
|
|
|
|
|
+ if (train_error < past_train_error &&
|
|
|
|
|
+ test_error > past_test_error)
|
|
|
|
|
+ {
|
|
|
|
|
+ overfitting_count++;
|
|
|
|
|
+ #ifdef NR_TRAINING_DEBUG
|
|
|
|
|
+ printf("+YCLE %lld: [%d] %f VS %f\n", (long long)cycles,
|
|
|
|
|
+ overfitting_count, train_error, test_error);
|
|
|
|
|
+ #endif
|
|
|
|
|
+ if (overfitting_count == overfitting_limit) {
|
|
|
|
|
+ nr->flags |= NR_FLAG_OF_DETECTED;
|
|
|
|
|
+ break;
|
|
|
|
|
+ }
|
|
|
|
|
+ } else if (overfitting_count > 0) {
|
|
|
|
|
+ #ifdef NR_TRAINING_DEBUG
|
|
|
|
|
+ printf("-YCLE %lld: [%d] %f VS %f\n", (long long)cycles,
|
|
|
|
|
+ overfitting_count, train_error, test_error);
|
|
|
|
|
+ #endif
|
|
|
|
|
+ overfitting_count--;
|
|
|
|
|
+ }
|
|
|
|
|
+
|
|
|
|
|
+ /* Save all the networks with a score better than the currently
|
|
|
|
|
+ * saved network. This can be a bit costly, but is safe: one
|
|
|
|
|
+ * more training cycle and overfitting can ruin it all. */
|
|
|
|
|
+ if (backtrack && (saved == NULL || test_error < saved_error)) {
|
|
|
|
|
+ #ifdef NR_TRAINING_DEBUG
|
|
|
|
|
+ printf("SAVED! %f < %f\n", test_error, saved_error);
|
|
|
|
|
+ #endif
|
|
|
|
|
+ saved_error = test_error;
|
|
|
|
|
+ saved_train_error = train_error;
|
|
|
|
|
+ saved_class_error = class_error;
|
|
|
|
|
+ if (saved) AnnFree(saved);
|
|
|
|
|
+ saved = AnnClone(nr->nn);
|
|
|
|
|
+ }
|
|
|
|
|
+
|
|
|
|
|
+ /* Best network found? Reset the overfitting hints counter. */
|
|
|
|
|
+ if (test_error < best_test_error) {
|
|
|
|
|
+ overfitting_count = 0;
|
|
|
|
|
+ best_test_error = test_error;
|
|
|
|
|
+ #ifdef NR_TRAINING_DEBUG
|
|
|
|
|
+ printf("BEST! %lld: <%d> %f VS %f\n", (long long)cycles,
|
|
|
|
|
+ overfitting_limit,train_error, test_error);
|
|
|
|
|
+ #endif
|
|
|
|
|
+ }
|
|
|
|
|
+
|
|
|
|
|
+ /* Also stop if the loss is zero in both datasets. */
|
|
|
|
|
+ if (train_error < 0.000000000000001 &&
|
|
|
|
|
+ test_error < 0.000000000000001) break;
|
|
|
|
|
+ }
|
|
|
|
|
+
|
|
|
|
|
+ cycles++;
|
|
|
|
|
+ long long total_time = NRMilliseconds()-start;
|
|
|
|
|
+
|
|
|
|
|
+ /* Cycles and milliseconds stop conditions. */
|
|
|
|
|
+ if (nr->training_max_cycles && cycles == nr->training_max_cycles)
|
|
|
|
|
+ break;
|
|
|
|
|
+ if (nr->training_max_ms && total_time > (long long)nr->training_max_ms)
|
|
|
|
|
+ break;
|
|
|
|
|
+
|
|
|
|
|
+ /* If this is a long training, doing just a single training iteration
|
|
|
|
|
+ * per cycle is not optimal: tune the number of iterations so that
|
|
|
|
|
+ * each cycle takes at least 100 milliseconds. */
|
|
|
|
|
+ if (total_time > 10000 && cycle_time < 100) training_iterations++;
|
|
|
|
|
+
|
|
|
|
|
+ past_train_error = train_error;
|
|
|
|
|
+ past_test_error = test_error;
|
|
|
|
|
+
|
|
|
|
|
+ /* Update stats for NR.THREADS to show progresses. */
|
|
|
|
|
+ pthread_mutex_lock(&NRPendingTrainingMutex);
|
|
|
|
|
+ pt->dataset_error = train_error;
|
|
|
|
|
+ pt->test_error = test_error;
|
|
|
|
|
+ if (nr->flags & NR_FLAG_CLASSIFIER) pt->class_error = class_error;
|
|
|
|
|
+ pt->curcycle = cycles;
|
|
|
|
|
+ pthread_mutex_unlock(&NRPendingTrainingMutex);
|
|
|
|
|
+ }
|
|
|
|
|
+
|
|
|
|
|
+ /* If auto stop is disabled, we still need to compute the test error
|
|
|
|
|
+ * in order to return this information to the main thread. */
|
|
|
|
|
+ if (!auto_stop) {
|
|
|
|
|
+ AnnTestError(nr->nn,
|
|
|
|
|
+ nr->test.inputs,
|
|
|
|
|
+ nr->test.outputs,
|
|
|
|
|
+ nr->test.len, &test_error, &class_error);
|
|
|
|
|
+ }
|
|
|
|
|
+
|
|
|
|
|
+ /* If both autostop and backtracking are enabled, we may have
|
|
|
|
|
+ * a better network saved! */
|
|
|
|
|
+ if (auto_stop && backtrack) {
|
|
|
|
|
+ if (saved && saved_error < test_error) {
|
|
|
|
|
+ #ifdef NR_TRAINING_DEBUG
|
|
|
|
|
+ printf("BACKTRACK: Saved network used!\n");
|
|
|
|
|
+ #endif
|
|
|
|
|
+ AnnFree(nr->nn);
|
|
|
|
|
+ nr->nn = saved;
|
|
|
|
|
+ test_error = saved_error;
|
|
|
|
|
+ train_error = saved_train_error;
|
|
|
|
|
+ class_error = saved_class_error;
|
|
|
|
|
+ } else if (saved) {
|
|
|
|
|
+ AnnFree(saved);
|
|
|
|
|
+ }
|
|
|
|
|
+ }
|
|
|
|
|
+
|
|
|
|
|
+ if (nr->flags & NR_FLAG_CLASSIFIER) nr->test_class_error = class_error;
|
|
|
|
|
+ nr->dataset_error = train_error;
|
|
|
|
|
+ nr->test_error = test_error;
|
|
|
|
|
+ nr->training_total_ms += NRMilliseconds()-start;
|
|
|
|
|
+
|
|
|
|
|
+ /* Signal that the training process has finished, it's up to the main
|
|
|
|
|
+ * thread to cleanup this training slot, copying the weights to the
|
|
|
|
|
+ * original neural network and reclaiming memory for the copy we
|
|
|
|
|
+ * used to work. */
|
|
|
|
|
+ pthread_mutex_lock(&NRPendingTrainingMutex);
|
|
|
|
|
+ pt->in_progress = 0;
|
|
|
|
|
+ pthread_mutex_unlock(&NRPendingTrainingMutex);
|
|
|
|
|
+ return NULL;
|
|
|
|
|
+}
|
|
|
|
|
+
|
|
|
|
|
+/* Start a background training in another thread. Return REDISMODULE_ERR if
|
|
|
|
|
+ * there is no free slot for training, as we already reached the maximum of
|
|
|
|
|
+ * networks we can train in parallel.
|
|
|
|
|
+ *
|
|
|
|
|
+ * The 'flags' argument specifies the additional NN flags to pass to the
|
|
|
|
|
+ * training routine:
|
|
|
|
|
+ *
|
|
|
|
|
+ * NR_FLAG_AUTO_STOP -- Automatically stop training on overtraining.
|
|
|
|
|
+ * NR_FLAG_BACKTRACK -- Save current NN state when overfitting is likely.
|
|
|
|
|
+ */
|
|
|
|
|
+int NRStartTraining(RedisModuleCtx *ctx, RedisModuleString *key, int dbid, NRTypeObject *nr) {
|
|
|
|
|
+ pthread_mutex_lock(&NRPendingTrainingMutex);
|
|
|
|
|
+ if (NRPendingTrainingCount == NR_PENDING_TRAINING_MAX_LEN) {
|
|
|
|
|
+ pthread_mutex_unlock(&NRPendingTrainingMutex);
|
|
|
|
|
+ return REDISMODULE_ERR;
|
|
|
|
|
+ }
|
|
|
|
|
+
|
|
|
|
|
+ /* Set up our training data. */
|
|
|
|
|
+ NRPendingTraining *pt = &NRTrainings[NRPendingTrainingCount];
|
|
|
|
|
+ //pt->key = RedisModule_CreateStringFromString(ctx,key);
|
|
|
|
|
+ //RedisModule_RetainString(ctx,pt->key);
|
|
|
|
|
+ pt->db_id = dbid;
|
|
|
|
|
+ pt->in_progress = 1;
|
|
|
|
|
+ pt->nr = NRClone(nr,0);
|
|
|
|
|
+ pt->dataset_error = 0;
|
|
|
|
|
+ pt->test_error = 0;
|
|
|
|
|
+ pt->class_error = 0;
|
|
|
|
|
+ pt->curcycle = 0;
|
|
|
|
|
+ if (pthread_create(&pt->tid,NULL,NRTrainingThreadMain,pt) != 0) {
|
|
|
|
|
+ RedisModule_Log(ctx,"warning","Unable to create a new pthread in NRStartTraining()");
|
|
|
|
|
+ //RedisModule_FreeString(ctx,pt->key);
|
|
|
|
|
+ pt->key = NULL;
|
|
|
|
|
+ NRTypeReleaseObject(pt->nr);
|
|
|
|
|
+ pthread_mutex_unlock(&NRPendingTrainingMutex);
|
|
|
|
|
+ return REDISMODULE_ERR;
|
|
|
|
|
+ }
|
|
|
|
|
+ NRPendingTrainingCount++;
|
|
|
|
|
+ nr->flags |= NR_FLAG_TRAINING;
|
|
|
|
|
+ nr->flags &= ~NR_FLAG_TO_TRANSFER;
|
|
|
|
|
+ pthread_mutex_unlock(&NRPendingTrainingMutex);
|
|
|
|
|
+ return REDISMODULE_OK;
|
|
|
|
|
+}
|
|
|
|
|
+
|
|
|
|
|
+/* Check if there are threads that terminated the NN training, and
|
|
|
|
|
+ * collect the info they computed (that is the new NN). */
|
|
|
|
|
+int NRCollectThreads(RedisModuleCtx *ctx) {
|
|
|
|
|
+ int collected = 0;
|
|
|
|
|
+ pthread_mutex_lock(&NRPendingTrainingMutex);
|
|
|
|
|
+ for (int j = 0; j < NRPendingTrainingCount; j++) {
|
|
|
|
|
+ NRPendingTraining *pt = &NRTrainings[j];
|
|
|
|
|
+ if (pt->in_progress == 0) {
|
|
|
|
|
+ /* Training terminated. Let's see if the key
|
|
|
|
|
+ * is still there and NN ID matches. */
|
|
|
|
|
+ int orig_id = RedisModule_GetSelectedDb(ctx);
|
|
|
|
|
+ if (orig_id != pt->db_id) RedisModule_SelectDb(ctx,pt->db_id);
|
|
|
|
|
+ RedisModuleKey *key = RedisModule_OpenKey(ctx,pt->key,
|
|
|
|
|
+ REDISMODULE_READ|REDISMODULE_WRITE);
|
|
|
|
|
+ if (RedisModule_ModuleTypeGetType(key) == NRType) {
|
|
|
|
|
+ NRTypeObject *nr = RedisModule_ModuleTypeGetValue(key);
|
|
|
|
|
+ if (nr->id == pt->nr->id) {
|
|
|
|
|
+ NRTransferWeights(ctx,nr,pt->nr);
|
|
|
|
|
+ nr->flags &= ~NR_FLAG_TRAINING;
|
|
|
|
|
+ }
|
|
|
|
|
+ RedisModule_FreeString(ctx,pt->key);
|
|
|
|
|
+ pt->key = NULL;
|
|
|
|
|
+ NRTypeReleaseObject(pt->nr);
|
|
|
|
|
+ NRPendingTrainingCount--;
|
|
|
|
|
+ memcpy(&NRTrainings[j],&NRTrainings[j+1],
|
|
|
|
|
+ (NRPendingTrainingCount-j)*sizeof(NRTrainings[0]));
|
|
|
|
|
+ }
|
|
|
|
|
+ if (orig_id != pt->db_id) RedisModule_SelectDb(ctx,orig_id);
|
|
|
|
|
+ collected++;
|
|
|
|
|
+ }
|
|
|
|
|
+ }
|
|
|
|
|
+ pthread_mutex_unlock(&NRPendingTrainingMutex);
|
|
|
|
|
+ return collected;
|
|
|
|
|
+}
|
|
|
|
|
+#endif // 0
|
|
|
|
|
+
|
|
|
|
|
+#define RedisModule_Free(x) sq_free(x, 0)
|
|
|
|
|
+
|
|
|
|
|
+static void *RedisModule_Calloc(size_t nelm, size_t sz)
|
|
|
|
|
+{
|
|
|
|
|
+ size_t malloc_size = nelm * sz;
|
|
|
|
|
+ void *ptr = sq_malloc(malloc_size);
|
|
|
|
|
+ if(ptr) memset(ptr, 0, malloc_size);
|
|
|
|
|
+ return ptr;
|
|
|
|
|
+}
|
|
|
|
|
+
|
|
|
|
|
+static void *RedisModule_Realloc(void *oldPtr, size_t sz)
|
|
|
|
|
+{
|
|
|
|
|
+ void *ptr = sq_realloc(oldPtr, 0, sz);
|
|
|
|
|
+ return ptr;
|
|
|
|
|
+}
|
|
|
|
|
+
|
|
|
|
|
+static uint64_t NRNextId = 1; /* Next neural network unique ID. */
|
|
|
|
|
+
|
|
|
|
|
+long long NRMilliseconds(void) {
|
|
|
|
|
+ struct timeval tv;
|
|
|
|
|
+ long long ust;
|
|
|
|
|
+
|
|
|
|
|
+ gettimeofday(&tv, NULL);
|
|
|
|
|
+ ust = ((long long)tv.tv_sec)*1000000;
|
|
|
|
|
+ ust += tv.tv_usec;
|
|
|
|
|
+ return ust/1000;
|
|
|
|
|
+}
|
|
|
|
|
+
|
|
|
|
|
+/* Create a network with the specified parameters. Note that the layers
|
|
|
|
|
+ * must be specified from the output layer[0] to the input
|
|
|
|
|
+ * layer[N]. Each element in the integer array 'layer' specifies how many
|
|
|
|
|
+ * units there are in the corresponding layer. */
|
|
|
|
|
+static NRTypeObject *createNRTypeObject(int flags, int *layers, int numlayers, int dset_len, int test_len) {
|
|
|
|
|
+ NRTypeObject *o;
|
|
|
|
|
+ o = (NRTypeObject*)RedisModule_Calloc(1,sizeof(*o));
|
|
|
|
|
+ o->id = NRNextId++;
|
|
|
|
|
+ o->flags = flags;
|
|
|
|
|
+ o->nn = AnnCreateNet(numlayers,layers);
|
|
|
|
|
+ o->dataset.maxlen = dset_len;
|
|
|
|
|
+ o->test.maxlen = test_len;
|
|
|
|
|
+ int ilen = ANN_INPUT_UNITS(o->nn);
|
|
|
|
|
+ int olen = ANN_OUTPUT_UNITS(o->nn);
|
|
|
|
|
+ o->inorm = (float*)RedisModule_Calloc(1,sizeof(float)*ilen);
|
|
|
|
|
+ o->onorm = (float*)RedisModule_Calloc(1,sizeof(float)*olen);
|
|
|
|
|
+ for (int j = 0; j < ilen; j++) o->inorm[j] = 1;
|
|
|
|
|
+ for (int j = 0; j < olen; j++) o->onorm[j] = 1;
|
|
|
|
|
+ return o;
|
|
|
|
|
+}
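+
+/* Usage sketch (illustrative only): a normalized regressor with 2 inputs,
+ * one hidden layer of 3 units and 1 output. Because of the output-first
+ * ordering described above, the layers array is {1, 3, 2}:
+ *
+ *   int layers[] = {1, 3, 2};
+ *   NRTypeObject *nr = createNRTypeObject(NR_FLAG_REGRESSOR|NR_FLAG_NORMALIZE,
+ *                                         layers, 3, 100, 50);
+ */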
|
|
|
|
|
+
|
|
|
|
|
+/* Insert data (observations needed to train and test the NN) into the
|
|
|
|
|
+ * NN object. While the learning and testing datasets are not yet full
|
|
|
|
|
+ * the observed pattern is inserted into one or the other in
|
|
|
|
|
+ * order to make sure the two datasets are populated evenly. When both
|
|
|
|
|
+ * are already full, a random element from one or the other (doing
|
|
|
|
|
+ * a random weighted choice depending on the length) is substituted with
|
|
|
|
|
+ * the new item. */
|
|
|
|
|
+#define NR_INSERT_NO_TARGET 0 /* Auto select where to insert. */
|
|
|
|
|
+#define NR_INSERT_TRAIN 1 /* Insert in training dataset. */
|
|
|
|
|
+#define NR_INSERT_TEST 2 /* Insert in testing dataset. */
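+
+/* Worked example of the weighted choice described above (assumed figures):
+ * with dataset.maxlen = 1000 and test.maxlen = 250, once both datasets are
+ * full a new sample replaces a random training entry with probability
+ * 1000/1250 = 0.8 and a random test entry with probability 250/1250 = 0.2. */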
|
|
|
|
|
+static void NRTypeInsertData(NRTypeObject *o, float *inputs, float *outputs,
|
|
|
|
|
+ int target_ds) {
|
|
|
|
|
+ NRDataset *target = NULL;
|
|
|
|
|
+
|
|
|
|
|
+ /* Check if there is no dataset at all. This may be a valid setup
|
|
|
|
|
+ * with online learning, sample by sample. */
|
|
|
|
|
+ if (o->dataset.maxlen == 0 && o->test.maxlen == 0) return;
|
|
|
|
|
+
|
|
|
|
|
+ /* If the user specified a target, select it. */
|
|
|
|
|
+ if (target_ds == NR_INSERT_TRAIN) target = &o->dataset;
|
|
|
|
|
+ else if (target_ds == NR_INSERT_TEST) target = &o->test;
|
|
|
|
|
+
|
|
|
|
|
+ /* If no target is specified, but there is only one possible
|
|
|
|
|
+ * target, select it ASAP. */
|
|
|
|
|
+ if (o->dataset.maxlen == 0) {
|
|
|
|
|
+ target = &o->test;
|
|
|
|
|
+ } else if (o->test.maxlen == 0) {
|
|
|
|
|
+ target = &o->dataset;
|
|
|
|
|
+ }
|
|
|
|
|
+
|
|
|
|
|
+ /* Otherwise choose as the target to populate the dataset with less data
|
|
|
|
|
+ * relative to its size. */
|
|
|
|
|
+ if (target == NULL) {
|
|
|
|
|
+ /* If one of the two datasets is still not full, pick
|
|
|
|
|
+ * based on fill percentage. Otherwise pick a random
|
|
|
|
|
+ * target relatively to their size. */
|
|
|
|
|
+ if (o->dataset.len != o->dataset.maxlen ||
|
|
|
|
|
+ o->test.len != o->test.maxlen)
|
|
|
|
|
+ {
|
|
|
|
|
+ float fill_a = (float)o->dataset.len / o->dataset.maxlen;
|
|
|
|
|
+ float fill_b = (float)o->test.len / o->test.maxlen;
|
|
|
|
|
+ target = (fill_a <= fill_b) ? &o->dataset : &o->test;
|
|
|
|
|
+ } else {
|
|
|
|
|
+ double r = (double)rand()/RAND_MAX;
|
|
|
|
|
+ double sumlen = o->dataset.maxlen + o->test.maxlen;
|
|
|
|
|
+ if (r < (double)o->dataset.maxlen/sumlen) {
|
|
|
|
|
+ target = &o->dataset;
|
|
|
|
|
+ } else {
|
|
|
|
|
+ target = &o->test;
|
|
|
|
|
+ }
|
|
|
|
|
+ }
|
|
|
|
|
+ }
|
|
|
|
|
+
|
|
|
|
|
+ /* Append if there is room or substitute with a random entry. */
|
|
|
|
|
+ size_t idx;
|
|
|
|
|
+ int j, numin = ANN_INPUT_UNITS(o->nn),
|
|
|
|
|
+ numout = ANN_OUTPUT_UNITS(o->nn);
|
|
|
|
|
+
|
|
|
|
|
+ if (target->maxlen == target->len) {
|
|
|
|
|
+ idx = rand() % target->maxlen;
|
|
|
|
|
+ } else {
|
|
|
|
|
+ idx = target->len;
|
|
|
|
|
+ target->len++;
|
|
|
|
|
+ target->inputs = (float*)RedisModule_Realloc(target->inputs,
|
|
|
|
|
+ sizeof(float)*numin*target->len);
|
|
|
|
|
+ target->outputs = (float*)RedisModule_Realloc(target->outputs,
|
|
|
|
|
+ sizeof(float)*numout*target->len);
|
|
|
|
|
+ }
|
|
|
|
|
+
|
|
|
|
|
+ /* Finally store the values at position. */
|
|
|
|
|
+ for (j = 0; j < numin; j++)
|
|
|
|
|
+ target->inputs[idx*numin+j] = inputs[j];
|
|
|
|
|
+ for (j = 0; j < numout; j++)
|
|
|
|
|
+ target->outputs[idx*numout+j] = outputs[j];
|
|
|
|
|
+}
|
|
|
|
|
+
|
|
|
|
|
+/* Free the specified dataset. */
|
|
|
|
|
+void NRDatasetFree(NRDataset *dset) {
|
|
|
|
|
+ RedisModule_Free(dset->inputs);
|
|
|
|
|
+ RedisModule_Free(dset->outputs);
|
|
|
|
|
+}
|
|
|
|
|
+
|
|
|
|
|
+/* Free a whole NN object. */
|
|
|
|
|
+void NRTypeReleaseObject(NRTypeObject *o) {
|
|
|
|
|
+ AnnFree(o->nn);
|
|
|
|
|
+ NRDatasetFree(&o->dataset);
|
|
|
|
|
+ NRDatasetFree(&o->test);
|
|
|
|
|
+ RedisModule_Free(o->inorm);
|
|
|
|
|
+ RedisModule_Free(o->onorm);
|
|
|
|
|
+ RedisModule_Free(o);
|
|
|
|
|
+}
|
|
|
|
|
+
|
|
|
|
|
+static const SQChar sq_nn_TAG[] = _SC("AnnRprop");
|
|
|
|
|
+
|
|
|
|
|
+static SQRESULT sq_nn_release_hook(SQUserPointer p, SQInteger size, void */*ep*/) {
|
|
|
|
|
+ NRTypeObject *self = (NRTypeObject *)p;
|
|
|
|
|
+ if(self) NRTypeReleaseObject(self);
|
|
|
|
|
+ return 0;
|
|
|
|
|
+}
|
|
|
|
|
+
|
|
|
|
|
+/*
|
|
|
|
|
+** Creates a new AnnRprop.
|
|
|
|
|
+*/
|
|
|
|
|
+static SQRESULT sq_nn_constructor (HSQUIRRELVM v) {
|
|
|
|
|
+ SQ_FUNC_VARS(v);
|
|
|
|
|
+ SQ_GET_INTEGER(v, 2, flags);
|
|
|
|
|
+ SQ_GET_INTEGER(v, 3, ninputs);
|
|
|
|
|
+ const SQInteger nhidden_pos = 4;
|
|
|
|
|
+ SQ_GET_INTEGER(v, 5, noutputs);
|
|
|
|
|
+ SQ_OPT_INTEGER(v, 6, ndata, 0);
|
|
|
|
|
+ SQ_OPT_INTEGER(v, 7, ntest, 0);
|
|
|
|
|
+
|
|
|
|
|
+ if(!(
|
|
|
|
|
+ ((flags & NR_FLAG_CLASSIFIER) && !(flags & NR_FLAG_REGRESSOR))
|
|
|
|
|
+ || (!(flags & NR_FLAG_CLASSIFIER) && (flags & NR_FLAG_REGRESSOR))
|
|
|
|
|
+ )
|
|
|
|
|
+ )
|
|
|
|
|
+ return sq_throwerror(v, _SC("invalid neural network type. Must be "
|
|
|
|
|
+ "CLASSIFIER or REGRESSOR"));
|
|
|
|
|
+
|
|
|
|
|
+ int layers[NR_MAX_LAYERS], num_layers=0;
|
|
|
|
|
+ layers[num_layers++] = noutputs;
|
|
|
|
|
+
|
|
|
|
|
+ /* Our NN library takes the definition of layers in the opposite
|
|
|
|
|
+ * order, so read the hidden layers array in reverse. */
|
|
|
|
|
+ SQInteger asize = sq_getsize(v, nhidden_pos);
|
|
|
|
|
+ for(int i=asize-1; i >= 0; --i)
|
|
|
|
|
+ {
|
|
|
|
|
+ sq_pushinteger(v, i);
|
|
|
|
|
+ sq_get(v, nhidden_pos);
|
|
|
|
|
+ SQInteger nhidden;
|
|
|
|
|
+ SQRESULT rc = sq_getinteger(v, -1, &nhidden);
|
|
|
|
|
+ if(rc != SQ_OK) return sq_throwerror(v, _SC("only integers expected on hidden layers array"));
|
|
|
|
|
+ layers[num_layers++] = nhidden;
|
|
|
|
|
+ sq_poptop(v);
|
|
|
|
|
+ }
|
|
|
|
|
+
|
|
|
|
|
+ layers[num_layers++] = ninputs;
|
|
|
|
|
+ //for(int i=0; i < num_layers; ++i) printf("layers %d : %d\n", i, layers[i]);
|
|
|
|
|
+
|
|
|
|
|
+ NRTypeObject *self = createNRTypeObject(flags, layers, num_layers, ndata, ntest);
|
|
|
|
|
+
|
|
|
|
|
+ if(self){
|
|
|
|
|
+ self->flags = flags;
|
|
|
|
|
+ sq_setinstanceup(v, 1, self);
|
|
|
|
|
+ sq_setreleasehook(v, 1, sq_nn_release_hook);
|
|
|
|
|
+ return 1;
|
|
|
|
|
+ }
|
|
|
|
|
|
|
|
|
|
+ return sq_throwerror(v, _SC("failed to create AnnRprop"));
|
|
|
|
|
+}
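+
+/* Squirrel-side construction sketch (a guess at typical usage; it assumes
+ * the class is registered under the name "AnnRprop" by sqext_register_nn
+ * and that the flag constants are reachable through the class):
+ *
+ *   // classifier: 2 inputs, hidden layers [5, 3], 4 output classes,
+ *   // up to 1000 training samples and 500 test samples
+ *   local nn = AnnRprop(AnnRprop.CLASSIFIER | AnnRprop.NORMALIZE,
+ *                       2, [5, 3], 4, 1000, 500);
+ */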
|
|
|
|
|
+
|
|
|
|
|
+#define SQ_GET_NN_INSTANCE(v, at) SQ_GET_INSTANCE_VAR(v, at, NRTypeObject, self, sq_nn_TAG)
|
|
|
|
|
+
|
|
|
|
|
+static SQRESULT sq_nn_observe(HSQUIRRELVM v)
|
|
|
|
|
+{
|
|
|
|
|
+ SQ_FUNC_VARS(v);
|
|
|
|
|
+ SQ_GET_NN_INSTANCE(v, 1);
|
|
|
|
|
+ SQ_OPT_INTEGER(v, 4, target, NR_INSERT_NO_TARGET);
|
|
|
|
|
+
|
|
|
|
|
+ SQInteger ilen = ANN_INPUT_UNITS(self->nn);
|
|
|
|
|
+ SQInteger olen = ANN_OUTPUT_UNITS(self->nn);
|
|
|
|
|
+ SQInteger oargs = (self->flags & NR_FLAG_CLASSIFIER) ? 1 : olen;
|
|
|
|
|
+
|
|
|
|
|
+ const SQInteger inputs_pos = 2;
|
|
|
|
|
+ const SQInteger outputs_pos = 3;
|
|
|
|
|
+
|
|
|
|
|
+ SQInteger asize_inputs = sq_getsize(v, inputs_pos);
|
|
|
|
|
+ SQInteger asize_outputs = sq_getsize(v, outputs_pos);
|
|
|
|
|
+
|
|
|
|
|
+ if((ilen != asize_inputs) || (oargs != asize_outputs))
|
|
|
|
|
+ return sq_throwerror(v, _SC( "number of arguments does not "
|
|
|
|
|
+ "match the number of " _PRINT_INT_FMT " inputs and " _PRINT_INT_FMT " outputs in the neural network"),
|
|
|
|
|
+ ilen, oargs);
|
|
|
|
|
+
|
|
|
|
|
+ const SQInteger inputs_alloc_size = sizeof(float)*ilen;
|
|
|
|
|
+ const SQInteger outputs_alloc_size = sizeof(float)*olen;
|
|
|
|
|
+
|
|
|
|
|
+ float *inputs = (float*)sq_malloc(inputs_alloc_size);
|
|
|
|
|
+ for(SQInteger i=0; i < ilen; ++i)
|
|
|
|
|
+ {
|
|
|
|
|
+ sq_pushinteger(v, i);
|
|
|
|
|
+ sq_get(v, inputs_pos);
|
|
|
|
|
+ SQFloat fnum;
|
|
|
|
|
+ SQRESULT rc = sq_getfloat(v, -1, &fnum);
|
|
|
|
|
+ if(rc != SQ_OK)
|
|
|
|
|
+ {
|
|
|
|
|
+ sq_free(inputs, inputs_alloc_size);
|
|
|
|
|
+ return sq_throwerror(v, _SC("only numbers expected on input array"));
|
|
|
|
|
+ }
|
|
|
|
|
+ inputs[i] = fnum;
|
|
|
|
|
+ sq_poptop(v);
|
|
|
|
|
+ }
|
|
|
|
|
+
|
|
|
|
|
+ float *outputs = (float*)sq_malloc(outputs_alloc_size);
|
|
|
|
|
+ for(SQInteger i=0; i < oargs; ++i)
|
|
|
|
|
+ {
|
|
|
|
|
+ sq_pushinteger(v, i);
|
|
|
|
|
+ sq_get(v, outputs_pos);
|
|
|
|
|
+ SQFloat fnum;
|
|
|
|
|
+ SQRESULT rc = sq_getfloat(v, -1, &fnum);
|
|
|
|
|
+ if(rc != SQ_OK)
|
|
|
|
|
+ {
|
|
|
|
|
+ sq_free(inputs, inputs_alloc_size);
|
|
|
|
|
+ sq_free(outputs, outputs_alloc_size);
|
|
|
|
|
+ return sq_throwerror(v, _SC("only numbers expected on output array"));
|
|
|
|
|
+ }
|
|
|
|
|
+ if (self->flags & NR_FLAG_CLASSIFIER) {
|
|
|
|
|
+ int classid = fnum;
|
|
|
|
|
+ if (classid != fnum || fnum >= olen || fnum < 0) {
|
|
|
|
|
+ sq_free(inputs, inputs_alloc_size);
|
|
|
|
|
+ sq_free(outputs, outputs_alloc_size);
|
|
|
|
|
+ return sq_throwerror(v, _SC("classifier network output must be an integer "
|
|
|
|
|
+ "in the range from 0 to outputs-1."));
|
|
|
|
|
+ }
|
|
|
|
|
+ memset(outputs,0, outputs_alloc_size);
|
|
|
|
|
+ outputs[classid] = 1;
|
|
|
|
|
+ } else {
|
|
|
|
|
+ outputs[i] = fnum;
|
|
|
|
|
+ }
|
|
|
|
|
+
|
|
|
|
|
+ sq_poptop(v);
|
|
|
|
|
+ }
|
|
|
|
|
+
|
|
|
|
|
+ NRTypeInsertData(self,inputs,outputs,target);
|
|
|
|
|
+ sq_free(inputs, inputs_alloc_size);
|
|
|
|
|
+ sq_free(outputs, outputs_alloc_size);
|
|
|
|
|
+
|
|
|
|
|
+ return 0;
|
|
|
|
|
+}
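+
+/* Observation sketch (illustrative; argument shapes follow the checks above):
+ *
+ *   // regressor with 2 inputs / 1 output: one value per output unit
+ *   nn.observe([0.5, 1.5], [2.0]);
+ *   // classifier: pass the class ID (0..noutputs-1) as the single output
+ *   nn.observe([0.5, 1.5], [3]);
+ *   // force the sample into the test dataset (assumed constant name)
+ *   nn.observe([0.5, 1.5], [3], AnnRprop.INSERT_TEST);
+ */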
|
|
|
|
|
+
|
|
|
|
|
+static SQRESULT sq_nn_train(HSQUIRRELVM v)
|
|
|
|
|
+{
|
|
|
|
|
+ SQ_FUNC_VARS(v);
|
|
|
|
|
+ SQ_GET_NN_INSTANCE(v, 1);
|
|
|
|
|
+ SQ_OPT_INTEGER(v, 2, opt_max_cycles, 0);
|
|
|
|
|
+ SQ_OPT_INTEGER(v, 3, opt_max_ms, 10000);
|
|
|
|
|
+ SQ_OPT_INTEGER(v, 4, opt_flags, 0);
|
|
|
|
|
+
|
|
|
|
|
+ NRTypeObject *nr = self;
|
|
|
|
|
+
|
|
|
|
|
+ nr->training_max_cycles = opt_max_cycles;
|
|
|
|
|
+ nr->training_max_ms = opt_max_ms;
|
|
|
|
|
+ if(opt_flags & NR_FLAG_AUTO_STOP) nr->flags |= NR_FLAG_AUTO_STOP;
|
|
|
|
|
+ if(opt_flags & NR_FLAG_BACKTRACK) nr->flags |= NR_FLAG_BACKTRACK;
|
|
|
|
|
+
|
|
|
|
|
+ /* Overfitting detection compares error rate in testing/training data,
|
|
|
|
|
+ * so does not work without entries in the testing dataset. */
|
|
|
|
|
+ if (nr->flags & NR_FLAG_AUTO_STOP && nr->test.len == 0) {
|
|
|
|
|
+ return sq_throwerror(v, _SC("Can't start training with AUTOSTOP option: "
|
|
|
|
|
+ "overfitting detection requires a non zero length testing dataset"));
|
|
|
|
|
+ }
|
|
|
|
|
+
|
|
|
|
|
+ int training_iterations = 1;
|
|
|
|
|
+ float train_error = 0;
|
|
|
|
|
+ float test_error = 0;
|
|
|
|
|
+ float class_error = 0;
|
|
|
|
|
+ float past_train_error = 1.0/0.0;
|
|
|
|
|
+ float past_test_error = 1.0/0.0;
|
|
|
|
|
+ int auto_stop = nr->flags & NR_FLAG_AUTO_STOP;
|
|
|
|
|
+ int backtrack = nr->flags & NR_FLAG_BACKTRACK;
|
|
|
|
|
+
|
|
|
|
|
+ uint64_t cycles = 0;
|
|
|
|
|
+ long long start = NRMilliseconds();
|
|
|
|
|
+ long long cycle_time;
|
|
|
|
|
+ int overfitting_count = 0;
|
|
|
|
|
+ int overfitting_limit = 5;
|
|
|
|
|
+ float best_test_error = 1.0/0.0;
|
|
|
|
|
+
|
|
|
|
|
+ nr->flags &= ~NR_FLAG_TO_TRANSFER;
|
|
|
|
|
+
|
|
|
|
|
+ /* If the network is auto normalized, we need to transform the inputs
|
|
|
|
|
+ * in a way that's acceptable for the NN. We just find the maximum
|
|
|
|
|
+ * absolute value, and divide by it, to get a -1,1 range. There
|
|
|
|
|
+ * are more advanced transformations that are usually performed that
|
|
|
|
|
+ * could be implemented in the future.
|
|
|
|
|
+ *
|
|
|
|
|
+ * Note that we compute the normalization vectors for all the inputs
|
|
|
|
|
+ * and outputs, however if the network is a classifier, flagged with
|
|
|
|
|
+ * (NR_FLAG_CLASSIFIER), no output normalization will be done since
|
|
|
|
|
+ * the data is already in 0/1 format. */
|
|
|
|
|
+ if ((nr->flags & NR_FLAG_NORMALIZE) && nr->dataset.len) {
|
|
|
|
|
+ int ilen = ANN_INPUT_UNITS(nr->nn);
|
|
|
|
|
+ int olen = ANN_OUTPUT_UNITS(nr->nn);
|
|
|
|
|
+ float *imax = nr->inorm;
|
|
|
|
|
+ float *omax = nr->onorm;
|
|
|
|
|
+ float *inputs = nr->dataset.inputs;
|
|
|
|
|
+ float *outputs = nr->dataset.outputs;
|
|
|
|
|
+ for (int i = 0; i < ilen; i++) imax[i] = 1;
|
|
|
|
|
+ for (int i = 0; i < olen; i++) omax[i] = 1;
|
|
|
|
|
+
|
|
|
|
|
+ /* Compute the max values vectors. */
|
|
|
|
|
+ for (uint32_t j = 0; j < nr->dataset.len; j++) {
|
|
|
|
|
+ for (int i = 0; i < ilen; i++)
|
|
|
|
|
+ if (fabs(inputs[i]) > imax[i]) imax[i] = fabs(inputs[i]);
|
|
|
|
|
+ for (int i = 0; i < olen; i++)
|
|
|
|
|
+ if (fabs(outputs[i]) > omax[i]) omax[i] = fabs(outputs[i]);
|
|
|
|
|
+ inputs += ilen;
|
|
|
|
|
+ outputs += olen;
|
|
|
|
|
+ }
|
|
|
|
|
+
|
|
|
|
|
+ /* Likely we are not seeing what will really be the true input/output
|
|
|
|
|
+ * maximum value, so we multiply the maximum values found by a constant.
|
|
|
|
|
+ * However if the max is exactly "1" we assume it's a classification
|
|
|
|
|
+ * input and don't alter it. */
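+ /* Worked example (assumed figures): if the largest absolute value seen for
+ * an input unit is 50, its factor becomes 50*1.2 = 60, so a value of 30 is
+ * later presented to the network as 30/60 = 0.5. */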
|
|
|
|
|
+ for (int i = 0; i < ilen; i++) if (imax[i] != 1) imax[i] *= 1.2;
|
|
|
|
|
+ for (int i = 0; i < olen; i++) if (omax[i] != 1) omax[i] *= 1.2;
|
|
|
|
|
+
|
|
|
|
|
+ /* We can normalize the dataset directly: after the training it will
|
|
|
|
|
+ * be discarded anyway. */
|
|
|
|
|
+ inputs = nr->dataset.inputs;
|
|
|
|
|
+ outputs = nr->dataset.outputs;
|
|
|
|
|
+ for (uint32_t j = 0; j < nr->dataset.len; j++) {
|
|
|
|
|
+ for (int i = 0; i < ilen; i++) inputs[i] /= nr->inorm[i];
|
|
|
|
|
+ if (!(nr->flags & NR_FLAG_CLASSIFIER))
|
|
|
|
|
+ for (int i = 0; i < olen; i++) outputs[i] /= nr->onorm[i];
|
|
|
|
|
+ inputs += ilen;
|
|
|
|
|
+ outputs += olen;
|
|
|
|
|
+ }
|
|
|
|
|
+
|
|
|
|
|
+ inputs = nr->test.inputs;
|
|
|
|
|
+ outputs = nr->test.outputs;
|
|
|
|
|
+ for (uint32_t j = 0; j < nr->test.len; j++) {
|
|
|
|
|
+ for (int i = 0; i < ilen; i++) inputs[i] /= nr->inorm[i];
|
|
|
|
|
+ if (!(nr->flags & NR_FLAG_CLASSIFIER))
|
|
|
|
|
+ for (int i = 0; i < olen; i++) outputs[i] /= nr->onorm[i];
|
|
|
|
|
+ inputs += ilen;
|
|
|
|
|
+ outputs += olen;
|
|
|
|
|
+ }
|
|
|
|
|
+ }
|
|
|
|
|
+
|
|
|
|
|
+ AnnRprop *saved = NULL; /* Saved to recover on overfitting. */
|
|
|
|
|
+ float saved_error; /* The test error of the saved NN. */
|
|
|
|
|
+ float saved_train_error; /* The training dataset error of the saved NN */
|
|
|
|
|
+ float saved_class_error; /* The % of classification errors of saved NN */
|
|
|
|
|
+
|
|
|
|
|
+ while(1) {
|
|
|
|
|
+ long long cycle_start = NRMilliseconds();
|
|
|
|
|
+
|
|
|
|
|
+ train_error = AnnTrain(nr->nn,
|
|
|
|
|
+ nr->dataset.inputs,
|
|
|
|
|
+ nr->dataset.outputs,
|
|
|
|
|
+ 0,
|
|
|
|
|
+ training_iterations,
|
|
|
|
|
+ nr->dataset.len,
|
|
|
|
|
+ ANN_ALGO_BPROP);
|
|
|
|
|
+ cycle_time = NRMilliseconds() - cycle_start;
|
|
|
|
|
+ nr->training_total_steps += nr->dataset.len*training_iterations;
|
|
|
|
|
+
|
|
|
|
|
+ /* Evaluate the error in the case of auto training, stop it
|
|
|
|
|
+ * once we see that the error in the training set is decreasing
|
|
|
|
|
+ * while the one in the test set is not. */
|
|
|
|
|
+ if (auto_stop) {
|
|
|
|
|
+ AnnTestError(nr->nn,
|
|
|
|
|
+ nr->test.inputs,
|
|
|
|
|
+ nr->test.outputs,
|
|
|
|
|
+ nr->test.len, &test_error, &class_error);
|
|
|
|
|
+
|
|
|
|
|
+ if (train_error < past_train_error &&
|
|
|
|
|
+ test_error > past_test_error)
|
|
|
|
|
+ {
|
|
|
|
|
+ overfitting_count++;
|
|
|
|
|
+ #ifdef NR_TRAINING_DEBUG
|
|
|
|
|
+ printf("+YCLE %lld: [%d] %f VS %f\n", (long long)cycles,
|
|
|
|
|
+ overfitting_count, train_error, test_error);
|
|
|
|
|
+ #endif
|
|
|
|
|
+ if (overfitting_count == overfitting_limit) {
|
|
|
|
|
+ nr->flags |= NR_FLAG_OF_DETECTED;
|
|
|
|
|
+ break;
|
|
|
|
|
+ }
|
|
|
|
|
+ } else if (overfitting_count > 0) {
|
|
|
|
|
+ #ifdef NR_TRAINING_DEBUG
|
|
|
|
|
+ printf("-YCLE %lld: [%d] %f VS %f\n", (long long)cycles,
|
|
|
|
|
+ overfitting_count, train_error, test_error);
|
|
|
|
|
+ #endif
|
|
|
|
|
+ overfitting_count--;
|
|
|
|
|
+ }
|
|
|
|
|
+
|
|
|
|
|
+ /* Save all the networks with a score better than the currently
|
|
|
|
|
+ * saved network. This can be a bit costly, but is safe: one
|
|
|
|
|
+ * more training cycle and overfitting can ruin it all. */
|
|
|
|
|
+ if (backtrack && (saved == NULL || test_error < saved_error)) {
|
|
|
|
|
+ #ifdef NR_TRAINING_DEBUG
|
|
|
|
|
+ printf("SAVED! %f < %f\n", test_error, saved_error);
|
|
|
|
|
+ #endif
|
|
|
|
|
+ saved_error = test_error;
|
|
|
|
|
+ saved_train_error = train_error;
|
|
|
|
|
+ saved_class_error = class_error;
|
|
|
|
|
+ if (saved) AnnFree(saved);
|
|
|
|
|
+ saved = AnnClone(nr->nn);
|
|
|
|
|
+ }
|
|
|
|
|
+
|
|
|
|
|
+ /* Best network found? Reset the overfitting hints counter. */
|
|
|
|
|
+ if (test_error < best_test_error) {
|
|
|
|
|
+ overfitting_count = 0;
|
|
|
|
|
+ best_test_error = test_error;
|
|
|
|
|
+ #ifdef NR_TRAINING_DEBUG
|
|
|
|
|
+ printf("BEST! %lld: <%d> %f VS %f\n", (long long)cycles,
|
|
|
|
|
+ overfitting_limit,train_error, test_error);
|
|
|
|
|
+ #endif
|
|
|
|
|
+ }
|
|
|
|
|
+
|
|
|
|
|
+ /* Also stop if the loss is zero in both datasets. */
|
|
|
|
|
+ if (train_error < 0.000000000000001 &&
|
|
|
|
|
+ test_error < 0.000000000000001) break;
|
|
|
|
|
+ }
|
|
|
|
|
+
|
|
|
|
|
+ cycles++;
|
|
|
|
|
+ long long total_time = NRMilliseconds()-start;
|
|
|
|
|
+
|
|
|
|
|
+ /* Cycles and milliseconds stop conditions. */
|
|
|
|
|
+ if (nr->training_max_cycles && cycles == nr->training_max_cycles)
|
|
|
|
|
+ break;
|
|
|
|
|
+ if (nr->training_max_ms && total_time > (long long)nr->training_max_ms)
|
|
|
|
|
+ break;
|
|
|
|
|
+
|
|
|
|
|
+ /* If this is a long training, doing just a single training iteration
|
|
|
|
|
+ * per cycle is not optimal: tune the number of iterations so that
|
|
|
|
|
+ * each cycle takes at least 100 milliseconds. */
|
|
|
|
|
+ if (total_time > 10000 && cycle_time < 100) training_iterations++;
|
|
|
|
|
+
|
|
|
|
|
+ past_train_error = train_error;
|
|
|
|
|
+ past_test_error = test_error;
|
|
|
|
|
+ }
|
|
|
|
|
+
|
|
|
|
|
+ /* If auto stop is disabled, we still need to compute the test error
|
|
|
|
|
+ * in order to return this information to the main thread. */
|
|
|
|
|
+ if (!auto_stop) {
|
|
|
|
|
+ AnnTestError(nr->nn,
|
|
|
|
|
+ nr->test.inputs,
|
|
|
|
|
+ nr->test.outputs,
|
|
|
|
|
+ nr->test.len, &test_error, &class_error);
|
|
|
|
|
+ }
|
|
|
|
|
+
|
|
|
|
|
+ /* If both autostop and backtracking are enabled, we may have
|
|
|
|
|
+ * a better network saved! */
|
|
|
|
|
+ if (auto_stop && backtrack) {
|
|
|
|
|
+ if (saved && saved_error < test_error) {
|
|
|
|
|
+ #ifdef NR_TRAINING_DEBUG
|
|
|
|
|
+ printf("BACKTRACK: Saved network used!\n");
|
|
|
|
|
+ #endif
|
|
|
|
|
+ AnnFree(nr->nn);
|
|
|
|
|
+ nr->nn = saved;
|
|
|
|
|
+ test_error = saved_error;
|
|
|
|
|
+ train_error = saved_train_error;
|
|
|
|
|
+ class_error = saved_class_error;
|
|
|
|
|
+ } else if (saved) {
|
|
|
|
|
+ AnnFree(saved);
|
|
|
|
|
+ }
|
|
|
|
|
+ }
|
|
|
|
|
+
|
|
|
|
|
+ if (nr->flags & NR_FLAG_CLASSIFIER) nr->test_class_error = class_error;
|
|
|
|
|
+ nr->dataset_error = train_error;
|
|
|
|
|
+ nr->test_error = test_error;
|
|
|
|
|
+ nr->training_total_ms += NRMilliseconds()-start;
|
|
|
|
|
+
|
|
|
|
|
+ return 0;
|
|
|
|
|
+}
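+
+/* Training call sketch (illustrative; flag names assumed to be reachable
+ * through the class as registered by sqext_register_nn):
+ *
+ *   // at most 500 cycles or 5 seconds, stop early on overfitting and keep
+ *   // the best network seen on the test dataset
+ *   nn.train(500, 5000, AnnRprop.AUTO_STOP | AnnRprop.BACKTRACK);
+ */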
|
|
|
|
|
+
|
|
|
|
|
+static SQRESULT sq_nn_run(HSQUIRRELVM v)
|
|
|
|
|
+{
|
|
|
|
|
+ SQ_FUNC_VARS_NO_TOP(v);
|
|
|
|
|
+ SQ_GET_NN_INSTANCE(v, 1);
|
|
|
|
|
+
|
|
|
|
|
+ SQInteger asize_inputs = sq_getsize(v, 2);
|
|
|
|
|
+ SQInteger ilen = ANN_INPUT_UNITS(self->nn);
|
|
|
|
|
+ if(ilen != asize_inputs)
|
|
|
|
|
+ return sq_throwerror(v, _SC("wrong number of inputs " _PRINT_INT_FMT " for expected " _PRINT_INT_FMT), asize_inputs, ilen);
|
|
|
|
|
+
|
|
|
|
|
+ for(SQInteger i=0; i < ilen; ++i)
|
|
|
|
|
+ {
|
|
|
|
|
+ sq_pushinteger(v, i);
|
|
|
|
|
+ sq_get(v, 2);
|
|
|
|
|
+ SQFloat fnum;
|
|
|
|
|
+ SQRESULT rc = sq_getfloat(v, -1, &fnum);
|
|
|
|
|
+ if(rc != SQ_OK)
|
|
|
|
|
+ {
|
|
|
|
|
+ return sq_throwerror(v, _SC("only numbers expected on input array"));
|
|
|
|
|
+ }
|
|
|
|
|
+ if (self->flags & NR_FLAG_NORMALIZE) fnum /= self->inorm[i];
|
|
|
|
|
+ ANN_INPUT_NODE(self->nn,i) = fnum;
|
|
|
|
|
+ sq_poptop(v);
|
|
|
|
|
+ }
|
|
|
|
|
+ AnnSimulate(self->nn);
|
|
|
|
|
+
|
|
|
|
|
+ /* Return the raw network output, denormalizing it when the network
|
|
|
|
|
+ * is a normalized regressor. */
|
|
|
|
|
+ int olen = ANN_OUTPUT_UNITS(self->nn);
|
|
|
|
|
+ sq_newarray(v, olen);
|
|
|
|
|
+ for(int j = 0; j < olen; j++) {
|
|
|
|
|
+ float output = ANN_OUTPUT_NODE(self->nn,j);
|
|
|
|
|
+ if (!(self->flags & NR_FLAG_CLASSIFIER) &&
|
|
|
|
|
+ (self->flags & NR_FLAG_NORMALIZE))
|
|
|
|
|
+ {
|
|
|
|
|
+ output *= self->onorm[j];
|
|
|
|
|
+ }
|
|
|
|
|
+ sq_pushfloat(v, output);
|
|
|
|
|
+ sq_arrayset(v, -2, j);
|
|
|
|
|
+ }
|
|
|
|
|
+
|
|
|
|
|
+ return 1;
|
|
|
|
|
+}
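+
+/* Run sketch (illustrative): one value per input unit in, an array with one
+ * (denormalized) value per output unit out:
+ *
+ *   local out = nn.run([0.5, 1.5]);   // e.g. [0.73] for a single-output net
+ */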
|
|
|
|
|
+
|
|
|
|
|
+static SQRESULT sq_nn_classify(HSQUIRRELVM v)
|
|
|
|
|
+{
|
|
|
|
|
+ SQ_FUNC_VARS_NO_TOP(v);
|
|
|
|
|
+ SQ_GET_NN_INSTANCE(v, 1);
|
|
|
|
|
+
|
|
|
|
|
+ if (!(self->flags & NR_FLAG_CLASSIFIER))
|
|
|
|
|
+ return sq_throwerror(v, _SC("you can't call classify with a regressor network."));
|
|
|
|
|
+
|
|
|
|
|
+ SQInteger asize_inputs = sq_getsize(v, 2);
|
|
|
|
|
+ SQInteger ilen = ANN_INPUT_UNITS(self->nn);
|
|
|
|
|
+ if(ilen != asize_inputs)
|
|
|
|
|
+ return sq_throwerror(v, _SC("wrong number of inputs %d for expected %d"), (int)asize_inputs, (int)ilen);
|
|
|
|
|
+
|
|
|
|
|
+ for(SQInteger i=0; i < ilen; ++i)
|
|
|
|
|
+ {
|
|
|
|
|
+ sq_pushinteger(v, i);
|
|
|
|
|
+ sq_get(v, 2);
|
|
|
|
|
+ SQFloat fnum;
|
|
|
|
|
+ SQRESULT rc = sq_getfloat(v, -1, &fnum);
|
|
|
|
|
+ if(rc != SQ_OK)
|
|
|
|
|
+ {
|
|
|
|
|
+ return sq_throwerror(v, _SC("only numbers expected on input array"));
|
|
|
|
|
+ }
|
|
|
|
|
+ if (self->flags & NR_FLAG_NORMALIZE) fnum /= self->inorm[i];
|
|
|
|
|
+ ANN_INPUT_NODE(self->nn,i) = fnum;
|
|
|
|
|
+ sq_poptop(v);
|
|
|
|
|
+ }
|
|
|
|
|
+ AnnSimulate(self->nn);
|
|
|
|
|
+
|
|
|
|
|
+ /* Return the ID of the class whose output unit has the highest
|
|
|
|
|
+ * activation. */
|
|
|
|
|
+ int olen = ANN_OUTPUT_UNITS(self->nn);
|
|
|
|
|
+ float fmax = ANN_OUTPUT_NODE(self->nn,0);
|
|
|
|
|
+ int max_class = 0;
|
|
|
|
|
+ for(int j = 1; j < olen; j++) {
|
|
|
|
|
+ float output = ANN_OUTPUT_NODE(self->nn,j);
|
|
|
|
|
+ if (output > fmax) {
|
|
|
|
|
+ fmax = output;
|
|
|
|
|
+ max_class = j;
|
|
|
|
|
+ }
|
|
|
|
|
+ }
|
|
|
|
|
+ sq_pushinteger(v, max_class);
|
|
|
|
|
+
|
|
|
|
|
+ return 1;
|
|
|
|
|
+}
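+
+/* Classification sketch (illustrative): returns the index of the output
+ * unit with the highest activation:
+ *
+ *   local cls = nn.classify([0.5, 1.5]);   // integer in 0..noutputs-1
+ */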
|
|
|
|
|
+
|
|
|
|
|
+#define ADD_T_TABLE_STR(sk, sv) \
|
|
|
|
|
+ sq_pushstring(v, sk, -1); \
|
|
|
|
|
+ sq_pushstring(v, sv, -1); \
|
|
|
|
|
+ sq_rawset(v, -3);
|
|
|
|
|
+
|
|
|
|
|
+#define ADD_T_TABLE_INT(sk, sv) \
|
|
|
|
|
+ sq_pushstring(v, sk, -1); \
|
|
|
|
|
+ sq_pushinteger(v, sv); \
|
|
|
|
|
+ sq_rawset(v, -3);
|
|
|
|
|
+
|
|
|
|
|
+#define ADD_T_TABLE_FLOAT(sk, sv) \
|
|
|
|
|
+ sq_pushstring(v, sk, -1); \
|
|
|
|
|
+ sq_pushfloat(v, sv); \
|
|
|
|
|
+ sq_rawset(v, -3);
|
|
|
|
|
+
|
|
|
|
|
+static SQRESULT sq_nn_info(HSQUIRRELVM v)
|
|
|
|
|
+{
|
|
|
|
|
+ SQ_FUNC_VARS_NO_TOP(v);
|
|
|
|
|
+ SQ_GET_NN_INSTANCE(v, 1);
|
|
|
|
|
+
|
|
|
|
|
+ sq_newtable(v);
|
|
|
|
|
+
|
|
|
|
|
+ ADD_T_TABLE_INT("id", self->id);
|
|
|
|
|
+ ADD_T_TABLE_STR("type", (self->flags & NR_FLAG_CLASSIFIER) ? "classifier" : "regressor");
|
|
|
|
|
+ ADD_T_TABLE_INT("auto-normalization", !!(self->flags & NR_FLAG_NORMALIZE));
|
|
|
|
|
+ ADD_T_TABLE_INT("training", !!(self->flags & NR_FLAG_TRAINING));
|
|
|
|
|
+
|
|
|
|
|
+ sq_pushliteral(v, _SC("layout"));
|
|
|
|
|
+ sq_newarray(v, ANN_LAYERS(self->nn));
|
|
|
|
|
+ for (int ai=0, i = ANN_LAYERS(self->nn)-1; i >= 0; i--, ++ai) {
|
|
|
|
|
+ int units = ANN_UNITS(self->nn,i);
|
|
|
|
|
+ if (i != 0) units--; /* Don't count the bias unit. */
|
|
|
|
|
+ sq_pushinteger(v, units);
|
|
|
|
|
+ sq_arrayset(v, -2, ai);
|
|
|
|
|
+ }
|
|
|
|
|
+ sq_rawset(v, -3);
|
|
|
|
|
+
|
|
|
|
|
+ ADD_T_TABLE_INT("training-dataset-maxlen", self->dataset.maxlen);
|
|
|
|
|
+ ADD_T_TABLE_INT("training-dataset-len", self->dataset.len);
|
|
|
|
|
+ ADD_T_TABLE_INT("test-dataset-maxlen", self->test.maxlen);
|
|
|
|
|
+ ADD_T_TABLE_INT("test-dataset-len", self->test.len);
|
|
|
|
|
+ ADD_T_TABLE_INT("training-total-steps", self->training_total_steps);
|
|
|
|
|
+ ADD_T_TABLE_INT("training-total-cycles", self->dataset.len ?
|
|
|
|
|
+ (self->training_total_steps / self->dataset.len) : 0);
|
|
|
|
|
+
|
|
|
|
|
+ float tms = (float)self->training_total_ms/1000;
|
|
|
|
|
+ ADD_T_TABLE_FLOAT("training-total-seconds", tms);
|
|
|
|
|
+ ADD_T_TABLE_FLOAT("dataset-error", self->dataset_error);
|
|
|
|
|
+ ADD_T_TABLE_FLOAT("test-error", self->test_error);
|
|
|
|
|
+
|
|
|
|
|
+ if (self->flags & NR_FLAG_CLASSIFIER) {
|
|
|
|
|
+ ADD_T_TABLE_FLOAT("classification-errors-perc", self->test_class_error);
|
|
|
|
|
+ }
|
|
|
|
|
+
|
|
|
|
|
+ ADD_T_TABLE_STR("overfitting-detected", (self->flags & NR_FLAG_OF_DETECTED) ? "yes" : "no");
|
|
|
|
|
+
|
|
|
|
|
+ return 1;
|
|
|
|
|
+}
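+
+/* Info sketch (illustrative): the returned table mirrors the fields filled
+ * in above, e.g.
+ *
+ *   local info = nn.info();
+ *   print(format("%s net, test error %f\n", info["type"], info["test-error"]));
+ */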
|
|
|
|
|
+
|
|
|
|
|
+static SQRESULT sq_nn_clone(HSQUIRRELVM v)
|
|
|
|
|
+{
|
|
|
|
|
+ SQ_FUNC_VARS_NO_TOP(v);
|
|
|
|
|
+ SQ_GET_NN_INSTANCE(v, 1);
|
|
|
|
|
+ AnnRprop *clone = AnnClone(self->nn);
|
|
|
|
|
+ if(clone)
|
|
|
|
|
+ {
|
|
|
|
|
+ sq_pushstring(v, sq_nn_TAG, -1);
|
|
|
|
|
+ if(sq_getonregistrytable(v) == SQ_ERROR) return SQ_ERROR;
|
|
|
|
|
+ sq_createinstance(v, -1);
|
|
|
|
|
+ sq_setinstanceup(v, -1, clone);
|
|
|
|
|
+ sq_setreleasehook(v, -1, sq_nn_release_hook);
|
|
|
|
|
+ }
|
|
|
|
|
+ else sq_pushnull(v);
|
|
|
|
|
+ return 1;
|
|
|
|
|
+}
|
|
|
|
|
+
|
|
|
|
|
+#define SQ_NN_GET_SET_FLOAT(func_name) \
|
|
|
|
|
+static SQRESULT sq_nn_##func_name(HSQUIRRELVM v)\
|
|
|
|
|
+{\
|
|
|
|
|
+ SQ_FUNC_VARS(v);\
|
|
|
|
|
+ SQ_GET_NN_INSTANCE(v, 1);\
|
|
|
|
|
+ if(_top_ == 1)\
|
|
|
|
|
+ {\
|
|
|
|
|
+ sq_pushfloat(v, self->nn->func_name);\
|
|
|
|
|
+ return 1;\
|
|
|
|
|
+ }\
|
|
|
|
|
+ SQ_GET_FLOAT(v, 2, func_name);\
|
|
|
|
|
+ self->nn->func_name = func_name;\
|
|
|
|
|
+ return 0;\
|
|
|
|
|
+}
|
|
|
|
|
+
|
|
|
|
|
+SQ_NN_GET_SET_FLOAT(learn_rate);
|
|
|
|
|
+SQ_NN_GET_SET_FLOAT(rprop_nminus);
|
|
|
|
|
+SQ_NN_GET_SET_FLOAT(rprop_nplus);
|
|
|
|
|
+SQ_NN_GET_SET_FLOAT(rprop_maxupdate);
|
|
|
|
|
+SQ_NN_GET_SET_FLOAT(rprop_minupdate);
|
|
|
|
|
+
|
|
|
|
|
+static SQRESULT sq_nn_flags(HSQUIRRELVM v)
|
|
|
|
|
+{
|
|
|
|
|
+ SQ_FUNC_VARS(v);
|
|
|
|
|
+ SQ_GET_NN_INSTANCE(v, 1);
|
|
|
|
|
+ if(_top_ == 1)
|
|
|
|
|
+ {
|
|
|
|
|
+ sq_pushinteger(v, self->nn->flags);
|
|
|
|
|
+ return 1;
|
|
|
|
|
+ }
|
|
|
|
|
+ SQ_GET_INTEGER(v, 2, flags);
|
|
|
|
|
+ self->nn->flags = flags;
|
|
|
|
|
+ return 0;
|
|
|
|
|
+}
|
|
|
|
|
+
|
|
|
|
|
+static SQRESULT sq_nn_weights(HSQUIRRELVM v)
|
|
|
|
|
+{
|
|
|
|
|
+ SQ_FUNC_VARS_NO_TOP(v);
|
|
|
|
|
+ SQ_GET_NN_INSTANCE(v, 1);
|
|
|
|
|
+ sq_pushfloat(v, AnnCountWeights(self->nn));
|
|
|
|
|
+ return 1;
|
|
|
|
|
+}
|
|
|
|
|
+
|
|
|
|
|
+static SQRESULT sq_nn_weight(HSQUIRRELVM v)
|
|
|
|
|
+{
|
|
|
|
|
+ SQ_FUNC_VARS(v);
|
|
|
|
|
+ SQ_GET_NN_INSTANCE(v, 1);
|
|
|
|
|
+ SQ_GET_INTEGER(v, 2, layer);
|
|
|
|
|
+ SQ_GET_INTEGER(v, 3, i);
|
|
|
|
|
+ SQ_GET_INTEGER(v, 4, j);
|
|
|
|
|
+
|
|
|
|
|
+ if(layer < 0 || layer >= self->nn->layers) return sq_throwerror(v, _SC("layer out of range"));
|
|
|
|
|
+ //if(i < 0 && i >= self->layer[layer]) return sq_throwerror(v, _("layer out of range"));
|
|
|
|
|
+
|
|
|
|
|
+ float *weight = &ANN_WEIGHT(self->nn, layer, i, j);
|
|
|
|
|
+ if(_top_ == 4)
|
|
|
|
|
+ {
|
|
|
|
|
+ sq_pushfloat(v, *weight);
|
|
|
|
|
+ return 1;
|
|
|
|
|
+ }
|
|
|
|
|
+ SQ_GET_FLOAT(v, 5, new_weight);
|
|
|
|
|
+ *weight = new_weight;
|
|
|
|
|
+ return 0;
|
|
|
|
|
+}
|
|
|
|
|
+
|
|
|
|
|
+static SQRESULT sq_nn_Ann2Tcl(HSQUIRRELVM v)
|
|
|
|
|
+{
|
|
|
|
|
+ SQ_FUNC_VARS_NO_TOP(v);
|
|
|
|
|
+ SQ_GET_NN_INSTANCE(v, 1);
|
|
|
|
|
+ Ann2Tcl(self->nn);
|
|
|
|
|
+ return 0;
|
|
|
|
|
+}
|
|
|
|
|
+
|
|
|
|
|
+static SQRESULT sq_nn_Ann2Js(HSQUIRRELVM v)
|
|
|
|
|
+{
|
|
|
|
|
+ SQ_FUNC_VARS_NO_TOP(v);
|
|
|
|
|
+ SQ_GET_NN_INSTANCE(v, 1);
|
|
|
|
|
+ Ann2Js(self->nn);
|
|
|
|
|
+ return 0;
|
|
|
|
|
+}
|
|
|
|
|
+
|
|
|
|
|
+static SQRESULT sq_nn_AnnPrint(HSQUIRRELVM v)
|
|
|
|
|
+{
|
|
|
|
|
+ SQ_FUNC_VARS_NO_TOP(v);
|
|
|
|
|
+ SQ_GET_NN_INSTANCE(v, 1);
|
|
|
|
|
+ AnnPrint(self->nn);
|
|
|
|
|
+ return 0;
|
|
|
|
|
+}
|
|
|
|
|
+
|
|
|
|
|
+#define _DECL_FUNC(name,nparams,tycheck) {_SC(#name),sq_nn_##name,nparams,tycheck}
|
|
|
|
|
+static SQRegFunction sq_nn_methods[] =
|
|
|
|
|
+{
|
|
|
|
|
+ _DECL_FUNC(constructor, -5,_SC("xiiaiii")),
|
|
|
|
|
+ _DECL_FUNC(clone, 1,_SC("x")),
|
|
|
|
|
+ _DECL_FUNC(Ann2Tcl, 1,_SC("x")),
|
|
|
|
|
+ _DECL_FUNC(Ann2Js, 1,_SC("x")),
|
|
|
|
|
+ _DECL_FUNC(AnnPrint, 1,_SC("x")),
|
|
|
|
|
+ _DECL_FUNC(flags, -1,_SC("xi")),
|
|
|
|
|
+ _DECL_FUNC(learn_rate, -1,_SC("xf")),
|
|
|
|
|
+ _DECL_FUNC(rprop_nminus, -1,_SC("xf")),
|
|
|
|
|
+ _DECL_FUNC(rprop_nplus, -1,_SC("xf")),
|
|
|
|
|
+ _DECL_FUNC(rprop_maxupdate, -1,_SC("xf")),
|
|
|
|
|
+ _DECL_FUNC(rprop_minupdate, -1,_SC("xf")),
|
|
|
|
|
+ _DECL_FUNC(weights, 1,_SC("x")),
|
|
|
|
|
+ _DECL_FUNC(weight, -4,_SC("xiiif")),
|
|
|
|
|
+ _DECL_FUNC(observe, -3,_SC("xaai")),
|
|
|
|
|
+ _DECL_FUNC(train, -1,_SC("xiii")),
|
|
|
|
|
+ _DECL_FUNC(run, 2,_SC("xa")),
|
|
|
|
|
+ _DECL_FUNC(classify, 2,_SC("xa")),
|
|
|
|
|
+ _DECL_FUNC(info, 1,_SC("x")),
|
|
|
|
|
+ {0,0}
|
|
|
|
|
+};
|
|
|
|
|
+#undef _DECL_FUNC
|
|
|
|
|
+
|
|
|
|
|
+typedef struct {
|
|
|
|
|
+ const SQChar *Str;
|
|
|
|
|
+ SQInteger Val;
|
|
|
|
|
+} KeyIntType, * KeyIntPtrType;
|
|
|
|
|
+
|
|
|
|
|
+static KeyIntType sq_nn_constants[] = {
|
|
|
|
|
+ #define MK_CONST(c) {_SC(#c), NR_##c}
|
|
|
|
|
+ #define MK_CONST_FLAG(c) {_SC(#c), NR_FLAG_##c}
|
|
|
|
|
+
|
|
|
|
|
+ MK_CONST_FLAG(NONE),
|
|
|
|
|
+ MK_CONST_FLAG(TRAINING),
|
|
|
|
|
+ MK_CONST_FLAG(REGRESSOR),
|
|
|
|
|
+ MK_CONST_FLAG(CLASSIFIER),
|
|
|
|
|
+ MK_CONST_FLAG(NORMALIZE),
|
|
|
|
|
+ MK_CONST_FLAG(AUTO_STOP),
|
|
|
|
|
+ MK_CONST_FLAG(OF_DETECTED),
|
|
|
|
|
+ MK_CONST_FLAG(BACKTRACK),
|
|
|
|
|
+ MK_CONST_FLAG(TO_PERSIST),
|
|
|
|
|
+ MK_CONST_FLAG(TO_TRANSFER),
|
|
|
|
|
+ MK_CONST(MAX_LAYERS),
|
|
|
|
|
+ MK_CONST(RDB_ENC_VER),
|
|
|
|
|
+ MK_CONST(INSERT_TRAIN),
|
|
|
|
|
+ MK_CONST(INSERT_TEST),
|
|
|
|
|
+ {0,0}
|
|
|
|
|
+};
|
|
|
|
|
+
|
|
|
|
|
+#ifdef __cplusplus
|
|
|
|
|
+extern "C" {
|
|
|
|
|
+#endif
|
|
|
|
|
+/* Register the AnnRprop class and its constants with the given Squirrel VM. */
|
|
|
|
|
+SQRESULT sqext_register_nn (HSQUIRRELVM v) {
|
|
|
|
|
+ sq_pushstring(v,sq_nn_TAG,-1);
|
|
|
|
|
+ sq_newclass(v,SQFalse);
|
|
|
|
|
+ sq_settypetag(v,-1,(void*)sq_nn_TAG);
|
|
|
|
|
+ sq_insert_reg_funcs(v, sq_nn_methods);
|
|
|
|
|
+
|
|
|
|
|
+ //add constants
|
|
|
|
|
+ KeyIntPtrType KeyIntPtr;
|
|
|
|
|
+ for (KeyIntPtr = sq_nn_constants; KeyIntPtr->Str; KeyIntPtr++) {
|
|
|
|
|
+ sq_pushstring(v, KeyIntPtr->Str, -1); //first the key
|
|
|
|
|
+ sq_pushinteger(v, KeyIntPtr->Val); //then the value
|
|
|
|
|
+ sq_newslot(v, -3, SQFalse); //store them
|
|
|
|
|
+ }
|
|
|
|
|
+
|
|
|
|
|
+ sq_newslot(v,-3,SQTrue);
|
|
|
|
|
+
|
|
|
|
|
+ return SQ_OK;
|
|
|
|
|
+}
|
|
|
|
|
+
|
|
|
|
|
+#ifdef __cplusplus
|
|
|
|
|
+}
|
|
|
|
|
+#endif
|
|
|
|
|
+
|
|
|
|
|
+
|