riabcis / Untitled / Mar 24th, 2018

// Ann.cpp : Defines the entry point for the console application.
//

#include "stdafx.h"
#include <cmath>
#include <cstdlib>
#include <vector>
#include <iostream>
#include <iomanip>
#include <fstream>
#include <string>
using namespace std;

// Generates a random number, either 0 or 1 (uniform distribution), for the XOR
// operation. Can be removed later if data is read from files.
int randint();

struct Sample
{
    double input[2];
    double output[2];
    string ToString() {
        string str;
        str = "input: " + to_string(input[0]) + " " + to_string(input[1])
            + " output: " + to_string(output[0]) + " " + to_string(output[1]) + "\n";
        return str;
    }
};

class Data
{
public:
    int getNumberOfInputs() { return inputs; }
    int getNumberOfOutputs() { return outputs; }

    double *getInput(int index)
    {
        return data[index].input;
    }

    double *getOutput(int index)
    {
        return data[index].output;
    }

    int getNumberOfSamples() { return samples; }

    void addSample(Sample sample)
    {
        data.push_back(sample);
        samples++;
    }

    void setSizes(int input_size, int output_size)
    {
        inputs = input_size;
        outputs = output_size;
    }

protected:
    std::vector<Sample> data;
    int inputs;
    int outputs;
    int samples = 0;
};

class XOR : public Data
{
public:
    void generate(int n)
    {
        for (int i = 0; i < n; i++)
        {
            double input1 = randint();
            double input2 = randint();
            double output1 = (input1 == input2); // 1 when inputs are equal (XNOR)
            double output2 = (input1 != input2); // 1 when inputs differ (XOR)
            addSample({ { input1, input2 }, { output1, output2 } });
        }
    }

    XOR()
    {
        inputs = 2;
        outputs = 2;
        samples = 0;
    }

    void printInputs(int index)
    {
        cout << index << " index inputs: " << endl;
        for (int i = 0; i < inputs; i++)
        {
            cout << getInput(index)[i] << " ";
        }
        cout << endl;
    }

    void printOutputs(int index)
    {
        cout << index << " index outputs: " << endl;
        for (int i = 0; i < outputs; i++)
        {
            cout << fixed << setprecision(2) << data[index].output[i] << " ";
        }
        cout << endl;
    }
};
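
// A minimal usage sketch (not called anywhere below; the printing helpers are
// otherwise unused): generate a few samples and print them.
//   XOR xo;
//   xo.generate(4);
//   for (int i = 0; i < xo.getNumberOfSamples(); i++) {
//       xo.printInputs(i);
//       xo.printOutputs(i);
//   }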

struct Topology
{
    int L;              // number of layers
    std::vector<int> l; // neuron counts per layer (without bias)
} topolygy;
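// Example: L = 3 with l = {2, 3, 1} would describe a 2-3-1 network;
// main() below fills this in the same way to build a 2-5-6-7-2 network.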

int kiek = 0; // operation counter, for statistics - ignore

double f(double x);
double f_deriv(double x);
double gL(double a, double z, double t);
double gl(int layer_id, int w_i, int w_j, double *a_arr, double *z_arr, double *t_arr, double *w_arr, int *s, int *sw, int L, int *l);
double w_gradient(int layer_id, int w_i, int w_j, double *a_arr, double *z_arr, double *t_arr, double *w_arr, int *s, int *sw, int L, int *l);
double delta_w(double grad, double dw);

const double ETA = 0.1;
const double ALPHA = 0.5;
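// ETA is the learning rate and ALPHA the momentum coefficient: each weight
// update is delta_w = -ETA * gradient + ALPHA * previous_delta_w
// (see delta_w() at the bottom of the file).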

class AnnBase {
public:
    virtual void prepare(Topology top) = 0;
    virtual void init(Topology top, double w_arr_1[]) = 0;
    virtual void train(double *a, double *b) = 0;
    virtual void feedForward(double *a, double *b) = 0; // a and b are temp vars for now.
    virtual void destroy() = 0;
};

class AnnSerialDBL : public AnnBase {
public:
    void prepare(Topology top);
    void init(Topology top, double w_arr_1[]);
    void train(double *a, double *b);
    void feedForward(double *a, double *b);
    void destroy();
public:
    int sum1;       // length of a_arr/z_arr, kept so z can be reset between passes; could be removed after adapting the code
    int L;          // number of layers
    int *l;         // neuron counts per layer, including bias
    int *s;         // start index of each layer in a_arr/z_arr
    double *a_arr;  // activations
    double *z_arr;  // weighted sums
    int *W;         // weight counts per layer
    int *sw;        // start index of each layer's weights in w_arr
    double *w_arr;  // weights
    double *dw_arr; // previous weight deltas (for momentum)
    double *t_arr;  // target outputs
};
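
// Memory layout of the flattened arrays:
//   a_arr[s[i] + j] is activation j of layer i; the last slot of each
//   non-output layer, a_arr[s[i + 1] - 1], is a bias neuron fixed at 1.
//   w_arr[sw[i] + k + j*(l[i + 1] - 1)] is the weight from neuron j of
//   layer i to neuron k of layer i + 1.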

int main()
{
    topolygy.L = 5;
    topolygy.l.push_back(2);
    topolygy.l.push_back(5);
    topolygy.l.push_back(6);
    topolygy.l.push_back(7);
    topolygy.l.push_back(2);
    AnnSerialDBL labas;
    labas.prepare(topolygy);
    labas.init(topolygy, NULL);

    //****temp
    int sum = 0;
    for (int i = 0; i < labas.L; i++) {
        sum += topolygy.l.at(i) + 1;
    }
    //temp***

    XOR xo;
    xo.generate(60000);
    for (int i = 0; i < xo.getNumberOfSamples(); i++) {
        labas.train(xo.getInput(i), xo.getOutput(i));
    }

    //****temp
    for (int i = 0; i < sum; i++) {
        // cout << labas.a_arr[i] << endl;
    }
    //******temp

    // Check results (all four combinations of 0 and 1)
    for (double i = 0; i < 2; i++) {
        for (double j = 0; j < 2; j++) {
            double input[] = { i, j };
            double output[] = { 0, 0 };
            labas.feedForward(input, output);

            cout << endl << "input : " << input[0] << " " << input[1] << endl;
            cout << endl << "output: " << output[0] << " " << output[1] << endl << endl;
            cout << "---------------------------------------------------" << endl;
        }
    }

    // Check one random input
    for (double i = 0; i < 1; i++) {
        double input[] = { randint() * 1.0, randint() * 1.0 };
        double output[] = { 0, 0 };
        labas.feedForward(input, output);

        cout << endl << "input : " << input[0] << " " << input[1] << endl;
        cout << endl << "output: " << output[0] << " " << output[1] << endl << endl;
        cout << "---------------------------------------------------" << endl;
    }

    labas.destroy();

    int a;
    cout << kiek;
    cin >> a;

    return 0;
}

// Returns a random int, either 0 or 1.
int randint() {
    double r = ((double)rand() / (RAND_MAX));
    return (r > 0.5) ? 1 : 0;
}

void AnnSerialDBL::prepare(Topology top)
{
    l = new int[top.L];
    s = new int[top.L];

    int sum = 0;  // total neurons, incl. one bias per layer
    int mult = 0; // total weights
    for (int i = 0; i < top.L; i++) {
        sum += top.l.at(i) + 1;
    }
    sum1 = sum;
    for (int i = 0; i < top.L - 1; i++) {
        mult += (top.l.at(i) + 1) * top.l.at(i + 1);
    }
    a_arr = new double[sum];
    z_arr = new double[sum];

    W = new int[top.L];
    sw = new int[top.L];

    w_arr = new double[mult];
    dw_arr = new double[mult];

    t_arr = new double[top.l.at(top.L - 1)];
}
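
// For the 2-5-6-7-2 topology built in main(): sum = 3 + 6 + 7 + 8 + 3 = 27
// neurons (incl. biases) and mult = 3*5 + 6*6 + 7*7 + 8*2 = 116 weights.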

void AnnSerialDBL::init(Topology top, double w_arr_1[])
{
    L = top.L;
    // Neuron counts per layer (incl. bias)
    for (int i = 0; i < top.L; i++) {
        l[i] = top.l.at(i) + 1;
    }

    // Start index of each layer
    for (int i = 0; i < top.L; i++) {
        s[i] = 0;
        for (int j = i; j > 0; j--) {
            s[i] += l[j - 1];
        }
    }

    // Bias neurons
    for (int i = 0; i < top.L - 1; i++) {
        a_arr[s[i + 1] - 1] = 1;
    }

    // Weight counts and start indices for each layer
    for (int i = 0; i < top.L - 1; i++) {
        W[i] = l[i] * (l[i + 1] - 1);
        sw[i] = 0;
        if (i != 0) {
            for (int j = 0; j < i; j++) {
                sw[i] += W[j];
            }
        }
        if (w_arr_1 == NULL) {
            // random init in [0, 1)
            for (int j = 0; j < W[i]; j++) {
                w_arr[sw[i] + j] = (double)rand() / double(RAND_MAX);
                dw_arr[sw[i] + j] = 0;
            }
        }
        else {
            // Copy the supplied weights instead of taking ownership of the
            // pointer, so destroy() can safely delete[] w_arr.
            // (Should the weight deltas be saved/restored as well?)
            for (int j = 0; j < W[i]; j++) {
                w_arr[sw[i] + j] = w_arr_1[sw[i] + j];
                dw_arr[sw[i] + j] = 0;
            }
        }
    }
}

void AnnSerialDBL::train(double *a, double *b)
{
    a_arr[0] = a[0];
    a_arr[1] = a[1];

    for (int j = 0; j < sum1; j++) {
        z_arr[j] = 0;
    }

    // FEED FORWARD
    for (int i = 0; i < L - 1; i++) {                // over layers
        for (int j = 0; j < l[i]; j++) {             // over neurons in layer i
            for (int k = 0; k < l[i + 1] - 1; k++) { // over next layer's z values
                z_arr[s[i + 1] + k] += w_arr[sw[i] + k + j*(l[i + 1] - 1)] * a_arr[s[i] + j];
                kiek++; // temp
            }
        }
        for (int k = 0; k < l[i + 1] - 1; k++) {     // activate next layer
            a_arr[s[i + 1] + k] = f(z_arr[s[i + 1] + k]);
        }
    }

    t_arr[0] = b[0];
    t_arr[1] = b[1];

    // BACK PROPAGATION
    for (int i = L - 2; i >= 0; i--) {               // over layers, last to first
        for (int j = 0; j < l[i]; j++) {             // over neurons in layer i
            for (int k = 0; k < l[i + 1] - 1; k++) { // over next layer's neurons
                dw_arr[sw[i] + k + j*(l[i + 1] - 1)] = delta_w(w_gradient(i, j, k, a_arr, z_arr, t_arr, w_arr, s, sw, L, l), dw_arr[sw[i] + k + j*(l[i + 1] - 1)]);
                w_arr[sw[i] + k + j*(l[i + 1] - 1)] += dw_arr[sw[i] + k + j*(l[i + 1] - 1)];
            }
        }
    }
}
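
// Note: train() performs one gradient-descent step per sample (online
// learning); main() calls it once for each of the 60000 generated samples.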

void AnnSerialDBL::feedForward(double *a, double *b)
{
    a_arr[0] = a[0];
    a_arr[1] = a[1];

    for (int j = 0; j < sum1; j++) {
        z_arr[j] = 0;
    }

    // FEED FORWARD
    for (int i = 0; i < L - 1; i++) {                // over layers
        for (int j = 0; j < l[i]; j++) {             // over neurons in layer i
            for (int k = 0; k < l[i + 1] - 1; k++) { // over next layer's z values
                z_arr[s[i + 1] + k] += w_arr[sw[i] + k + j*(l[i + 1] - 1)] * a_arr[s[i] + j];
            }
        }
        for (int k = 0; k < l[i + 1] - 1; k++) {     // activate next layer
            a_arr[s[i + 1] + k] = f(z_arr[s[i + 1] + k]);
        }
    }

    // Convert the two output activations to one-hot by taking the larger one.
    if (a_arr[s[L - 1]] > a_arr[s[L - 1] + 1]) {
        b[0] = 1;
        b[1] = 0;
    }
    else {
        b[0] = 0;
        b[1] = 1;
    }
}

void AnnSerialDBL::destroy()
{
    // Arrays allocated with new[] must be released with delete[].
    delete[] l;
    l = NULL;
    delete[] s;
    s = NULL;

    delete[] a_arr;
    a_arr = NULL;
    delete[] z_arr;
    z_arr = NULL;

    delete[] W;
    W = NULL;
    delete[] sw;
    sw = NULL;

    delete[] w_arr;
    w_arr = NULL;
    delete[] dw_arr;
    dw_arr = NULL;

    delete[] t_arr;
    t_arr = NULL;
}

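// f() is the logistic sigmoid f(x) = 1 / (1 + e^(-x)); f_deriv() is its
// derivative f'(x) = e^(-x) / (1 + e^(-x))^2, which equals f(x) * (1 - f(x)).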
double f(double x) {
    double y = 1 + exp(-x);
    //temp*********************
    if (y == 0) {
        cout << "Error 1";
    }
    if ((y - 1) == 0) {
        //cout << "Error 2";
    }
    //temp**********************
    return 1 / y;
}

double f_deriv(double x) {
    //Temp**********
    double y = pow((1 + exp(-x)), 2);
    double z = exp(-x);
    if (y == 0) {
        cout << "Error 3";
    }
    if (z == 0) {
        cout << "Error 4";
    }
    //temp**********************
    return exp(-x) / pow((1 + exp(-x)), 2);
}

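// Backpropagation helpers:
//   gL(a, z, t)  - output-layer error term: f'(z) * (a - t), the derivative
//                  of the squared error wrt that output's weighted sum z.
//   gl(...)      - hidden-layer error term, computed recursively by summing
//                  the next layer's error terms weighted by the connecting
//                  weights and scaling by f'(z).
//   w_gradient() - gradient of the error wrt one weight: the source neuron's
//                  activation times the target neuron's error term.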
double gL(double a, double z, double t) {
    double w = f_deriv(z) * (a - t);
    return w;
}

double gl(int layer_id, int w_i, int w_j, double *a_arr, double *z_arr, double *t_arr, double *w_arr, int *s, int *sw, int L, int *l) {
    double w = f_deriv(z_arr[s[layer_id] + w_j]);
    double sum = 0;
    for (int i = 0; i < l[layer_id + 1] - 1; i++) {
        if (layer_id + 2 == L) {
            sum += w_arr[sw[layer_id] + i] * gL(a_arr[s[layer_id + 1] + i], z_arr[s[layer_id + 1] + i], t_arr[i]);
        }
        else {
            sum += w_arr[sw[layer_id] + w_j] * gl(layer_id + 1, w_i, i, a_arr, z_arr, t_arr, w_arr, s, sw, L, l);
        }
    }
    return w * sum;
}

double w_gradient(int layer_id, int w_i, int w_j, double *a_arr, double *z_arr, double *t_arr, double *w_arr, int *s, int *sw, int L, int *l) {
    double w = a_arr[s[layer_id] + w_i];
    if (layer_id + 2 == L) {
        w *= gL(a_arr[s[layer_id + 1] + w_j], z_arr[s[layer_id + 1] + w_j], t_arr[w_j]);
    }
    else {
        w *= gl(layer_id + 1, w_i, w_j, a_arr, z_arr, t_arr, w_arr, s, sw, L, l);
    }
    return w;
}

// Gradient-descent step with momentum.
double delta_w(double grad, double dw) {
    return (-ETA) * grad + ALPHA * dw;
}