【发布时间】:2016-11-04 21:02:06
【问题描述】:
我想根据汽车的各项属性和价格对汽车进行分类。我需要用 MLP(多层感知器)来实现,但是除了 XOR 示例之外没有任何其他可参考的示例。我有 6 个属性,我把它们编码成双精度数组,例如 vhigh 对应 [1,0,0,0]。(这些属性在我链接的 UCI 数据集中。)
这是我的 MLP 代码,我想用 UCI 数据集对其进行训练,我该如何调整数据集以适配这段代码?
编辑:让我更清楚一点,我并不是说除了 XOR 问题之外没有任何其他示例。我的意思是我需要一个输入集的示例,不像 [1,0] 我需要超过 2 个输入。
import java.io.FileInputStream;
import java.io.FileOutputStream;
import java.io.ObjectInputStream;
import java.io.ObjectOutputStream;
/**
 * A feed-forward network made of an array of {@code Layer} objects that is
 * evaluated with {@link #execute(double[])} and trained one sample at a time
 * with {@link #backPropagate(double[], double[])}.
 *
 * <p>Layer 0 only holds the input values; every later layer computes, for each
 * neuron, the weighted sum of the previous layer's values plus the neuron's
 * bias and passes it through the configured {@code TransferFunction}.
 *
 * <p>The class is {@link java.io.Serializable} so that {@link #save(String)}
 * can write it with an {@code ObjectOutputStream}. NOTE(review): {@code Layer},
 * its neurons and the {@code TransferFunction} implementation are declared
 * elsewhere and must be serializable as well for saving to succeed -- confirm.
 */
public class MultiLayerPerceptron implements Cloneable, java.io.Serializable
{
    private static final long serialVersionUID = 1L;

    /** Step size applied to every weight and bias update. */
    protected double fLearningRate = 0.6;

    /** All layers of the network; index 0 is the input layer. */
    protected Layer[] fLayers;

    /** Activation function applied to every non-input neuron. */
    protected TransferFunction fTransferFunction;

    /**
     * Builds a network with one layer per entry of {@code layers}.
     *
     * @param layers       size of each layer, input layer first; each layer is
     *                     created as {@code new Layer(layers[i], layers[i - 1])}
     *                     and the first one as {@code new Layer(layers[0], 0)}
     *                     (presumably neuron count and previous-layer size --
     *                     verify against {@code Layer})
     * @param learningRate step size used by {@link #backPropagate}
     * @param fun          transfer function used for all non-input layers
     */
    public MultiLayerPerceptron(int[] layers, double learningRate, TransferFunction fun)
    {
        fLearningRate = learningRate;
        fTransferFunction = fun;

        fLayers = new Layer[layers.length];
        for (int i = 0; i < layers.length; i++)
        {
            // The input layer has no predecessor, so it is created with 0.
            int previousSize = (i == 0) ? 0 : layers[i - 1];
            fLayers[i] = new Layer(layers[i], previousSize);
        }
    }

    /**
     * Runs a forward pass and stores every neuron's value in the network.
     *
     * @param input values for the input layer; only the first
     *              {@code getInputLayerSize()} entries are read
     * @return a new array holding the values of the last layer's neurons
     */
    public double[] execute(double[] input)
    {
        Layer inputLayer = fLayers[0];
        Layer outputLayer = fLayers[fLayers.length - 1];
        double[] output = new double[outputLayer.Length];

        // Put input
        for (int i = 0; i < inputLayer.Length; i++)
        {
            inputLayer.Neurons[i].Value = input[i];
        }

        // Execute - hiddens + output
        for (int k = 1; k < fLayers.length; k++)
        {
            Layer current = fLayers[k];
            Layer previous = fLayers[k - 1];
            for (int i = 0; i < current.Length; i++)
            {
                double newValue = 0.0;
                for (int j = 0; j < previous.Length; j++)
                {
                    newValue += current.Neurons[i].Weights[j] * previous.Neurons[j].Value;
                }
                // The bias is added after the weighted sum, before activation.
                newValue += current.Neurons[i].Bias;
                current.Neurons[i].Value = fTransferFunction.evalute(newValue);
            }
        }

        // Get output
        for (int i = 0; i < outputLayer.Length; i++)
        {
            output[i] = outputLayer.Neurons[i].Value;
        }
        return output;
    }

    /**
     * Placeholder for a multi-threaded training step; it performs no work.
     *
     * @param input   ignored
     * @param output  ignored
     * @param nthread ignored
     * @return always {@code 0.0}
     */
    public double backPropagateMultiThread(double[] input, double[] output, int nthread)
    {
        return 0.0;
    }

    /**
     * Performs one training step on a single sample: runs a forward pass,
     * computes a delta for every neuron from the last layer back to the first,
     * and adjusts weights and biases by {@code fLearningRate * delta}.
     *
     * @param input  sample fed to {@link #execute(double[])}
     * @param output expected values for the output layer
     * @return the mean absolute difference between the network's output
     *         (computed before the update) and {@code output}, averaged over
     *         {@code output.length}
     */
    public double backPropagate(double[] input, double[] output)
    {
        double[] newOutput = execute(input);
        Layer outputLayer = fLayers[fLayers.length - 1];
        double error;

        // Output-layer deltas: (expected - actual) scaled by the derivative,
        // which is evaluated on the neuron's output value.
        for (int i = 0; i < outputLayer.Length; i++)
        {
            error = output[i] - newOutput[i];
            outputLayer.Neurons[i].Delta = error * fTransferFunction.evaluteDerivate(newOutput[i]);
        }

        for (int k = fLayers.length - 2; k >= 0; k--)
        {
            Layer current = fLayers[k];
            Layer next = fLayers[k + 1];

            // Deltas of layer k are computed from the not-yet-updated weights
            // of layer k + 1, so this loop must run before the update below.
            for (int i = 0; i < current.Length; i++)
            {
                error = 0.0;
                for (int j = 0; j < next.Length; j++)
                {
                    error += next.Neurons[j].Delta * next.Neurons[j].Weights[i];
                }
                current.Neurons[i].Delta = error * fTransferFunction.evaluteDerivate(current.Neurons[i].Value);
            }

            // Update weights and biases of layer k + 1.
            for (int i = 0; i < next.Length; i++)
            {
                for (int j = 0; j < current.Length; j++)
                {
                    next.Neurons[i].Weights[j] += fLearningRate * next.Neurons[i].Delta *
                            current.Neurons[j].Value;
                }
                next.Neurons[i].Bias += fLearningRate * next.Neurons[i].Delta;
            }
        }

        // Mean absolute error of the pre-update prediction.
        error = 0.0;
        for (int i = 0; i < output.length; i++)
        {
            error += Math.abs(newOutput[i] - output[i]);
        }
        error = error / output.length;
        return error;
    }

    /**
     * Serializes this network to a file.
     *
     * @param path destination file path
     * @return {@code true} if the object was written, {@code false} if any
     *         exception occurred while opening or writing the file
     */
    public boolean save(String path)
    {
        // try-with-resources closes both streams even when writing fails.
        try (FileOutputStream fout = new FileOutputStream(path);
             ObjectOutputStream oos = new ObjectOutputStream(fout))
        {
            oos.writeObject(this);
        }
        catch (Exception e)
        {
            // Failure is reported through the return value, as callers expect.
            return false;
        }
        return true;
    }

    /**
     * Reads a network previously written by {@link #save(String)}.
     *
     * <p>NOTE(review): this uses Java native deserialization; only load files
     * from a trusted source.
     *
     * @param path source file path
     * @return the deserialized network, or {@code null} if the file could not
     *         be read or did not contain a {@code MultiLayerPerceptron}
     */
    public static MultiLayerPerceptron load(String path)
    {
        // try-with-resources closes both streams even when reading fails.
        try (FileInputStream fin = new FileInputStream(path);
             ObjectInputStream ois = new ObjectInputStream(fin))
        {
            return (MultiLayerPerceptron) ois.readObject();
        }
        catch (Exception e)
        {
            // Failure is reported through a null result, as callers expect.
            return null;
        }
    }

    /** @return the current learning rate */
    public double getLearningRate()
    {
        return fLearningRate;
    }

    /** @param rate the learning rate to use for subsequent training steps */
    public void setLearningRate(double rate)
    {
        fLearningRate = rate;
    }

    /** @param fun the transfer function to use for subsequent passes */
    public void setTransferFunction(TransferFunction fun)
    {
        fTransferFunction = fun;
    }

    /** @return the number of neurons in the first layer */
    public int getInputLayerSize()
    {
        return fLayers[0].Length;
    }

    /** @return the number of neurons in the last layer */
    public int getOutputLayerSize()
    {
        return fLayers[fLayers.length - 1].Length;
    }
}
【问题讨论】:
-
在互联网上使用神经网络的例子有成百上千个。声称它们都是关于异或的,这是一个巨大的误解。
标签: java machine-learning neural-network perceptron