感知机算法的两种表示

 

 

感知机算法的原始形式

输入:训练数据集T={(x1,y1),(x2,y2),...,(xn,yn)},其中xi属于Rn(n维空间向量),yi={-1,+1},i=1,2,...,N

学习率t(0<t<=1);

输出:w,b;感知机模型f(x)=sign(w*x+b)

(1)选取初值w0,b0一般为 0

(2)在训练集中选取数据(xi,yi)

(3)如果yi(w*xi+b)<=0

                          w<---w+tyixi

                           b<----b+tyi

(4)转至(2),直至训练集中没有误分类点。

算法代码如下

复制代码
 1 import java.util.Random;
 2 import java.util.Scanner;
 3 import java.util.regex.Matcher;
 4 import java.util.regex.Pattern;
 5 
 6 //初始的感知机学习算法
 7 public class ganzhijiOriginal {
 8     //    数据集中数据的个数
 9     public static int NCount;
10     //    数据中每个数值的维数 不包含y
11     public static int N;
12     //    学习率  (0,1]
13     public static float t;
14 
15     //    保存数据
16     public static int datas[][];
17     //    权重向量
18     public static float w[];
19     //   偏移数据
20     public static float b;
21 
22     public static void main(String args[]) {
23         Scanner sca = new Scanner(System.in);
24 //       默认输入的格式为 N-t-b
25         System.out.println("输入格式为N-t-b-NCount的数据:");
26         String lines = sca.nextLine();
27         Pattern pattern = Pattern.compile("(.*)-(.*)-(.*)-(.*)");
28         Matcher matcher = pattern.matcher(lines);
29         matcher.find();
30         N = Integer.parseInt(matcher.group(1));
31         t = Float.parseFloat(matcher.group(2));
32         b = Float.parseFloat(matcher.group(3));
33 //        b = Integer.parseInt(matcher.group(3));
34         NCount = Integer.parseInt(matcher.group(4));
35 //        System.out.println("请输入权重向量的初始值格式为格式为x,x,x,x" + N);
36 //初始化数据集
37         w = new float[N];
38 //        lines = sca.nextLine();
39 //        String[] str = lines.split(",");
40 //        for (int i = 0; i < N; i++)
41 //            w[i] = Float.parseFloat(str[i]);
42         datas = new int[NCount][N + 1];
43         System.out.println("请输入所有权重向量的初始值");
44         for (int i = 0; i < NCount; i++) {
45             String line = sca.nextLine();
46             String strs[] = line.split(" ");
47             for (int j = 0; j <= N; j++)
48                 datas[i][j] = Integer.parseInt(strs[j]);
49         }
50         CountTheTimes = 0;
51         Random ra = new Random();
52         int chooseNumber = ra.nextInt(NCount);
53         CalcuteAndUpdatValue(0);
54         String strd = "";
55         for (int i = 0; i < N; i++)
56             strd += w[i] + "*x" + i + "+ ";
57         System.out.println("F(x)=sign(" + strd + b + ")");
58     }
59 
60     public static int CountTheTimes;
61 
62     private static void CalcuteAndUpdatValue(int chooseNumber) {
63         float f = isPOrN(chooseNumber);
64         boolean flages = f * datas[chooseNumber][N] > 0 ? true : false;
65         if (!flages) {
66             for (int j = 0; j < N; j++) //更新权重w的值
67                 w[j] = w[j] + t * datas[chooseNumber][N] * datas[chooseNumber][j];
68             b = b + t * datas[chooseNumber][N];
69 
70             CountTheTimes = 0;//初始化
71         } else {
72             CountTheTimes++;
73             chooseNumber = (chooseNumber + 1) % NCount;
74         }
75         if (CountTheTimes == NCount) return;
76         CalcuteAndUpdatValue(chooseNumber);
77     }
78 
79     private static float isPOrN(int chooseNumber) {
80         float sum = 0;
81         for (int i = 0; i < N; i++) sum += datas[chooseNumber][i] * w[i];
82         return sum + b;
83     }
84 
85 }
View Code
复制代码

 

感知机算法的对偶形式

输入:线性可分的数据集T={(x1,y1),(x2,y2),...,(xn,yn)}其中xi属于Rn(n维向量),yi属于{-1,+1},i,2,。。。,N;学习率为t (0<t<=1)

输出a,b 感知机模型f(x)=sign(j从1 到 ajyjxj*x累加  +b) 其中a=(a1,a2,a3...,an)T

(1)a<---0,b<----0

(2)在训练数据集中选择(xi,yi)

(3)如果 yi(j从1 到 ajyjxj*xi累加  +b)<=0

                  ai<----ai+t

                 b<---b+tyi

(4)转至(2)直到没有误分类点

算法如下

 

复制代码
import java.util.Random;
import java.util.Scanner;

//感知机算法的对偶形式
public class ganzhijiOudui {
    //存储数据的Gram矩阵
    public static int gramMatrix[][];
    //    存储初始点集合包括y
    public static int datas[][];
    //感知机中的学习率(0,1]
    public static float t;
    //    存储某个点更新的次数nt
    public static float a[];
    //    点的维度 不包含y
    public static int N;
    //    总点的数
    public static int NCount;
    //偏移量
    public static float b;

    public static int w[];//权重

    public static void main(String args[]) {
        Scanner sca = new Scanner(System.in);
        System.out.println("输入的格式为:N-t-b-NCount");
        String line = sca.nextLine();
        String dt[] = line.split("-");
        N = Integer.parseInt(dt[0]);
        t = Float.parseFloat(dt[1]);
        b = Float.parseFloat(dt[2]);
        NCount = Integer.parseInt(dt[3]);
        InitDatas(sca);


    }

    private static void InitDatas(Scanner sca) {
        datas = new int[NCount][N + 1];
        gramMatrix = new int[NCount][NCount];
        w = new int[N];
//        默认值为零
        a = new float[NCount];
        System.out.println("输入数据点集合格式为x x x ... Y");
        for (int i = 0; i < NCount; i++) {
            String line = sca.nextLine();
            String strs[] = line.split(" ");
            for (int j = 0; j <= N; j++) datas[i][j] = Integer.parseInt(strs[j]);
        }
        System.out.println("初始化Gram矩阵");
        for (int i = 0; i < NCount; i++) {
            for (int j = 0; j < NCount; j++) {
                gramMatrix[i][j] = MultiplyTheDatas(i, j);
            }
        }
//        记录总的循环次数
        TotalTimes = 0;
        Random random = new Random();
        int chooseNumber = random.nextInt(NCount);
        CalculateAndUpdatDatas(0);
        //更新 w
        for (int i = 0; i < N; i++) {
            int sum = 0;
            for (int j = 0; j < NCount; j++) sum += a[j] * datas[j][i]*datas[j][N];
            w[i] = sum;
        }
        String strd = "";
        for (int i = 0; i < N; i++)
            strd += w[i] + "*x" + i + "+ ";
        System.out.println("F(x)=sign(" + strd + b + ")");
    }

    public static int TotalTimes = 0;

    private static void CalculateAndUpdatDatas(int chooseNumber) {

        float sum = CaluteTheFx(chooseNumber);
        boolean flages = sum * datas[chooseNumber][N] > 0 ? true : false;
        if (!flages) {
            TotalTimes = 0;
            a[chooseNumber] = a[chooseNumber] + t;
            b = b + t * datas[chooseNumber][N];
        } else {
            TotalTimes++;
            chooseNumber = (chooseNumber + 1) % NCount;
        }
        if (TotalTimes == NCount) return;
        CalculateAndUpdatDatas(chooseNumber);
    }

    private static float CaluteTheFx(int chooseNumber) {

        float sum = 0;
        for (int i = 0; i <=N; i++) sum += a[i] * datas[i][N] * gramMatrix[i][chooseNumber];
        return sum + b;
    }


    //    计算两个向量的乘积
    private static int MultiplyTheDatas(int i, int j) {
        int sum = 0;
        for (int k = 0; k <N; k++) sum += datas[i][k] * datas[j][k];
        return sum;
    }


}
View Code
复制代码

 

posted @   张秀杰  阅读(617)  评论(0编辑  收藏  举报
点击右上角即可分享
微信分享提示