?? targettext.java~22~

基于樸素貝葉斯算法實現的中文文本分類程序，可以對中文文本進行分類識別。

?? JAVA~22~

字號:

/** * <p>Title: </p> * <p>Description: </p> * <p>Copyright: Copyright (c) 2005</p> * <p>Company: </p> * @author not attributable * @version 1.0 */import java.io.*;import java.util.*;public class TargetText {  Dictionary newDict;  float []NB=new float[3];  int []NBE=new int[3];  public TargetText() {  }  public void init(Dictionary dict){    newDict=dict;    for(int i=0;i<3;i++){      NB[i]=1;      NBE[i]=0;    }  }  public void categorize(Sample []v,int n,String filename){    for(int i=0;i<n;i++){      fileSegment(filename,v[i].wordTable,i);    }    int temp=NBE[0];    int j=0;    for(int i=1;i<3;i++){      if(temp>NBE[i]){        temp=NBE[i];        j=i;      }    }    if(j==0){      System.out.println("This text belongs to science");    }else if(j==1){      System.out.println("This text belongs to sport");    }else if(j==2){      System.out.println("This text belongs to history");    }    //System.out.println(NB[0]+":"+NBE[0]+" "+NB[1]+":"+NBE[1]+" "+NB[2]+":"+NBE[2]);  }  public int wordSegment(String Sentence,HashMap hm,int n) {    int senLen = Sentence.length();    int i = 0, j = 0;    int M = 12;    String word;    boolean bFind = false;      while (i < senLen) {        int N = i + M < senLen ? 
i + M : senLen + 1;        bFind = false;        for (j = N - 1; j > i; j--) {          word = Sentence.substring(i, j);          if (newDict.Find(word)) {            if (j > i + 1) {              if (hm.containsKey(word)) {                NB[n]=NB[n]*((Float)hm.get(word)).floatValue();  //計算每一個類別的概率                while(NB[n]<1){                  NBE[n]=NBE[n]+1;                  NB[n]=NB[n]*10;                }              }            }            bFind = true;            i = j;            break;          }        }        if (bFind == false) {          i = j + 1;        }      }    return 1;  }  public void fileSegment(String fileName,HashMap hm,int n) { //按行讀入    try {      BufferedReader in = new BufferedReader(          new FileReader(fileName));      String s;      while ((s = in.readLine()) != null) {        wordSegment(s,hm,n);      }    }    catch (IOException e) {      System.out.println(e);    }  }}

?? 文件大小 311 K

?? 上傳用戶 zxyxwd6

?? 所屬分類人工智能/神經網絡

??? 相關標簽

#貝葉斯算法 #文本分類 #分類 #程序

?? 快捷鍵說明

復制代碼 Ctrl + C

搜索代碼 Ctrl + F

全屏模式 F11

切換主題 Ctrl + Shift + D

顯示快捷鍵 ?

增大字號 Ctrl + =

減小字號 Ctrl + -

亚洲欧美第一页_禁久久精品乱码_粉嫩av一区二区三区免费野_久草精品视频

?? targettext.java~22~

?? 快捷鍵說明