Implementing the Naive Bayes Algorithm in Java

Naive Bayes is a simple but very effective classification algorithm based on Bayes' theorem. It assumes that features are conditionally independent given the class, which is where the word "naive" comes from. Below is an example of a Naive Bayes classifier implemented in Java.
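For reference, this is the standard Naive Bayes decision rule that the code below implements in log space:

    y* = argmax_y  P(y) · Π_i P(x_i | y)
       = argmax_y  ( log P(y) + Σ_i log P(x_i | y) )

Working with sums of logarithms avoids floating-point underflow when many small probabilities are multiplied together.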

import java.util.HashMap;
import java.util.HashSet;
import java.util.Map;
import java.util.Set;

public class NaiveBayesClassifier {
    // How often each feature value occurs with each label
    private final Map<String, Map<String, Integer>> featureCountPerLabel;
    // Number of training samples per label
    private final Map<String, Integer> labelCount;
    // All distinct feature values seen during training (used for add-one smoothing)
    private final Set<String> vocabulary;
    private int totalSamples;

    public NaiveBayesClassifier() {
        featureCountPerLabel = new HashMap<>();
        labelCount = new HashMap<>();
        vocabulary = new HashSet<>();
        totalSamples = 0;
    }

    public void train(String[] features, String label) {
        labelCount.put(label, labelCount.getOrDefault(label, 0) + 1);
        Map<String, Integer> featureCount =
                featureCountPerLabel.computeIfAbsent(label, k -> new HashMap<>());
        for (String feature : features) {
            featureCount.put(feature, featureCount.getOrDefault(feature, 0) + 1);
            vocabulary.add(feature);
        }
        totalSamples++;
    }

    public String predict(String[] features) {
        String bestLabel = null;
        double bestLogProbability = Double.NEGATIVE_INFINITY;

        for (String label : labelCount.keySet()) {
            // Log prior: log P(label)
            double logProbability = Math.log(labelCount.get(label) / (double) totalSamples);

            Map<String, Integer> featureCount =
                    featureCountPerLabel.getOrDefault(label, new HashMap<>());
            int totalFeatureCount = 0;
            for (int count : featureCount.values()) {
                totalFeatureCount += count;
            }

            for (String feature : features) {
                int count = featureCount.getOrDefault(feature, 0);
                // Log likelihood with add-one (Laplace) smoothing:
                // (count + 1) / (total feature occurrences for this label + vocabulary size)
                logProbability += Math.log((count + 1.0) / (totalFeatureCount + vocabulary.size()));
            }

            if (logProbability > bestLogProbability) {
                bestLogProbability = logProbability;
                bestLabel = label;
            }
        }

        return bestLabel;
    }
}

Testing the Classifier

public class NaiveBayesExample {
    public static void main(String[] args) {
        NaiveBayesClassifier classifier = new NaiveBayesClassifier();

        // Training data (the classic weather / play-tennis dataset)
        classifier.train(new String[]{"sunny", "hot", "high", "false"}, "no");
        classifier.train(new String[]{"sunny", "hot", "high", "true"}, "no");
        classifier.train(new String[]{"overcast", "hot", "high", "false"}, "yes");
        classifier.train(new String[]{"rainy", "mild", "high", "false"}, "yes");
        classifier.train(new String[]{"rainy", "cool", "normal", "false"}, "yes");
        classifier.train(new String[]{"rainy", "cool", "normal", "true"}, "no");
        classifier.train(new String[]{"overcast", "cool", "normal", "true"}, "yes");
        classifier.train(new String[]{"sunny", "mild", "high", "false"}, "no");
        classifier.train(new String[]{"sunny", "cool", "normal", "false"}, "yes");
        classifier.train(new String[]{"rainy", "mild", "normal", "false"}, "yes");
        classifier.train(new String[]{"sunny", "mild", "normal", "true"}, "yes");
        classifier.train(new String[]{"overcast", "mild", "high", "true"}, "yes");
        classifier.train(new String[]{"overcast", "hot", "normal", "false"}, "yes");
        classifier.train(new String[]{"rainy", "mild", "high", "true"}, "no");

        // Predict the class of a new sample
        String[] newSample = {"sunny", "cool", "high", "true"};
        String prediction = classifier.predict(newSample);
        System.out.println("Predicted class: " + prediction);
    }
}

Output

The program predicts the class of the new sample {"sunny", "cool", "high", "true"} from the training data.
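With the training data above (9 "yes" samples and 5 "no" samples), working through the smoothed counts by hand gives the larger posterior to "no", so the expected console output is:

Predicted class: no

This agrees with the usual textbook result for this weather dataset.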

Notes

  • The train method trains the classifier by recording, for each label, how many samples carry that label and how often each feature value occurs with it.
  • The predict method classifies a new sample. Following Bayes' theorem, it computes a log-posterior score for each label (log prior plus the summed log likelihoods of the sample's feature values) and returns the label with the highest score.

The implementation uses simple additive (add-one / Laplace) smoothing to handle feature values that never appear with a given label in the training data: each count gets +1, and the denominator is the total number of feature occurrences for that label plus the vocabulary size. A worked example follows.
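A quick worked example with the training set above: the value "overcast" never occurs together with the label "no". Without smoothing its estimated likelihood would be 0 and would wipe out the entire product for that label. With add-one smoothing, the five "no" samples contribute 5 × 4 = 20 feature occurrences and the vocabulary holds 10 distinct values, so:

P("overcast" | "no") = (0 + 1) / (20 + 10) = 1/30 ≈ 0.033

The estimate is small but non-zero, so a single unseen feature value no longer vetoes a label.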
