import java.io.BufferedReader;
import java.io.File;
import java.io.FileInputStream;
import java.io.IOException;
import java.io.InputStreamReader;
import java.text.DecimalFormat;
import java.util.ArrayList;
import java.util.Collections;
import java.util.Comparator;
import java.util.HashMap;
import java.util.Set;
import java.util.Map.Entry;
/*
* 统计小说的字符
*/
public class CharCountDemo {
public static void main(String[] args) throws IOException{
File file = new File("c:/山楂树之恋.txt");
InputStreamReader reader = new InputStreamReader(new FileInputStream(file), "utf-8");
BufferedReader in = new BufferedReader(reader);
HashMap<Character,Integer> map = new HashMap<Character, Integer>();;
int count = 0;
int b;
while(true){
b = reader.read();
if(b==-1){
break;
}
if(b=='\r' || b=='\n' || b==' ' || b=='\t' || b==','){
continue;
}
count++;
Integer value = map.get((char)b);//查找map中是否已经有该字符。如果有则取出原来计数,否则返回一个null值。
if(value==null){
map.put((char)b, 1);
}else{
map.put((char)b, ++value);
}
}
in.close();
// 排序统计结果
Set<Entry<Character,Integer>> set = map.entrySet();
ArrayList<Entry<Character,Integer>> list = new ArrayList<Entry<Character,Integer>>(set);
Collections.sort(list, new Comparator<Entry<Character,Integer>>() {
public int compare(Entry<Character, Integer> o1,
Entry<Character, Integer> o2) {
return -(o1.getValue()-o2.getValue());
}
});
// 输出统计结果
System.out.println("count=" + count);
System.out.println("字数: " + list.size());
DecimalFormat fmt = new DecimalFormat("0.##%");
int n = 0;
for(Entry<Character,Integer> e : list){
System.out.println(e+"," + fmt.format(e.getValue()/(double)count));
if(++n==10)
break;
}
}
}