讀取JDK API文檔,並根據單詞出現頻率排序

1,拿到 API 文檔

訪問 https://docs.oracle.com/javase/8/docs/api/java

選中特定的類,而後 copy 其中的內容。

1545827963474.png

放入 TXT 文件中。

1545828104822.png

2,讀取TXT內容,並排序

package com.lgx.test;

import java.io.BufferedReader;
import java.io.File;
import java.io.FileNotFoundException;
import java.io.FileReader;
import java.io.IOException;
import java.util.ArrayList;
import java.util.Collections;
import java.util.Comparator;
import java.util.List;
import java.util.Map;
import java.util.Map.Entry;
import java.util.Set;
import java.util.TreeMap;

/**
 * Counts how often each word occurs in the text file named by {@link #filename}
 * and prints the totals to standard output, either ordered alphabetically or
 * ordered by descending frequency.
 *
 * <p>Words are compared case-insensitively (they are lower-cased before being
 * counted) and are delimited by the characters in {@link #WORD_SEPARATORS}.
 */
public class ReadVectorAPI {

    /** Path of the text file to analyse; mutable so callers can point it at another file. */
    public static String filename = "src/Vector.txt";

    /** Not read or written anywhere in this class; kept only because it is a public field. */
    public static StringBuffer sb = null;

    /** Regex character class listing every character that separates two words. */
    private static final String WORD_SEPARATORS = "[ \n\t\r.,;:!?(){}]";

    /**
     * Prints the word counts twice: first ordered by word, then ordered by frequency.
     * A missing input file is reported with a stack trace on standard error.
     *
     * @param args ignored
     */
    public static void main(String[] args) {
        try {
            // Alphabetical listing.
            countWordOrderByWord();
            // Listing by descending frequency.
            countWordOrderByCount();
        } catch (FileNotFoundException e) {
            e.printStackTrace();
        }
    }

    /**
     * Counts the words in {@link #filename} and prints them in ascending
     * (natural {@code String}) order of the word.
     *
     * <p>An I/O failure while reading is reported with a stack trace and nothing
     * is printed to standard output.
     *
     * @throws FileNotFoundException if the file cannot be opened for reading
     */
    public static void countWordOrderByWord() throws FileNotFoundException {
        try {
            TreeMap<String, Integer> counts = readWordCounts();
            // A TreeMap already iterates in key order, so no extra sort is needed.
            printCounts("=====根據單詞字母排序=====", counts.entrySet());
        } catch (FileNotFoundException e) {
            // Must be caught before IOException, otherwise the declared exception
            // would be swallowed by the broader handler and never reach the caller.
            throw e;
        } catch (IOException e) {
            e.printStackTrace();
        }
    }

    /**
     * Counts the words in {@link #filename} and prints them in descending order
     * of occurrence count. Words with equal counts stay in alphabetical order
     * because the sort is stable and starts from the key-ordered map.
     *
     * <p>An I/O failure while reading is reported with a stack trace and nothing
     * is printed to standard output.
     *
     * @throws FileNotFoundException if the file cannot be opened for reading
     */
    public static void countWordOrderByCount() throws FileNotFoundException {
        try {
            TreeMap<String, Integer> counts = readWordCounts();
            List<Map.Entry<String, Integer>> byCount =
                    new ArrayList<Map.Entry<String, Integer>>(counts.entrySet());
            Collections.sort(byCount, new Comparator<Map.Entry<String, Integer>>() {
                @Override
                public int compare(Map.Entry<String, Integer> o1, Map.Entry<String, Integer> o2) {
                    // Arguments reversed on purpose: highest count first.
                    return o2.getValue().compareTo(o1.getValue());
                }
            });
            printCounts("=====根據單詞頻率排序=====", byCount);
        } catch (FileNotFoundException e) {
            // See countWordOrderByWord(): propagate instead of swallowing.
            throw e;
        } catch (IOException e) {
            e.printStackTrace();
        }
    }

    /**
     * Reads {@link #filename} line by line and tallies every non-empty,
     * lower-cased token.
     *
     * @return a map from word to occurrence count, ordered by word
     * @throws IOException if the file cannot be opened or read
     */
    private static TreeMap<String, Integer> readWordCounts() throws IOException {
        TreeMap<String, Integer> counts = new TreeMap<String, Integer>();
        // try-with-resources guarantees the reader is closed even if readLine() fails.
        try (BufferedReader reader = new BufferedReader(new FileReader(new File(filename)))) {
            String line;
            while ((line = reader.readLine()) != null) {
                for (String token : line.split(WORD_SEPARATORS)) {
                    // Locale.ROOT keeps the folding independent of the default locale.
                    String word = token.toLowerCase(java.util.Locale.ROOT);
                    if (word.isEmpty()) {
                        // Adjacent separators produce empty tokens; they are not words.
                        continue;
                    }
                    Integer seen = counts.get(word);
                    counts.put(word, seen == null ? 1 : seen + 1);
                }
            }
        }
        return counts;
    }

    /** Prints the header line followed by one "word / count" line per entry, in iteration order. */
    private static void printCounts(String header, Iterable<Map.Entry<String, Integer>> entries) {
        System.out.println(header);
        for (Map.Entry<String, Integer> entry : entries) {
            System.out.println(entry.getKey() + " 在API文檔中出現了 " + entry.getValue() + " 次");
        }
    }
}

輸出結果前部分截圖爲:

1545828218319.png

相關文章
相關標籤/搜索