如何找到文本中出现频率最高的词?

问题描述 投票:0回答:1

我有一个问题:如果输入是 "Thanks Thanks Thanks car car",输出会是 "thanks"。也就是说,如果单词以大写字母开头,程序仍会以小写字母打印该单词。

 /**
  * Reads all of standard input and prints the most frequent word.
  *
  * <p>Words are the runs of word characters between matches of the regex
  * {@code \W+}. Counting is case-insensitive because every word is lower-cased
  * before it is counted, so the printed word is always lower case. When several
  * words share the highest count, a strictly shorter word replaces the current
  * candidate. Nothing is printed when the input contains no words.
  */
 public class Main {

     /**
      * Program entry point.
      *
      * @param args ignored
      * @throws IOException if reading standard input fails
      */
     public static void main(String[] args) throws IOException {
         Map<String, Integer> frequency = new HashMap<>();
         BufferedReader reader = new BufferedReader(new InputStreamReader(System.in));

         String line;
         while ((line = reader.readLine()) != null) {
             for (String word : line.split("\\W+")) {
                 // split() keeps a leading empty token when the line starts with
                 // a separator; it is not a word and must not be counted.
                 if (word.isEmpty()) {
                     continue;
                 }
                 String processed = word.toLowerCase();
                 Integer seen = frequency.get(processed);
                 frequency.put(processed, seen == null ? 1 : seen + 1);
             }
         }

         int mostFrequentlyUsed = 0;
         String theWord = null;
         for (Map.Entry<String, Integer> entry : frequency.entrySet()) {
             String word = entry.getKey();
             int count = entry.getValue();
             if (count > mostFrequentlyUsed) {
                 mostFrequentlyUsed = count;
                 theWord = word;
             } else if (count == mostFrequentlyUsed && word.length() < theWord.length()) {
                 // Every count is at least 1, so a tie can only occur after the
                 // first branch has already assigned theWord.
                 theWord = word;
             }
         }

         // No words at all: print nothing instead of failing on a null word.
         if (theWord != null) {
             // print, not printf: the word is data, not a format string.
             System.out.print(theWord);
         }
     }
 }
java arrays string oop bufferedreader
1个回答
1
投票

为了让代码以输入的格式打印最常用的单词,而不是小写字母,你可以修改下面一行代码。

String processed = word.toLowerCase();

把它改成:

String processed = word;

但要注意的是,containsKey() 方法是区分大小写的,因此不会把 "Thanks" 和 "thanks" 视为同一个词。


0
投票
Please find below a program that prints the word in upper or lower case based on the input.

import java.io.BufferedReader;
import java.io.IOException;
import java.io.InputStreamReader;
import java.util.HashMap;
import java.util.Map;

 /**
  * Finds the most frequent space-separated word on the first line of standard
  * input. Counting is case-sensitive. The program prints the word with its
  * count, then prints the word again with its case switched according to its
  * first character.
  */
 public class Main {

     /**
      * Program entry point. Prints nothing when there is no input line or the
      * line contains no words.
      *
      * @param args ignored
      * @throws IOException if reading standard input fails
      */
     public static void main(String[] args) throws IOException {
         BufferedReader reader = new BufferedReader(new InputStreamReader(System.in));
         String line = reader.readLine();
         if (line == null) {
             // End of input before any line was read.
             return;
         }

         Map<String, Integer> strMap = new HashMap<String, Integer>();
         for (String s : line.split(" ")) {
             // Consecutive or leading spaces produce empty tokens; skip them.
             if (s.isEmpty()) {
                 continue;
             }
             Integer seen = strMap.get(s);
             strMap.put(s, seen == null ? 1 : seen + 1);
         }
         if (strMap.isEmpty()) {
             return;
         }

         // Find the entry with the highest count.
         String result = null;
         int maxCount = 0;
         for (Map.Entry<String, Integer> itr : strMap.entrySet()) {
             if (itr.getValue() > maxCount) {
                 maxCount = itr.getValue();
                 result = itr.getKey();
             }
         }

         // Word together with its number of occurrences.
         System.out.println("word"+ result+"count"+ maxCount);

         printInLowerOrUpperCare(result);
     }

     /**
      * Prints {@code result} in upper case when its first character is an ASCII
      * lower-case letter ({@code 'a'}..{@code 'z'}), otherwise in lower case.
      * Prints nothing for a {@code null} or empty string.
      *
      * @param result the word to print; may be {@code null}
      */
     public static void printInLowerOrUpperCare(String result) {
         if (result == null || result.isEmpty()) {
             return;
         }
         char first = result.charAt(0);
         // The upper bound must be "<= 'z'"; the original tested ">= 'z'",
         // which made the upper-case branch unreachable for 'a'..'y'.
         if (first >= 'a' && first <= 'z') {
             System.out.println(result.toUpperCase());
         } else {
             System.out.println(result.toLowerCase());
         }
     }

 }
© www.soinside.com 2019 - 2024. All rights reserved.