1109 综合实验:文件操作与字符处理
时间限制:4000MS 代码长度限制:10KB
提交次数:6265 通过次数:1646
题型: 填空题 语言: GCC
Description
在当前目录中存在文件名为"case1.in"(其中case后为数字1,不是字母l,写错提交后会判错)的文本文件, 其内容为一篇英文文章(以EOF作为结束标志)。现要求读取该文本文件内容,统计文章中每个单词出现的次数, 并输出出现次数最多的前5个单词及其出现次数(按出现次数由多到少的顺序输出,次数相同时按字典顺序输出, 不足5个单词时,按序输出全部单词)。程序中注意如下细节: (1) 空格、标点符号与回车符起到分隔单词的作用; (2) 文章一行的末尾可能有连字符,出现连字符时,该行最末的字符串与下行最先出现的字符串构成一个单词; (3) 名词缩写算一个单词; (4) 数字不算单词; (5) 单词不区分大小写; (6) 输出时单词全使用小写。
#include "stdio.h"
#include "math.h"
#include "string.h"
#include "stdlib.h"
_______________________
main()
{
_______________________
}
输入格式
文件case1.in中一篇英文文章,包含多段文字,单词数不超过10000,每个单词不超过20个字符
输出格式
按题意输出答案
输入样例
(如case1.in内容如下) I am a student. My school is SCAU. It is a beau- tiful university. I like it.
输出样例
a 2
i 2
is 2
it 2
am 1
#include <stdio.h>
#include <stdlib.h>
#include <string.h>
/*
 * One entry of the word-frequency table.
 *
 * The typedef makes the bare name `word` usable as a type in C as well as
 * in C++; without it, declarations such as `word dictionary[10000];` are
 * rejected by a C compiler because a struct tag alone is not a type name.
 */
typedef struct word
{
    char string[21]; /* NUL-terminated word text (at most 20 characters) */
    int number;      /* how many times the word has been counted */
} word;
/* Table of distinct words recorded so far; addWord appends new entries at
 * index wordsNumber, so only the first wordsNumber slots hold data. */
word dictionary[10000];
/* Number of dictionary slots currently in use. */
int wordsNumber = 0;
/*
 * Counts one occurrence of `word` in the global dictionary.
 *
 * If the word is already present its counter is incremented; otherwise a
 * new entry with a count of 1 is appended.
 *
 * word: NUL-terminated text to record. A NULL or empty string is ignored.
 *       Text longer than an entry can hold is truncated to the entry size
 *       before lookup, so repeated long words still map to one entry.
 *
 * When the dictionary is already full, unseen words are dropped instead of
 * being written past the end of the table.
 */
void addWord(char word[21])
{
    char key[sizeof dictionary[0].string];

    if (word == NULL || word[0] == '\0')
        return;

    /* Bounded copy: always NUL-terminated, never longer than an entry. */
    snprintf(key, sizeof key, "%s", word);

    for (int i = 0; i < wordsNumber; i++)
    {
        if (strcmp(dictionary[i].string, key) == 0)
        {
            dictionary[i].number++;
            return;
        }
    }

    /* No free slot left: refuse to write past the end of the table. */
    if (wordsNumber >= (int)(sizeof dictionary / sizeof dictionary[0]))
        return;

    /* key is guaranteed to fit, so a plain strcpy cannot overflow here. */
    strcpy(dictionary[wordsNumber].string, key);
    dictionary[wordsNumber].number = 1;
    wordsNumber++;
}
void getMostFiveWordsAndPrint()
{
for (int i = 0; i < wordsNumber - 1; i++)
for (int j = 0; j < wordsNumber - 1 - i; j++)
if (dictionary[j].number < dictionary[j + 1].number || dictionary[j].number == dictionary[j + 1].number && strcmp(dictionary[j].string, dictionary[j + 1].string) > 0)
{
word t = dictionary[j];
dictionary[j] = dictionary[j + 1];
dictionary[j + 1] = t;
}
for (int i = 0; i < (wordsNumber >= 5 ? 5 : wordsNumber); i++)
printf("%s %d\n", dictionary[i].string, dictionary[i].number);
}
/* Longest word kept in the scan buffer; extra letters are discarded. */
enum { MAX_WORD_LENGTH = 20 };

/* Returns non-zero when c is an ASCII letter. */
static int isLetter(int c)
{
    return (c >= 'a' && c <= 'z') || (c >= 'A' && c <= 'Z');
}

/* Appends c, folded to lower case, to the pending word if room remains. */
static void appendLetter(char *buffer, int *length, int c)
{
    if (c >= 'A' && c <= 'Z')
        c = c - 'A' + 'a';
    if (*length < MAX_WORD_LENGTH)
        buffer[(*length)++] = (char)c;
}

/* Hands the pending word (if any) to addWord and empties the buffer. */
static void flushWord(char *buffer, int *length)
{
    if (*length == 0)
        return;
    buffer[*length] = '\0';
    addWord(buffer);
    *length = 0;
}

/*
 * Reads "case1.in", splits it into lower-cased words made of ASCII letters
 * and prints the most frequent ones via getMostFiveWordsAndPrint.
 *
 * Every non-letter character separates words. A '-' that directly follows
 * a word and is itself followed by a newline joins that word with the
 * letters that start the next non-empty line; any other '-' is a plain
 * separator.
 *
 * Returns 0 in all cases, including when the input file cannot be opened
 * (nothing is printed then).
 */
int main(void)
{
    FILE *file = fopen("case1.in", "r");
    if (file == NULL)
        return 0;

    char buffer[MAX_WORD_LENGTH + 1];
    int length = 0;
    int ch; /* int, not char: fgetc's EOF must stay distinct from any byte */

    while ((ch = fgetc(file)) != EOF)
    {
        if (isLetter(ch))
        {
            appendLetter(buffer, &length, ch);
            continue;
        }

        /* Separator with no pending word: nothing to do. */
        if (length == 0)
            continue;

        if (ch == '-')
        {
            ch = fgetc(file);
            if (ch == '\n')
            {
                /* Hyphen at end of line: skip the line break(s). */
                do
                    ch = fgetc(file);
                while (ch == '\n');

                if (isLetter(ch))
                {
                    /* The word continues; keep collecting in the main loop
                     * so a further end-of-line hyphen is handled as well. */
                    appendLetter(buffer, &length, ch);
                    continue;
                }
            }
            else if (isLetter(ch))
            {
                /* Hyphen inside a line: it separates two words. */
                flushWord(buffer, &length);
                appendLetter(buffer, &length, ch);
                continue;
            }

            if (ch == EOF)
                break;
        }

        flushWord(buffer, &length);
    }

    /* The file may end right after a word without a trailing separator. */
    flushWord(buffer, &length);

    fclose(file);
    getMostFiveWordsAndPrint();
    return 0;
}