// The complete source code follows.
#include <ctype.h>
#include <limits.h>
#include <stdio.h>
#include <stdlib.h>
#include <string.h>

#include <iostream>
#include <string>
// Size in bytes of every word buffer, terminating NUL included.
#define N 50

// One node of the binary search tree that holds the word statistics.
struct BiTNode
{
    char data[N];            // the word kept at this node (NUL-terminated)
    int count;               // how many times the word has been inserted
    struct BiTNode *lChild;  // subtree of words ordered before this one
    struct BiTNode *rChild;  // subtree of words ordered after this one
};

typedef struct BiTNode BiTNode;  // node type
typedef struct BiTNode *BiTree;  // handle to a (sub)tree; NULL means empty
// Scans pBuf from index start (end is the exclusive limit) for the next run of
// letters, copies it into word and returns the index where scanning stopped.
int GetWord(int start, int end, char *pBuf, char *word);

// Adds item to the binary search tree rooted at T, or bumps the count of the
// node that already holds it.
void CreateSearchTree(char *item, BiTree &T);

// Visits the tree in order and prints every word with its count, both to pf
// and to standard output.
void InOrderAndPrint(BiTree T, FILE *pf);

// Running total of words; GetWord increments it.
int sum = 0;

// File-scope scratch buffers, each the size of one word buffer.
char temp1[N], temp2[N];
int main()
{ while(1){
//获取输入文件名
char fileName[30];
memset(fileName,0,sizeof(fileName));
printf("请输入查找的文件名(例:example.txt): ");
scanf("%s",fileName);
//打开需要统计词汇的文件
FILE* pf;
pf=fopen(fileName,"rb");
if(pf==NULL)
{
printf("找不到文件!无法打开文件\n");
return false;
}
printf("* * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * \n");
printf("成功打开文件--- %s !\n\n",fileName);
printf("* * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * * \n");
printf("原文内容为:\n");
//读取文件
fseek(pf,0,SEEK_END);
int len=ftell(pf);
rewind(pf);
char *pBuf=new char[len+1];
pBuf[len]=0;
fread(pBuf,1,len,pf);
fclose(pf);
//读取单词
printf("%s\n",pBuf);
printf("*****************************************************************************\n\n");
printf("将统计写入文件(如:1.txt )\n");
int i=0;
char word[N];
BiTree T=NULL;
while(i<len)
{
i=GetWord(i,len,pBuf,word);
if(strlen(word)==0)
{
break;
}
CreateSearchTree(word,T);
}
//写入文件并显示在屏幕上
memset(fileName,0,sizeof(fileName));
printf("请输入写出文件名 : ");
scanf("%s",fileName);
pf=fopen(fileName,"w");
if(pf==NULL)
{
printf("不能写入文件!");
return false;
}
printf("******************************************************************************\n");
fprintf(pf,"\t\t词频统计结果: \n");
printf("\t\t词频统计结果:\n");
fprintf(pf,"*********************************************************\n");
InOrderAndPrint(T,pf);
fprintf(pf,"*********************************************************\n");
fprintf(pf,"这篇文章单词总数: %d\n",sum);
printf("这篇文章单词总数:%d\n",sum);
fclose(pf);
printf("******************************************************************************\n");
printf("统计结果写入文件 --- %s !\n\n",fileName);
}
return 0;
}
//词汇
int GetWord(int start,int end,char* pBuf,char* word)
{
int i;
int j=0;
memset(word,0,sizeof(char));
for(i=start;i<end;i++)
{
if(isalpha(pBuf[i]))
{
word[j]=pBuf[i];
j++;
}
else
{
if(j==0)
{
continue;
}
word[j]='\0';
j=0;
sum++;
break;
}
}
return i;
}
//创建二叉树进行查找
void CreateSearchTree(char* item,BiTree& T)
{
strcpy(temp1,item);
temp1[0]=tolower(item[0]);
if(T==NULL)
{
T=(BiTree)malloc(sizeof(BiTNode));
strcpy(T->data,item);
T->count=1;
T->lChild=NULL;
T->rChild=NULL;
}
else
{
strcpy(temp2,T->data);
temp2[0]=tolower(T->data[0]);
if(strcmp(temp1,temp2)==-1)
{
CreateSearchTree(item,T->lChild);
}
else if(strcmp(temp1,temp2)==1)
{
CreateSearchTree(item,T->rChild);
}
else
{
T->count++;
}
}
}
// In-order traversal of the word tree: for every node, after its left subtree
// and before its right subtree, writes the node's word and count to pf and
// prints the same line to standard output.
void InOrderAndPrint(BiTree T,FILE* pf)
{
    // The right subtree is reached by advancing T rather than by a second
    // recursive call; the visiting order is unchanged.
    for(;T!=NULL;T=T->rChild)
    {
        InOrderAndPrint(T->lChild,pf);
        fprintf(pf,"出现的词汇:%-30s 频率:%-9d\t\n",T->data,T->count);
        printf("出现的词汇:%-30s 频率:%-9d\t\n",T->data,T->count);
    }
}