哈夫曼编码/译码器
【问题描述】
利用哈夫曼编码进行信息通讯可以大大提高信道利用率,缩短信息 传输时间,降低传输成本。但是,这要求在发送端通过一个编码系统对 待传数据预先编码;在接收端将传来的数据进行译码(复原)。对于双 工信道(即可以双向传输信息的信道),每端都需要一个完整的编/译码 系统。试为这样的信息收发站写一个哈夫曼码的编译码系统。
vs2017环境
【基本要求】
一个完整的系统应具有以下功能:
(1)I:初始化(Initialization):从终端读入字符集大小n,及n个 字符和n个权值,建立哈夫曼树,并将它存于文件hfmtree中。
(2)C:编码(Coding ):利用已建好的哈夫曼树(如不在内存, 则从文件hfmtree中读入),对文件tobetrans中的正文进行编码,然后 将结果存入文件codefile中。
(3)D:译码(Decoding):利用已建好的哈夫曼树将文件codefile 中的代码进行译码,结果存入文件textfile中。
(4)P:打印代码文件(Print):将文件codefile以紧凑格式显示在终端 上,每行50个代码。同时将此字符形式的编码文件写入文件codeprint中。
(5)T:打印哈夫曼树(Tree printing):将已在内存中的哈夫曼树以 直观的方式(树或凹入表形式)显示在终端上,同时将此字符形式的哈夫 曼树写入文件treeprint中。
【测试数据】
(1)已知某系统在通信联络中只可能出现八种字符,其频率分别为 0.05,0.29,0.07,0.08,0.14,0.23,0.03,0.11,试设计哈夫曼编码。
(2)实现以下报文的编码和译码:“THIS PROGRAM IS MY FAVORITE”。
【实现提示】
(1)用户界面可以设计为“菜单”方式:显示上述功能符号,再加上 “E”,表示结束运行End,请用户键入一个选择功能符。此功能执行完毕 后再显示此菜单,直至某次用户选择了“E”为止。
(2)程序的一次执行过程中,第一次执行I、D或C命令之后,哈夫曼 树已经在内存了,不必再读入。每次执行中不一定执行I命令,因为文件 hfmtree可能早已建好。
【代码实现】
haffman.h
#define MaxValue 32767
#define MaxNode 10000
#include<iostream>
#include<fstream>
#include<string>
#include<iomanip>
typedef struct {
char data;
int weight;
int flag;
int parent;
int leftChild;
int rightChild;
}HaffNode;
typedef struct {
char bit[MaxNode];
int start;
int weight;
char data;
}Code;
void Haffman(int weight[], char str[], int n, HaffNode haffTree[])
{
int i, j, m1, m2, x1, x2;
for (i = 0; i < 2 * n - 1; i++) {
if (i < n) {
haffTree[i].weight = weight[i];
haffTree[i].data = str[i];
}
else {
haffTree[i].weight = 0;
haffTree[i].data = '0';
}
haffTree[i].parent = -1;
haffTree[i].flag = 0;
haffTree[i].leftChild = -1;
haffTree[i].rightChild = -1;
}
for (i = 0; i < n - 1; i++) {
m1 = m2 = MaxValue;
x1 = x2 = 0;
for (j = 0; j < n + i; j++) {
if (haffTree[j].weight < m1&&haffTree[j].flag == 0) {
m2 = m1;
x2 = x1;
m1 = haffTree[j].weight;
x1 = j;
}
else if (haffTree[j].weight < m2&&haffTree[j].flag == 0)
{
m2 = haffTree[j].weight;
x2 = j;
}
}
haffTree[x1].parent = n + i;
haffTree[x2].parent = n + i;
haffTree[x1].flag = haffTree[x2].flag = 1;
haffTree[n + i].weight = haffTree[x1].weight + haffTree[x2].weight;
haffTree[n + i].leftChild = x1;
haffTree[n + i].rightChild = x2;
}
}
void HaffmanCode(HaffNode haffTree[], int n, Code haffCode[])
{
Code *cd = (Code *)malloc(sizeof(Code));
int i, j, child, parent;
for (i = 0; i < n; i++) {
cd->start = n - 1;
cd->weight = haffTree[i].weight;
cd->data = haffTree[i].data;
child = i;
parent = haffTree[child].parent;
while (parent != -1) {
if (haffTree[parent].leftChild == child)
cd->bit[cd->start] = '0';
else
cd->bit[cd->start] = '1';
cd->start--;
child = parent;
parent = haffTree[child].parent;
}
for (j = cd->start + 1; j < n; j++)
haffCode[i].bit[j] = cd->bit[j];
haffCode[i].bit[j] = '\0';
haffCode[i].start = cd->start + 1;
haffCode[i].weight = cd->weight;
haffCode[i].data = cd->data;
}
}
haffman.cpp
#include<iostream>
#include<iomanip>
#include<cstdio>
#include<cstdlib>
#include<cstring>
#include<string>
#include<fstream>
#include"Haffman.h"
using namespace std;
ifstream input_file;
ofstream output_file;
int n, m = 0;
HaffNode *myHaffTree = (HaffNode *)malloc(sizeof(HaffNode)*(2 * MaxNode - 1));
Code *myHaffCode = (Code *)malloc(sizeof(Code)*MaxNode);
void Initialization() {
char str[MaxNode];
int weight[MaxNode];
cout << "请输入字符个数:" << endl;
cin >> n;
for (int i = 0; i < n; i++) {
cout << "请输入第" << i + 1 << "个字符以及相应的权值" << endl;
cin >> str[i] >> weight[i];
}
Haffman(weight, str, n, myHaffTree);
HaffmanCode(myHaffTree, n, myHaffCode);
for (int i = 0; i < n; i++) {
cout << myHaffCode[i].data << ": ";
for (int j = myHaffCode[i].start; j < n; j++) {
cout << myHaffCode[i].bit[j];
}
cout << endl;
}
output_file.open("hfmTree.txt");
if (!output_file) {
cout << "can't open file !" << endl;
return;
}
for (int i = 0; i < n; i++) {
output_file << "(" << myHaffTree[i].data << myHaffTree[i].weight << ")" << endl;
}
output_file.close();
cout << "哈夫曼树已创建完成,并且已放入hfmTree.txt中." << endl;
cout << endl << endl;
}
void Coding() {
cout << "请输入字符或字符串:" << endl;
string str;
string code;
cin >> str;
output_file.open("tobetran.txt");
if (!output_file) {
cout << "不能打开文件 !" << endl;
return;
}
output_file << str;
output_file.close();
output_file.open("codefile.txt");
if (!output_file) {
cout << "不能打开文件 !" << endl;
return;
}
for (int i = 0; i < str.size(); i++) {
for (int j = 0; j < n; j++) {
if (myHaffTree[j].data == str[i]) {
for (int k = myHaffCode[j].start; k < n; k++) {
output_file << myHaffCode[j].bit[k];
}
break;
}
}
}
output_file.close();
cout << "编码完毕,并且已经存入codefile.txt中!" << endl;
input_file.open("codefile.txt");
if (!input_file) {
cout << "不能打开文件 !" << endl;
return;
}
input_file >> code;
cout << "编码码值为:" << endl;
cout << code << endl;
input_file.close();
cout << endl << endl;
}
void Decoding() {
char s[MaxNode], s1[MaxNode];
int i, j, k, l, p;
input_file.open("codefile.txt");
if (!input_file) {
cout << "不能打开文件 !" << endl;
return;
}
input_file >> s;
input_file.close();
output_file.open("textfile.txt");
if (!output_file) {
cout << "不能打开文件 !" << endl;
return;
}
k = 0;
while (s[k] != '\0') {
for (i = 0; i < n; i++) {
l = k;
for (j = 0; j < strlen(myHaffCode[i].bit) - myHaffCode[i].start; j++, l++) {
s1[j] = s[l];
}
s1[j] = '\0';
for (p = myHaffCode[i].start, j = 0; p < n; p++, j++)
if (myHaffCode[i].bit[p] != s1[j]) break;
if (p == n) {
output_file << myHaffTree[i].data;
k += strlen(myHaffCode[i].bit) - myHaffCode[i].start;
break;
}
}
}
output_file.close();
input_file.open("textfile.txt");
if (!input_file) {
cout << "不能打开文件 !" << endl;
return;
}
input_file >> s;
cout << s << endl;
input_file.close();
cout << "译码结束,字符已经存入当前目录下 --> textfile.txt 文件中!" << endl;
cout << endl << endl;
}
void Print() {
char s[MaxNode], s1[MaxNode];
int i, j, k, l, p;
input_file.open("codefile.txt");
if (!input_file) {
cout << "不能打开文件 !" << endl;
return;
}
input_file >> s;
int icount = 0;
for (int i = 1; i < strlen(s) + 1; i++) {
cout << s[i - 1];
if (i % 50 == 0) cout << endl;
}
cout << endl;
input_file.close();
output_file.open("codeprint.txt");
k = 0;
while (s[k] != '\0') {
for (i = 0; i < n; i++) {
l = k;
for (j = 0; j < strlen(myHaffCode[i].bit) - myHaffCode[i].start; j++, l++) {
s1[j] = s[l];
}
s1[j] = '\0';
for (p = myHaffCode[i].start, j = 0; p < n; p++, j++)
if (myHaffCode[i].bit[p] != s1[j]) break;
if (p == n) {
output_file << myHaffTree[i].data;
k += strlen(myHaffCode[i].bit) - myHaffCode[i].start;
break;
}
}
}
output_file.close();
cout << "字符形式的编码文件写入当前目录下 --> codeprint中!" << endl;
cout << endl << endl;
}
void TreePrinting(HaffNode *myHaffTree1, HaffNode *myHaffTree2, int m) {
if (myHaffTree1 != myHaffTree2 - 1)
{
if (m)output_file.close();
output_file.open("treeprint.txt");
if (!output_file) {
cout << "不能打开文件 !" << endl;
return;
}
TreePrinting(myHaffTree2 + myHaffTree1->rightChild, myHaffTree2, m + 1);
cout << setw(4 * m) << myHaffTree1->weight << endl;
output_file << myHaffTree1->weight << endl;
TreePrinting(myHaffTree2 + myHaffTree1->leftChild, myHaffTree2, m + 1);
output_file.close();
}
}
int main() {
char ch;
while (1) {
cout << " *******************哈夫曼编/译码器****************" << endl;
cout << " *** I---初始化" << " C---编码 ***" << endl;
cout << " *** D---解码" << " P---打印 ***" << endl;
cout << " *** T---打印树" << " E---退出 ***" << endl;
cout << " ------------------------------------------" << endl;
cout << "请选择功能键:" << endl;
cin >> ch;
if (ch == 'I'|| ch=='i')
// 用户选择 初始化
Initialization();
else if (ch == 'C' || ch == 'c')
// 用户选择 编码
Coding();
else if (ch == 'D' || ch == 'd')
// 用户选择 解码
Decoding();
else if (ch == 'P' || ch == 'p')
// 用户选择 打印
Print();
else if (ch == 'T' || ch == 't') {
// 用户选择 打印树
TreePrinting(myHaffTree + 2 * n - 2, myHaffTree, 0);
cout << "此字符形式的哈夫曼树已写入当前目录下 --> treeprint中" << endl;
cout << endl << endl;
}
else if (ch == 'E')
// 用户选择 退出
break;
else
// 用户输入不合法 提示重新输入
cout << "不存在,请重新选择 !" << endl;
}
return 0;
}