1、主要数据类型与变量
1.1使用到的头文件
#include <iostream>
#include <cstdio>
#include <cstring>
#include <algorithm>
#include <map>
#include <queue>
#include <string>
#include <iterator>
#include <fstream>
1.2 使用类代替结构体,这里重载比较运算符,便于排序和构造优先队列。
class HTNode{
public:
char ch
;
int weight
;
HTNode
*left
;
HTNode
*right
;
HTNode(int weight
) : weight(weight
) {}
bool operator<(const HTNode
&htnode
) const{
return weight
> htnode
.weight
;
}
HTNode(char ch
, int weight
, HTNode
*left
, HTNode
*right
) : ch(ch
), weight(weight
), left(left
), right(right
) {}
HTNode(char ch
, int weight
) : ch(ch
), weight(weight
) {}
};
1.3函数结构说明
void CreateHuffmanTree(priority_queue
<HTNode
> &queue
);
priority_queue
<HTNode
> count(string s
);
void show(priority_queue
<HTNode
> q
);
string
readFile(string path
);
void writeFile(string path
,string data
);
void writeFile(string path
,char data
);
static map
<char,string
> huffmanCode
;
void getCodes(HTNode
*root
,string code
,string
&prefix
);
void printCode(map
<char,string
> codes
);
string
BecomeCode(map
<char,string
> codetTable
,string data
);
void deCode(map
<char,string
> codetTable
,string CodeData
);
2、算法或程序模块
2.1 程序流程解释: ①创建赫夫曼树:统计字符的频率由小到大放入优先队列,通过队列找出最小频率构建赫夫曼树。 ②生成赫夫曼编码和赫夫曼编码后的数据:通过递归遍历赫夫曼树,通过Map集合创建编码表,再使用编码表和源数据生成编码后的数据。 ③使用赫夫曼编码解码:通过查找编码后的数据配合编码表,通过查找方式输出对应的字符 核心函数解释 构造赫夫曼树:最小左右孩子的权重相加,生成父节点,然后父节点进队列
void CreateHuffmanTree(priority_queue
<HTNode
> &queue
){
while (queue
.size()>1){
HTNode
*left
= new HTNode(queue
.top()); queue
.pop();
HTNode
*right
= new HTNode(queue
.top()); queue
.pop();
HTNode
parent('R',left
->weight
+ right
->weight
,left
,right
);
queue
.push(parent
);
}
}
统计每个字符出现的频率:字符范围是ASCALL
:0-128
priority_queue
<HTNode
> count(string s
){
int a
[128] = {0};
priority_queue
<HTNode
> queue
;
for (int i
= 0; i
< s
.length();i
++) {
if (s
[i
] >= 0 && s
[i
] <= 127) { a
[s
[i
]]++; }
}
for (int i
= 0; i
< 128;i
++) {
if (a
[i
]!=0){
HTNode
*htNode
= new HTNode((char)i
,a
[i
]);
queue
.push(*htNode
);
}
}
return queue
;
}
这里使用了二叉树的DFS方法,进行递归搜索叶子节点,然后存入map编码表中
void getCodes(HTNode
*root
,string code
,string
&prefix
){
string s
=prefix
;
s
.append(code
);/通过append方法连接该节点的路径
if(root
){
if (root
->ch
==82){
getCodes(root
->left
,"0",s
);
getCodes(root
->right
,"1",s
);
}else{如果是叶子节点
huffmanCode
[root
->ch
] = s
;
}
}
}
编码:字符串的append追加函数来连接源数据对应的编码表
解码:双层循环移动指针来截取字符串,然后找到对应的编码表,输出字符到文件中
string
BecomeCode(map
<char,string
> codetTable
,string data
){
string res
="";
for (int i
= 0; i
< data
.length(); ++i
) {
res
.append(codetTable
[data
[i
]]);
}
...
}
void deCode(map
<char,string
> codetTable
,string CodeData
){
......
for (int i
= 0; i
< CodeData
.length(); ++i
) {
for (int j
= 0; j
< 10; ++j
) {
sub
= CodeData
.substr(i
,j
);
it
= codetTable
.begin();
while(it
!= codetTable
.end()){
if(sub
== it
->second
){
char s
= it
->first
;
cout
<<s
;
writeFile("D:\\解码文件.txt",s
);
i
= j
+ i
;
j
= 0;
break;
}
++it
;
......
通过路径读文件和写文件
string
readFile(string path
){
ifstream ifs
;
ifs
.open(path
,ios
::in
);
if (!ifs
.is_open())
{
cout
<< "文件打开失败" << endl
;return "";
}
string res
;
while (getline(ifs
, res
))
{
cout
<<"读取的信息为: "<< res
<< endl
;
}
ifs
.close();
return res
;
}
void writeFile(string path
,string data
)
{
ofstream
ofs(path
, ios
::out
);
ofs
<<data
<<endl
;
ofs
.close();
}
主程序main函数
int main(){
string s
= readFile("D:\\源文件.txt");
priority_queue
<HTNode
> queue
= count(s
);
show(queue
);
CreateHuffmanTree(queue
);
string bulid
="";
HTNode root
= queue
.top();
getCodes(&root
,"",bulid
);
printCode(huffmanCode
);
string res
= BecomeCode(huffmanCode
,s
);
writeFile("D:\\编码文件.txt",res
);
deCode(huffmanCode
,res
);
return 0;
}.
程序源代码
#include <iostream>
#include <cstdio>
#include <cstring>
#include <algorithm>
#include <map>
#include <queue>
#include <string>
#include <iterator>
#include <fstream>
using namespace std
;
class HTNode{
public:
char ch
;
int weight
;
HTNode
*left
;
HTNode
*right
;
HTNode(int weight
) : weight(weight
) {}
bool operator<(const HTNode
&htnode
) const{
return weight
> htnode
.weight
;
}
HTNode(char ch
, int weight
, HTNode
*left
, HTNode
*right
) : ch(ch
), weight(weight
), left(left
), right(right
) {}
HTNode(char ch
, int weight
) : ch(ch
), weight(weight
) {}
};
void CreateHuffmanTree(priority_queue
<HTNode
> &queue
);
priority_queue
<HTNode
> count(string s
);
void show(priority_queue
<HTNode
> q
);
string
readFile(string path
);
void writeFile(string path
,string data
);
void writeFile(string path
,char data
);
static map
<char,string
> huffmanCode
;
void getCodes(HTNode
*root
,string code
,string
&prefix
);
void printCode(map
<char,string
> codes
);
string
BecomeCode(map
<char,string
> codetTable
,string data
);
void deCode(map
<char,string
> codetTable
,string CodeData
);
void CreateHuffmanTree(priority_queue
<HTNode
> &queue
){
while (queue
.size()>1){
HTNode
*left
= new HTNode(queue
.top()); queue
.pop();
HTNode
*right
= new HTNode(queue
.top()); queue
.pop();
HTNode
parent('R',left
->weight
+ right
->weight
,left
,right
);
queue
.push(parent
);
}
}
priority_queue
<HTNode
> count(string s
){
int a
[128] = {0};
priority_queue
<HTNode
> queue
;
for (int i
= 0; i
< s
.length();i
++) {
if (s
[i
] >= 0 && s
[i
] <= 127) { a
[s
[i
]]++; }
}
for (int i
= 0; i
< 128;i
++) {
if (a
[i
]!=0){
HTNode
*htNode
= new HTNode((char)i
,a
[i
]);
queue
.push(*htNode
);
}
}
return queue
;
}
void show(priority_queue
<HTNode
> q
){
while(!q
.empty()){
HTNode node
= q
.top(); q
.pop();
cout
<<node
.ch
<<": "<<node
.weight
<<endl
;
}
}
void getCodes(HTNode
*root
,string code
,string
&prefix
){
string s
=prefix
;
s
.append(code
);
if(root
){
if (root
->ch
==82){
getCodes(root
->left
,"0",s
);
getCodes(root
->right
,"1",s
);
}else{
huffmanCode
[root
->ch
] = s
;
}
}
}
void printCode(map
<char,string
> codes
){
map
<char,string
>::const_iterator it
= codes
.begin();
while(it
!= codes
.end()){
cout
<<"符号: "<<it
->first
<<"编码:"<<it
->second
<<endl
;
++it
;
}
}
string
BecomeCode(map
<char,string
> codetTable
,string data
){
string res
="";
for (int i
= 0; i
< data
.length(); ++i
) {
res
.append(codetTable
[data
[i
]]);
}
return res
;
}
void deCode(map
<char,string
> codetTable
,string CodeData
){
map
<char,string
>::const_iterator it
;
string sub
="";
for (int i
= 0; i
< CodeData
.length(); ++i
) {
for (int j
= 0; j
< 10; ++j
) {
sub
= CodeData
.substr(i
,j
);
it
= codetTable
.begin();
while(it
!= codetTable
.end()){
if(sub
== it
->second
){
char s
= it
->first
;
cout
<<s
;
writeFile("解码文件.txt",s
);
i
= j
+ i
;
j
= 0;
break;
}
++it
;
}
}
}
}
string
readFile(string path
){
ifstream ifs
;
ifs
.open(path
,ios
::in
);
if (!ifs
.is_open())
{
cout
<< "文件打开失败" << endl
;return "";
}
string res
;
while (getline(ifs
, res
))
{
cout
<<"读取的信息为: "<< res
<< endl
;
}
ifs
.close();
return res
;
}
void writeFile(string path
,string data
)
{
ofstream
ofs(path
, ios
::out
);
ofs
<<data
<<endl
;
ofs
.close();
}
void writeFile(string path
,char data
)
{
ofstream
ofs(path
, ios
::app
);
ofs
<<data
;
ofs
.close();
}
int main(){
string s
= readFile("源文件.txt");
priority_queue
<HTNode
> queue
= count(s
);
show(queue
);
CreateHuffmanTree(queue
);
string bulid
="";
HTNode root
= queue
.top();
getCodes(&root
,"",bulid
);
printCode(huffmanCode
);
string res
= BecomeCode(huffmanCode
,s
);
writeFile("编码文件.txt",res
);
deCode(huffmanCode
,res
);
return 0;
}