利用哈夫曼树及哈夫曼编码来查询输入的字符的最少编码-C++技术网

利用哈夫曼树及哈夫曼编码来查询输入的字符的最少编码

更新时间：2016-04-11 21:06:44浏览次数：1+次

上个礼拜，一个同学需要我帮忙做一道哈夫曼的题目。该题目首先要根据输入的不同字符的个数，利用哈夫曼编码写出最优的编码方式。其次，还有一个什么要求，我忘了……不过我还是实现了统计输入字符的个数，并根据个数来生成最优的哈夫曼编码。
首先，对于本文的哈夫曼树及哈夫曼编码部分，需要感谢《哈夫曼编码与解码(C语言实现)》（http://touch-2011.iteye.com/blog/1058800）这篇文章的作者。虽然我直接复制之后不能运行，是在改动了一些地方之后才能运行的，不过总的来说，还是谢谢啦。
总的来说，哈夫曼树及哈夫曼编码体现的是同一个思想，核心就是算法问题。虽然我也懂主要的算法，但是实现起来特别坑……

先看看实现出来的吧：

对于本文的代码，你需要有一定的STL知识，可以到本站里面找相应的文章，我写了很多关于STL的文章。

下面我们先看代码：
#include <stdio.h>
#include "windows.h"
#include "iostream"
#include "algorithm"
#include "windows.h"
#include "vector"
#include "iterator"

using namespace std;


/* Capacity limits used by the Huffman structures and routines in this file. */
#define MAXBIT      100                 /* number of bit slots in one HCodeType */
#define MAXVALUE    10000               /* sentinel weight value */
#define MAXLEAF     30                  /* maximum number of leaf nodes */
/* A tree with MAXLEAF leaves has 2*MAXLEAF-1 nodes. The parentheses keep the
   expression intact when the macro is used inside a larger expression
   (e.g. 2 * MAXNODE). */
#define MAXNODE     (MAXLEAF*2 - 1)

/* One Huffman code: the bits live in bit[], and start is the index that
   marks where the stored code begins inside bit[]. */
struct HCodeType
{
    int bit[MAXBIT];    /* code bits, one int per bit */
    int start;          /* start marker of the code within bit[] */
};
/* One node of the Huffman tree. Links are indices into the node array;
   the code in this file uses -1 to mean "no such node". */
struct HNodeType
{
    int weight;     /* weight of the node */
    int parent;     /* index of the parent node */
    int lchild;     /* index of the left child */
    int rchild;     /* index of the right child */
};

/*
 * Build a Huffman tree in HuffNode[] from n leaf weights read from stdin.
 *
 * HuffNode  Node array. Entries [0, n) are the leaves; entries [n, 2n-1) are
 *           the internal nodes created by the merge rounds, so index 2n-2 is
 *           the last node created. Must be able to hold at least 2n-1 nodes.
 * n         Number of leaves. When n is outside 1..MAXLEAF nothing is read
 *           and the array is left untouched (a message is printed on stderr
 *           when n is too large), so callers should validate n themselves.
 *
 * For every leaf a prompt is printed and one integer weight is read. Every
 * merge round prints the weights of the two nodes it combined.
 */
void HuffmanTree (HNodeType HuffNode[MAXNODE],  int n)
{
    /* i, j: loop counters.
       x1, x2: indices of the lightest and second-lightest parentless nodes
       found in the current merge round (-1 while none has been found). */
    int i, j;
    int x1, x2;

    if (n < 1)
        return;
    if (n > MAXLEAF)
    {
        /* 2n-1 nodes would not fit into an array of MAXNODE entries. */
        fprintf (stderr, "HuffmanTree: %d leaves exceed the limit of %d\n", n, MAXLEAF);
        return;
    }

    /* Reset every node that will be used: no weight, no parent, no children. */
    for (i=0; i<2*n-1; i++)
    {
        HuffNode[i].weight = 0;
        HuffNode[i].parent = -1;
        HuffNode[i].lchild = -1;
        HuffNode[i].rchild = -1;
    }

    /* Read the weight of each of the n leaves. */
    for (i=0; i<n; i++)
    {
        printf ("Please input weight of leaf node %d: \n", i);
        if (scanf_s("%d", &HuffNode[i].weight) != 1)
        {
            /* Unreadable input: keep the leaf at its initial weight. */
            HuffNode[i].weight = 0;
        }
    }

    /* n-1 merge rounds; round i creates internal node n+i. */
    for (i=0; i<n-1; i++)
    {
        /* Track the two lightest parentless nodes by index rather than by a
           sentinel weight, so nodes of any weight can be selected. */
        x1 = x2 = -1;
        for (j=0; j<n+i; j++)
        {
            if (HuffNode[j].parent != -1)
                continue;       /* already merged into a subtree */

            if (x1 == -1 || HuffNode[j].weight < HuffNode[x1].weight)
            {
                x2 = x1;        /* previous lightest becomes second lightest */
                x1 = j;
            }
            else if (x2 == -1 || HuffNode[j].weight < HuffNode[x2].weight)
            {
                x2 = j;
            }
        }

        /* Round i always has n-i >= 2 parentless nodes, so x1 and x2 are
           both valid here. Link them under the new node n+i. */
        HuffNode[x1].parent  = n+i;
        HuffNode[x2].parent  = n+i;
        HuffNode[n+i].weight = HuffNode[x1].weight + HuffNode[x2].weight;
        HuffNode[n+i].lchild = x1;
        HuffNode[n+i].rchild = x2;

        /* Trace output of the two merged weights. */
        printf ("x1.weight and x2.weight in round %d: %d, %d\n", i+1, HuffNode[x1].weight, HuffNode[x2].weight);
        printf ("\n");
    }
}

int main()
{
    HNodeType HuffNode[MAXNODE];            /* 定义一个结点结构体数组 */
    HCodeType HuffCode[MAXLEAF],  cd;       /* 定义一个编码结构体数组， 同时定义一个临时变量来存放求解编码时的信息 */
    int i, j, c, p, n;
    char cha;
	cout<<"请输入你想统计的字符的个数:"<<endl;
	cin>>cha;

	vector<char> coll;
	copy(std::istream_iterator<char>(cin),std::istream_iterator<char>(),back_inserter(coll));
	n=count(coll.begin(),coll.end(),cha);//利用STL中的count函数统计个数......
	cout<<"字符的个数有："<<n<<endl;

    HuffmanTree (HuffNode, n);
    
    for (i=0; i < n; i++)
    {
        cd.start = n-1;
        c = i;
        p = HuffNode[c].parent;
        while (p != -1)   /* 父结点存在 */
        {
            if (HuffNode[p].lchild == c)
                cd.bit[cd.start] = 0;
            else
                cd.bit[cd.start] = 1;
            cd.start--;        /* 求编码的低一位 */
            c=p;                    
            p=HuffNode[c].parent;    /* 设置下一循环条件 */
        } /* end while */
        
        /* 保存求出的每个叶结点的哈夫曼编码和编码的起始位 */
        for (j=cd.start+1; j<n; j++)
        { HuffCode[i].bit[j] = cd.bit[j];}
        HuffCode[i].start = cd.start;
    } /* end for */
    
    /* 输出已保存好的所有存在编码的哈夫曼编码 */
    for (i=0; i<n; i++)
    {
        printf ("%d 's Huffman code is: ", i);
        for (j=HuffCode[i].start+1; j < n; j++)
        {
            printf ("%d", HuffCode[i].bit[j]);
        }
        printf ("\n");
    }
	system("pause");

    return 0;
}