使用赫夫曼编码压缩及解压文件

压缩文件

代码展示

节点类

package demo9;

/**
 * A node of a Huffman tree.
 *
 * <p>A leaf carries the byte it stands for in {@link #data}; an internal node has
 * {@code data == null} and owns two children. {@link #weight} is the number of
 * occurrences represented by the node (for an internal node, the sum of its children).
 *
 * <p>The natural ordering is by <em>descending</em> weight, so after sorting a list the
 * lightest nodes are found at its end. The ordering looks at the weight only and is
 * therefore not consistent with {@code equals}.
 */
public class Node implements Comparable<Node> {
    /** The byte represented by a leaf, or {@code null} for an internal node. */
    Byte data;
    /** Occurrence count of this node (sum of the children for an internal node). */
    int weight;
    /** Left child; {@code null} for a leaf. */
    Node left;
    /** Right child; {@code null} for a leaf. */
    Node right;

    /**
     * Creates a node without children.
     *
     * @param data   the byte this node represents, or {@code null} for an internal node
     * @param weight the occurrence count of the node
     */
    public Node(Byte data, int weight) {
        this.data = data;
        this.weight = weight;
    }

    @Override
    public String toString() {
        return "Node{" + "data=" + data + ", weight=" + weight + '}';
    }

    /**
     * Compares by weight in descending order (heavier nodes sort first).
     *
     * @param o the node to compare with
     * @return a negative value if this node is heavier than {@code o}, zero if both weigh
     *         the same, a positive value if this node is lighter
     */
    @Override
    public int compareTo(Node o) {
        // Integer.compare cannot overflow, unlike subtracting the two weights.
        return Integer.compare(o.weight, this.weight);
    }
}

测试类

package demo9;

import java.io.*;
import java.util.*;

public class TestHuffmanCode {

    public static void main(String[] args) {

        String src="1.jpg";
        String dst="2.zip";
        try {
            zipFile(src,dst);
        } catch (IOException e) {
            e.printStackTrace();
        }
    }

    /**
     *  压缩文件
     * @param src
     * @param dst
     * @throws IOException
     */
    public static void zipFile(String src, String dst) throws IOException {
        //创建一个输入流
        InputStream is = new FileInputStream(src);
        //创建一个和输入流指向的文件大小一样的byte数组
        byte[] b = new byte[is.available()];
        //读取文件内容
        is.read(b);
        is.close();
        //使用赫夫曼编码进行编码
        byte[] byteZip = huffmanZip(b);
        //输出流
        OutputStream os = new FileOutputStream(dst);
        ObjectOutputStream oos = new ObjectOutputStream(os);
        //把压缩后的byte数组写入文件
        oos.writeObject(byteZip);
        //把赫夫曼编码表写入文件
        oos.writeObject(huffCodes);
        oos.close();
        os.close();

    }

    /**
     * 使用指定的赫夫曼编码表进行解码
     * @param huffCodes
     * @param bytes
     * @return
     */
    private static byte[] decode(Map huffCodes, byte[] bytes) {
        StringBuilder sb = new StringBuilder();
        //把byte数组转为一个二进制的字符串
        for(int i=0;i map = new HashMap<>();
        for(Map.Entry entry:huffCodes.entrySet()){
            map.put(entry.getValue(),entry.getKey());
        }
        //创建一个集合,用于存byte
        List list = new ArrayList<>();
        //处理字符串
        for(int i=0;i nodes = getNodes(bytes);
        //创建一棵赫夫曼树
        Node tree = createHuffmanTree(nodes);
        //创建一个赫夫曼编码表
        Map huffCodes = getCodes(tree);
        //编码
        byte[] b = zip(bytes,huffCodes);
        return b;
    }

    /**
     * 进行赫夫曼编码
     * @param bytes
     * @param huffCodes
     * @return
     */
    private static byte[] zip(byte[] bytes, Map huffCodes) {
        StringBuilder sb =new StringBuilder();
        //把需要压缩的byte数组处理成一个二进制的字符串
        for(byte b:bytes){
            sb.append(huffCodes.get(b));
        }
        //定义长度
        int len;
        if(sb.length()%8==0){
            len=sb.length()/8+1;
        }else{
            len=sb.length()/8+1;
        }
//        System.out.println(sb.toString());
        //用于存储压缩后的byte
        byte[] by = new byte[len];
        //记录新byte的位置
        int index = 0;
        for(int i=0;isb.length()){
                strByte = sb.substring(i);
            }else{
                strByte = sb.substring(i, i+8);
            }
            byte byt = (byte)Integer.parseInt(strByte,2);
//            System.out.println(strByte+":"+byt);
            by[index]=byt;
            index++;
        }
        return by;
    }

    //用于临时存储路径
    static StringBuilder sb = new StringBuilder();
    //用于存储赫夫曼编码
    static Map huffCodes = new HashMap<>();
    /**
     * 根据赫夫曼树获取赫夫曼编码
     * @param tree
     * @return
     */
    private static Map getCodes(Node tree) {
        if(tree==null){
            return null;
        }
        getCodes(tree.left,"0",sb);
        getCodes(tree.right,"1",sb);
        return huffCodes;
    }

    private static void getCodes(Node node, String code, StringBuilder sb) {
        StringBuilder sb2 = new StringBuilder(sb);
        sb2.append(code);
        if(node.data==null){
            getCodes(node.left,"0",sb2);
            getCodes(node.right,"1",sb2);
        }else{
            huffCodes.put(node.data,sb2.toString());
        }
    }

    /**
     * 创建赫夫曼树
     * @param nodes
     * @return
     */
    private static Node createHuffmanTree(List nodes) {
        while(nodes.size()>1){
        //排序
        Collections.sort(nodes);
        //取出两个权值最低的二叉树
        Node left = nodes.get(nodes.size()-1);
        Node right = nodes.get(nodes.size()-2);
        //创建一棵新的二叉树
        Node parent = new Node(null,left.weight+right.weight);
        //把之前取出来的两棵二叉树设置为新创建的二叉树的子树
        parent.left=left;
        parent.right=right;
        //把前面取出来的两棵二叉树删除
        nodes.remove(left);
        nodes.remove(right);
        //把新创建的二叉树放入集合中
        nodes.add(parent);
        }
        return nodes.get(0);
    }

    /**
     * 把byte数组转为node集合
     * @param bytes
     * @return
     */
    private static List getNodes(byte[] bytes) {
    List nodes = new ArrayList<>();
    Map counts = new HashMap<>();
    //统计每一个byte出现的次数
    for(byte b:bytes){
        Integer count = counts.get(b);
        if(count==null){
            counts.put(b,1);
        }else{
            counts.put(b,count+1);
        }
    }
    //把每一个键值对转为一个node对象
    for(Map.Entry entry:counts.entrySet()){
        nodes.add(new Node(entry.getKey(),entry.getValue()));
    }
    return nodes;
    }
}

解压文件

代码展示

节点类

package demo9;

/**
 * A node of a Huffman tree.
 *
 * <p>A leaf carries the byte it stands for in {@link #data}; an internal node has
 * {@code data == null} and owns two children. {@link #weight} is the number of
 * occurrences represented by the node (for an internal node, the sum of its children).
 *
 * <p>The natural ordering is by <em>descending</em> weight, so after sorting a list the
 * lightest nodes are found at its end. The ordering looks at the weight only and is
 * therefore not consistent with {@code equals}.
 */
public class Node implements Comparable<Node> {
    /** The byte represented by a leaf, or {@code null} for an internal node. */
    Byte data;
    /** Occurrence count of this node (sum of the children for an internal node). */
    int weight;
    /** Left child; {@code null} for a leaf. */
    Node left;
    /** Right child; {@code null} for a leaf. */
    Node right;

    /**
     * Creates a node without children.
     *
     * @param data   the byte this node represents, or {@code null} for an internal node
     * @param weight the occurrence count of the node
     */
    public Node(Byte data, int weight) {
        this.data = data;
        this.weight = weight;
    }

    @Override
    public String toString() {
        return "Node{" + "data=" + data + ", weight=" + weight + '}';
    }

    /**
     * Compares by weight in descending order (heavier nodes sort first).
     *
     * @param o the node to compare with
     * @return a negative value if this node is heavier than {@code o}, zero if both weigh
     *         the same, a positive value if this node is lighter
     */
    @Override
    public int compareTo(Node o) {
        // Integer.compare cannot overflow, unlike subtracting the two weights.
        return Integer.compare(o.weight, this.weight);
    }
}

测试类

package demo9;

import java.io.*;
import java.util.*;

public class TestHuffmanCode {

    public static void main(String[] args) {
    
		//压缩文件 
//        String src="1.bmp";
//        String dst="2.zip";
//        try {
//            zipFile(src,dst);
//        } catch (IOException e) {
//            e.printStackTrace();
//        }
        //解压文件
        try {
            unZip("2.zip","3.bmp");
        } catch (Exception e) {
            e.printStackTrace();
        }
    }

        /**
     * 文件的解压
     * @param src
     * @param dst
     */
    public static void unZip(String src, String dst) throws Exception {
        //创建一个输入流
        InputStream is = new FileInputStream("2.zip");
        ObjectInputStream ois = new ObjectInputStream(is);
        //读取byte数组
        byte[] b = (byte[]) ois.readObject();
        //读取赫夫曼编码表
        Map codes = (Map) ois.readObject();
        ois.close();
        is.close();
        //解码
        byte[] bytes = decode(codes, b);
        //创建一个输出流
        OutputStream os = new FileOutputStream(dst);
        //写出数据
        os.write(bytes);
        os.close();
    }

    /**
     *  压缩文件
     * @param src
     * @param dst
     * @throws IOException
     */
    public static void zipFile(String src, String dst) throws IOException {
        //创建一个输入流
        InputStream is = new FileInputStream(src);
        //创建一个和输入流指向的文件大小一样的byte数组
        byte[] b = new byte[is.available()];
        //读取文件内容
        is.read(b);
        is.close();
        //使用赫夫曼编码进行编码
        byte[] byteZip = huffmanZip(b);
        //输出流
        OutputStream os = new FileOutputStream(dst);
        ObjectOutputStream oos = new ObjectOutputStream(os);
        //把压缩后的byte数组写入文件
        oos.writeObject(byteZip);
        //把赫夫曼编码表写入文件
        oos.writeObject(huffCodes);
        oos.close();
        os.close();

    }


    /**
     * 使用指定的赫夫曼编码表进行解码
     * @param huffCodes
     * @param bytes
     * @return
     */
    private static byte[] decode(Map huffCodes, byte[] bytes) {
        StringBuilder sb = new StringBuilder();
        //把byte数组转为一个二进制的字符串
        for(int i=0;i map = new HashMap<>();
        for(Map.Entry entry:huffCodes.entrySet()){
            map.put(entry.getValue(),entry.getKey());
        }
        //创建一个集合,用于存byte
        List list = new ArrayList<>();
        //处理字符串
        for(int i=0;i nodes = getNodes(bytes);
        //创建一棵赫夫曼树
        Node tree = createHuffmanTree(nodes);
        //创建一个赫夫曼编码表
        Map huffCodes = getCodes(tree);
        //编码
        byte[] b = zip(bytes,huffCodes);
        return b;
    }

    /**
     * 进行赫夫曼编码
     * @param bytes
     * @param huffCodes
     * @return
     */
    private static byte[] zip(byte[] bytes, Map huffCodes) {
        StringBuilder sb =new StringBuilder();
        //把需要压缩的byte数组处理成一个二进制的字符串
        for(byte b:bytes){
            sb.append(huffCodes.get(b));
        }
        //定义长度
        int len;
        if(sb.length()%8==0){
            len=sb.length()/8+1;
        }else{
            len=sb.length()/8+1;
        }
//        System.out.println(sb.toString());
        //用于存储压缩后的byte
        byte[] by = new byte[len];
        //记录新byte的位置
        int index = 0;
        for(int i=0;isb.length()){
                strByte = sb.substring(i);
            }else{
                strByte = sb.substring(i, i+8);
            }
            byte byt = (byte)Integer.parseInt(strByte,2);
//            System.out.println(strByte+":"+byt);
            by[index]=byt;
            index++;
        }
        return by;
    }

    //用于临时存储路径
    static StringBuilder sb = new StringBuilder();
    //用于存储赫夫曼编码
    static Map huffCodes = new HashMap<>();
    /**
     * 根据赫夫曼树获取赫夫曼编码
     * @param tree
     * @return
     */
    private static Map getCodes(Node tree) {
        if(tree==null){
            return null;
        }
        getCodes(tree.left,"0",sb);
        getCodes(tree.right,"1",sb);
        return huffCodes;
    }

    private static void getCodes(Node node, String code, StringBuilder sb) {
        StringBuilder sb2 = new StringBuilder(sb);
        sb2.append(code);
        if(node.data==null){
            getCodes(node.left,"0",sb2);
            getCodes(node.right,"1",sb2);
        }else{
            huffCodes.put(node.data,sb2.toString());
        }
    }

    /**
     * 创建赫夫曼树
     * @param nodes
     * @return
     */
    private static Node createHuffmanTree(List nodes) {
        while(nodes.size()>1){
        //排序
        Collections.sort(nodes);
        //取出两个权值最低的二叉树
        Node left = nodes.get(nodes.size()-1);
        Node right = nodes.get(nodes.size()-2);
        //创建一棵新的二叉树
        Node parent = new Node(null,left.weight+right.weight);
        //把之前取出来的两棵二叉树设置为新创建的二叉树的子树
        parent.left=left;
        parent.right=right;
        //把前面取出来的两棵二叉树删除
        nodes.remove(left);
        nodes.remove(right);
        //把新创建的二叉树放入集合中
        nodes.add(parent);
        }
        return nodes.get(0);
    }

    /**
     * 把byte数组转为node集合
     * @param bytes
     * @return
     */
    private static List getNodes(byte[] bytes) {
    List nodes = new ArrayList<>();
    Map counts = new HashMap<>();
    //统计每一个byte出现的次数
    for(byte b:bytes){
        Integer count = counts.get(b);
        if(count==null){
            counts.put(b,1);
        }else{
            counts.put(b,count+1);
        }
    }
    //把每一个键值对转为一个node对象
    for(Map.Entry entry:counts.entrySet()){
        nodes.add(new Node(entry.getKey(),entry.getValue()));
    }
    return nodes;
    }
}

你可能感兴趣的:(数据结构和算法)