25.18 (Compress a file) Write a program that compresses a source file into a target file using the Huffman coding method. First use ObjectOutputStream to output the Huffman codes into the target file, and then use BitOutputStream in
Programming Exercise 17.17 to output the encoded binary contents to the tar-
get file. Pass the files from the command line using the following command:
java Exercise25_18 sourcefile targetfile.
Programming Exercise 17.17 to output the encoded binary contents to the tar-
get file. Pass the files from the command line using the following command:
java Exercise25_18 sourcefile targetfile.
import java.io.BufferedInputStream; import java.io.DataInputStream; import java.io.DataOutputStream; import java.io.File; import java.io.FileInputStream; import java.io.FileNotFoundException; import java.io.FileOutputStream; import java.io.IOException; import java.io.ObjectOutputStream; import java.util.ArrayList; public class Exercise25_18 { public static void main(String[] args) throws IOException { if (args.length != 2) { System.out.println("Usage: java Exercise25_18 sourceFile targetFile"); System.exit(1); } File sourceFile = new File(args[0]); if (!sourceFile.exists()) { System.out.println("File " + args[0] + " does not exist"); System.exit(2); } DataInputStream sourceFileStream = new DataInputStream(new BufferedInputStream(new FileInputStream(sourceFile))); int size = sourceFileStream.available(); byte[] b = new byte[size]; sourceFileStream.read(b); sourceFileStream.close(); String text = new String(b); int[] counts = getCharacterFrequency(text); Tree tree = getHuffmanTree(counts); String[] codes = getCode(tree.root); StringBuilder result = new StringBuilder(); for (int i = 0; i < text.length(); i++) { result.append(codes[text.charAt(i)]); } ObjectOutputStream codesOutput = new ObjectOutputStream(new FileOutputStream(args[1])); codesOutput.writeObject(codes); codesOutput.writeInt(result.length()); codesOutput.close(); BitOutputStream output = new BitOutputStream(new File(args[1])); output.writeBit(result.toString()); output.close(); } static class BitOutputStream { private ArrayList<Integer> bits = new ArrayList<>(); private DataOutputStream output; public BitOutputStream(File file) throws FileNotFoundException { output = new DataOutputStream(new FileOutputStream(file, true)); } public void writeBit(char bit) throws IOException { if (bit == '0') { bits.add(0); } else { bits.add(1); } if (bits.size() == 8) { output.writeByte(getByte()); bits.clear(); } } public void writeBit(String bit) throws IOException { for (int i = 0; i < bit.length(); i++) { writeBit(bit.charAt(i)); } } public void close() throws IOException { while(bits.size() != 0) { writeBit('0'); } output.close(); } private byte getByte() { int sum = 0; for (int i = 7, number = 1; i >= 0; i--, number*= 2) { sum += bits.get(i) * number; } return (byte)sum; } } /** * Get Huffman codes for the characters This method is called once after a * Huffman tree is built */ public static String[] getCode(Tree.Node root) { if (root == null) return null; String[] codes = new String[2 * 128]; assignCode(root, codes); return codes; } /* Recursively get codes to the leaf node */ private static void assignCode(Tree.Node root, String[] codes) { if (root.left != null) { root.left.code = root.code + "0"; assignCode(root.left, codes); root.right.code = root.code + "1"; assignCode(root.right, codes); } else { codes[(int) root.element] = root.code; } } /** Get a Huffman tree from the codes */ public static Tree getHuffmanTree(int[] counts) { // Create a heap to hold trees Heap<Tree> heap = new Heap<Tree>(); // Defined in Listing 24.10 for (int i = 0; i < counts.length; i++) { if (counts[i] > 0) heap.add(new Tree(counts[i], (char) i)); // A leaf node tree } while (heap.getSize() > 1) { Tree t1 = heap.remove(); // Remove the smallest weight tree Tree t2 = heap.remove(); // Remove the next smallest weight heap.add(new Tree(t1, t2)); // Combine two trees } return heap.remove(); // The final tree } /** Get the frequency of the characters */ public static int[] getCharacterFrequency(String text) { int[] counts = new int[256]; // 256 ASCII characters for (int i = 0; i < text.length(); i++) counts[(int) text.charAt(i)]++; // Count the character in text return counts; } /** Define a Huffman coding tree */ public static class Tree implements Comparable<Tree> { Node root; // The root of the tree /** Create a tree with two subtrees */ public Tree(Tree t1, Tree t2) { root = new Node(); root.left = t1.root; root.right = t2.root; root.weight = t1.root.weight + t2.root.weight; } /** Create a tree containing a leaf node */ public Tree(int weight, char element) { root = new Node(weight, element); } @Override /** Compare trees based on their weights */ public int compareTo(Tree t) { if (root.weight < t.root.weight) // Purposely reverse the order return 1; else if (root.weight == t.root.weight) return 0; else return -1; } public class Node { char element; // Stores the character for a leaf node int weight; // weight of the subtree rooted at this node Node left; // Reference to the left subtree Node right; // Reference to the right subtree String code = ""; // The code of this node from the root /** Create an empty node */ public Node() { } /** Create a node with the specified weight and character */ public Node(int weight, char element) { this.weight = weight; this.element = element; } } } static class Heap<E extends Comparable<E>> { private java.util.ArrayList<E> list = new java.util.ArrayList<E>(); /** Create a default heap */ public Heap() { } /** Create a heap from an array of objects */ public Heap(E[] objects) { for (int i = 0; i < objects.length; i++) add(objects[i]); } /** Add a new object into the heap */ public void add(E newObject) { list.add(newObject); // Append to the heap int currentIndex = list.size() - 1; // The index of the last node while (currentIndex > 0) { int parentIndex = (currentIndex - 1) / 2; // Swap if the current object is greater than its parent if (list.get(currentIndex).compareTo(list.get(parentIndex)) > 0) { E temp = list.get(currentIndex); list.set(currentIndex, list.get(parentIndex)); list.set(parentIndex, temp); } else break; // the tree is a heap now currentIndex = parentIndex; } } /** Remove the root from the heap */ public E remove() { if (list.size() == 0) return null; E removedObject = list.get(0); list.set(0, list.get(list.size() - 1)); list.remove(list.size() - 1); int currentIndex = 0; while (currentIndex < list.size()) { int leftChildIndex = 2 * currentIndex + 1; int rightChildIndex = 2 * currentIndex + 2; // Find the maximum between two children if (leftChildIndex >= list.size()) break; // The tree is a heap int maxIndex = leftChildIndex; if (rightChildIndex < list.size()) { if (list.get(maxIndex).compareTo(list.get(rightChildIndex)) < 0) { maxIndex = rightChildIndex; } } // Swap if the current node is less than the maximum if (list.get(currentIndex).compareTo(list.get(maxIndex)) < 0) { E temp = list.get(maxIndex); list.set(maxIndex, list.get(currentIndex)); list.set(currentIndex, temp); currentIndex = maxIndex; } else break; // The tree is a heap } return removedObject; } /** Get the number of nodes in the tree */ public int getSize() { return list.size(); } } }
No comments :
Post a Comment