0

I'm trying to compress a Base64 String using the java.util.zip.GZIPInputStream and Deflater clases. My problem is that after compression the size is not less from both cases. For the first case with the GZIPInputStream the size is bigger, and in the second case with the Deflater class the size is almost the same.

The output of my code is:

Original String Size: 8799
CompressedGZip String Size: 8828
UncompressedGZip String Size: 8799
Original_String_Length=8799
Compressed_String_Length Deflater=8812, Compression_Ratio=-0.147%
Decompressed_String_Length Deflater=8799 == Original_String_Length (8799)
Original_String == Decompressed_String=True

As you can see in both cases the compressed string is not less. I need to compress the input base64 String because in some cases is too long. Is there any way to achieve this?

This is my code:

       private static String compressFileGZip(String data) {
        try {

            // Create an output stream, and a gzip stream to wrap over.
            ByteArrayOutputStream bos = new ByteArrayOutputStream(data.length());
            GZIPOutputStream gzip = new GZIPOutputStream(bos);

            // Compress the input string
            gzip.write(data.getBytes());
            gzip.close();
            byte[] compressed = bos.toByteArray();
            bos.close();

            // Convert to base64
            compressed = Base64.getEncoder().encode(compressed);

            // return the newly created string
            return new String(compressed);
        } catch(IOException e) {

            return null;
        }
    }

    private static String decompressFileGZip(String compressedText) throws IOException {
        ByteArrayOutputStream stream = new ByteArrayOutputStream();
        // get the bytes for the compressed string
        byte[] compressed = compressedText.getBytes("UTF8");

        // convert the bytes from base64 to normal string
        Base64.Decoder d = Base64.getDecoder();
        compressed = d.decode(compressed);

        // decode.
        final int BUFFER_SIZE = 32;

        ByteArrayInputStream is = new ByteArrayInputStream(compressed);

        GZIPInputStream gis = new GZIPInputStream(is, BUFFER_SIZE);

        StringBuilder string = new StringBuilder();

        byte[] data = new byte[BUFFER_SIZE];

        int bytesRead;

        while ((bytesRead = gis.read(data)) != -1)
        {
            string.append(new String(data, 0, bytesRead));
        }
        gis.close();
        is.close();
        return string.toString();
    }

     public static void main(String args[]) {
        String input = "";
        String compressedGZip = compressFileGZip(input);
        String compressedDeflater = null;
        String uncompressedGZip = null;
        String decompressed = null;
        try {
            compressedDeflater = compress(input);
            uncompressedGZip = decompressFileGZip(compressedGZip);
            decompressed = decompress(decodeBase64(compressedDeflater));
        } catch (IOException e) {
            e.printStackTrace();
        } catch (Exception e) {
            e.printStackTrace();
        }
        System.out.println("Original String Size: " + input.length());
        System.out.println("CompressedGZip String Size: " + compressedGZip.length());
        System.out.println("UncompressedGZip String Size: " + uncompressedGZip.length());

        Integer savedLength = input.length() - compressedDeflater.length();
        Double saveRatio = (new Double(savedLength) * 100) / input.length();
        String ratioString = saveRatio.toString() + "00000000";
        ratioString = ratioString.substring(0, ratioString.indexOf(".") + 4);
        println("Original_String_Length=" + input.length());
        println("Compressed_String_Length Deflater=" + compressedDeflater.length() + ", Compression_Ratio=" + ratioString + "%");
        println("Decompressed_String_Length Deflater=" + decompressed.length() + " == Original_String_Length (" + input.length() + ")");
        println("Original_String == Decompressed_String=" + (input.equals(decompressed) ? "True" : "False"));
        // end
    }


    public static String compress(String str) throws Exception {
        return compress(str.getBytes("UTF-8"));
    }

    public static String compress(byte[] bytes) throws Exception {
        Deflater deflater = new Deflater();
        deflater.setInput(bytes);
        deflater.finish();
        //deflater.deflate(bytes, 2, bytes.length);
        ByteArrayOutputStream bos = new ByteArrayOutputStream(bytes.length);
        byte[] buffer = new byte[1024];
        while(!deflater.finished()) {
            int count = deflater.deflate(buffer);
            bos.write(buffer, 0, count);
        }
        bos.close();
        byte[] output = bos.toByteArray();
        return encodeBase64(output);
    }

    public static String decompress(byte[] bytes) throws Exception {
        Inflater inflater = new Inflater();
        inflater.setInput(bytes);
        ByteArrayOutputStream bos = new ByteArrayOutputStream(bytes.length);
        byte[] buffer = new byte[1024];
        while (!inflater.finished()) {
            int count = inflater.inflate(buffer);
            bos.write(buffer, 0, count);
        }
        bos.close();
        byte[] output = bos.toByteArray();
        return new String(output);
    }

    public static String encodeBase64(byte[] bytes) throws Exception {
        BASE64Encoder base64Encoder = new BASE64Encoder();
        return base64Encoder.encodeBuffer(bytes).replace("\r\n", "").replace("\n", "");
    }

    public static byte[] decodeBase64(String str) throws Exception {
        BASE64Decoder base64Decoder = new BASE64Decoder();
        return base64Decoder.decodeBuffer(str);
    }

    public static void println(Object o) {
        System.out.println("" + o);
    }
rasilvap
  • 1,771
  • 3
  • 31
  • 70
  • 3
    You might want to read this [`answer`](https://stackoverflow.com/a/38126771) and reconsider your approach. You also can set the compression level on the Deflater, but that won't make a difference for that kind of data. – second Aug 31 '19 at 23:56
  • If you're able to transmit arbitrary byte data, why are you encoding in Base64 in the first place? – chrylis -cautiouslyoptimistic- Sep 01 '19 at 00:55
  • I am getting the image as a Base64 String and I have to store this value in the database, I would like to know if it is possible to compress this long String in a shorter text, so that I can't apply the strategy of compress first and encode second, if it is not possible what strategy can I apply? – rasilvap Sep 01 '19 at 02:51
  • 2
    @rasilvap The [answer linked to by second](https://stackoverflow.com/questions/57742052/compressing-base64-string-is-not-of-less-size#comment101923538_57742052) shows that Base64 always compresses badly, because the encoding obfuscates compressionable patterns. So to compress the data, do it before the Base64 encoding. Of course, most *image* formats are already compressed, so there is nothing you can do. It is already as compressed as it's going to get. – Andreas Sep 01 '19 at 03:01

0 Answers0