|
|
|
// gzip.java
|
|
|
|
// -------------------------------------
|
|
|
|
// (C) by Michael Peter Christen; mc@yacy.net
|
|
|
|
// first published on http://www.anomic.de
|
|
|
|
// Frankfurt, Germany, 2004
|
|
|
|
//
|
|
|
|
// $LastChangedDate$
|
|
|
|
// $LastChangedRevision$
|
|
|
|
// $LastChangedBy$
|
|
|
|
//
|
|
|
|
// This program is free software; you can redistribute it and/or modify
|
|
|
|
// it under the terms of the GNU General Public License as published by
|
|
|
|
// the Free Software Foundation; either version 2 of the License, or
|
|
|
|
// (at your option) any later version.
|
|
|
|
//
|
|
|
|
// This program is distributed in the hope that it will be useful,
|
|
|
|
// but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
|
|
// MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
|
|
// GNU General Public License for more details.
|
|
|
|
//
|
|
|
|
// You should have received a copy of the GNU General Public License
|
|
|
|
// along with this program; if not, write to the Free Software
|
|
|
|
// Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
|
|
|
|
|
|
|
|
package net.yacy.utils;
|
|
|
|
|
|
|
|
import java.io.BufferedInputStream;
|
|
|
|
import java.io.BufferedOutputStream;
|
|
|
|
import java.io.ByteArrayInputStream;
|
|
|
|
import java.io.ByteArrayOutputStream;
|
|
|
|
import java.io.File;
|
|
|
|
import java.io.FileInputStream;
|
|
|
|
import java.io.FileNotFoundException;
|
|
|
|
import java.io.FileOutputStream;
|
|
|
|
import java.io.IOException;
|
|
|
|
import java.io.InputStream;
|
|
|
|
import java.io.OutputStream;
|
|
|
|
import java.util.zip.GZIPInputStream;
|
|
|
|
import java.util.zip.GZIPOutputStream;
|
|
|
|
|
|
|
|
import net.yacy.cora.document.encoding.UTF8;
|
|
|
|
import net.yacy.cora.util.ConcurrentLog;
|
|
|
|
|
|
|
|
|
|
|
|
public class gzip {
|
|
|
|
|
|
|
|
private static ConcurrentLog logger = new ConcurrentLog("GZIP");
|
|
|
|
|
|
|
|
public static void gzipFile(final String inFile, final String outFile) {
|
|
|
|
try {
|
|
|
|
final InputStream fin = new BufferedInputStream(new FileInputStream(inFile));
|
|
|
|
final OutputStream fout = new GZIPOutputStream(new BufferedOutputStream(new FileOutputStream(outFile), 1024));
|
|
|
|
copy(fout, fin, 1024);
|
|
|
|
fin.close();
|
|
|
|
fout.close();
|
|
|
|
} catch (final FileNotFoundException e) {
|
|
|
|
logger.warn("ERROR: file '" + inFile + "' not found", e);
|
|
|
|
} catch (final IOException e) {
|
|
|
|
logger.warn("ERROR: IO trouble ",e);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
public static File gunzipFile(final File in) {
|
|
|
|
assert in.getName().endsWith(".gz");
|
|
|
|
final String on = in.getName().substring(0, in.getName().length() - 3);
|
|
|
|
final File outf = new File(in.getParent(), on);
|
|
|
|
gunzipFile(in, outf);
|
|
|
|
return outf;
|
|
|
|
}
|
|
|
|
|
|
|
|
public static void gunzipFile(final File inFile, final File outFile) {
|
|
|
|
try {
|
|
|
|
final InputStream fin = new GZIPInputStream(new BufferedInputStream(new FileInputStream(inFile)));
|
|
|
|
final OutputStream fout = new BufferedOutputStream(new FileOutputStream(outFile));
|
|
|
|
copy(fout, fin, 1024);
|
|
|
|
fin.close();
|
|
|
|
fout.close();
|
|
|
|
} catch (final FileNotFoundException e) {
|
|
|
|
logger.warn("ERROR: file '" + inFile + "' not found", e);
|
|
|
|
} catch (final IOException e) {
|
|
|
|
logger.warn("ERROR: IO trouble ",e);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
public static byte[] gzipString(final String in) {
|
|
|
|
try {
|
|
|
|
final InputStream fin = new ByteArrayInputStream(in.getBytes("UTF8"));
|
|
|
|
final int buffersize = Math.min(1024, in.length());
|
|
|
|
final ByteArrayOutputStream baos = new ByteArrayOutputStream(buffersize);
|
|
|
|
final OutputStream fout = new GZIPOutputStream(baos, Math.max(buffersize, 512));
|
|
|
|
copy(fout, fin, 1024);
|
|
|
|
fin.close();
|
|
|
|
fout.close();
|
|
|
|
return baos.toByteArray();
|
|
|
|
} catch (final IOException e) {
|
|
|
|
logger.warn("ERROR: IO trouble ",e);
|
|
|
|
return null;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
public static String gunzipString(final byte[] in) throws IOException {
|
|
|
|
final InputStream fin = new GZIPInputStream(new ByteArrayInputStream(in));
|
|
|
|
final ByteArrayOutputStream fout = new ByteArrayOutputStream(in.length / 3);
|
|
|
|
copy(fout, fin, 1024);
|
|
|
|
fin.close();
|
|
|
|
fout.close();
|
|
|
|
return UTF8.String(fout.toByteArray());
|
|
|
|
}
|
|
|
|
|
|
|
|
private static void copy(final OutputStream out, final InputStream in, final int bufferSize) throws IOException {
|
|
|
|
final InputStream bIn = new BufferedInputStream(in, bufferSize);
|
|
|
|
final OutputStream bOut = new BufferedOutputStream(out, bufferSize);
|
|
|
|
final byte[] buf = new byte[bufferSize];
|
|
|
|
int n;
|
|
|
|
while ((n = bIn.read(buf)) > 0) bOut.write(buf, 0, n);
|
|
|
|
bIn.close();
|
|
|
|
bOut.close();
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
// some static helper methods
|
|
|
|
public static void saveGzip(final File f, final byte[] content) throws IOException {
|
|
|
|
java.util.zip.GZIPOutputStream gzipout = null;
|
|
|
|
try {
|
|
|
|
f.getParentFile().mkdirs();
|
|
|
|
gzipout = new java.util.zip.GZIPOutputStream(new FileOutputStream(f));
|
|
|
|
gzipout.write(content, 0, content.length);
|
|
|
|
} finally {
|
|
|
|
if (gzipout!=null)try{gzipout.close();}catch(final Exception e){}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
public static byte[] loadGzip(final File f) throws IOException {
|
|
|
|
java.util.zip.GZIPInputStream gzipin = null;
|
|
|
|
try {
|
|
|
|
gzipin = new java.util.zip.GZIPInputStream(new FileInputStream(f));
|
|
|
|
byte[] result = new byte[1024];
|
|
|
|
final byte[] buffer = new byte[512];
|
|
|
|
byte[] b;
|
|
|
|
int len = 0;
|
|
|
|
int last;
|
|
|
|
while ((last = gzipin.read(buffer, 0, buffer.length)) > 0) {
|
|
|
|
// assert the buffer to the result
|
|
|
|
while (result.length - len < last) {
|
|
|
|
// the result array is too small, increase space
|
|
|
|
b = new byte[result.length * 2];
|
|
|
|
System.arraycopy(result, 0, b, 0, len);
|
|
|
|
result = b; b = null;
|
|
|
|
}
|
|
|
|
// copy the last read
|
|
|
|
System.arraycopy(buffer, 0, result, len, last);
|
|
|
|
len += last;
|
|
|
|
}
|
|
|
|
gzipin.close();
|
|
|
|
// finished with reading. now cut the result to the right size
|
|
|
|
b = new byte[len];
|
|
|
|
System.arraycopy(result, 0, b, 0, len);
|
|
|
|
return b;
|
|
|
|
} finally {
|
|
|
|
if (gzipin != null) try{gzipin.close();}catch(final Exception e){}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
private static void help() {
|
|
|
|
System.out.println("AnomicGzip (2004) by Michael Christen");
|
|
|
|
System.out.println("usage: gzip [-u] <file> [<target-file>]");
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
public static void main(final String[] s) {
|
|
|
|
if (s.length == 0) {
|
|
|
|
help();
|
|
|
|
System.exit(0);
|
|
|
|
}
|
|
|
|
if ((s[0].equals("-h")) || (s[0].equals("-help"))) {
|
|
|
|
help();
|
|
|
|
System.exit(0);
|
|
|
|
}
|
|
|
|
if (s[0].equals("-u")) {
|
|
|
|
if ((s.length < 2) || (s.length > 3)) {help(); System.exit(-1);}
|
|
|
|
String target;
|
|
|
|
if (s.length == 2) {
|
|
|
|
if (s[1].endsWith(".gz"))
|
|
|
|
target = s[1].substring(0, s[1].length() - 3);
|
|
|
|
else
|
|
|
|
target = s[1] + ".gunzip";
|
|
|
|
} else {
|
|
|
|
target = s[2];
|
|
|
|
}
|
|
|
|
gzip.gunzipFile(new File(s[1]), new File(target));
|
|
|
|
System.exit(0);
|
|
|
|
}
|
|
|
|
if ((s.length < 1) || (s.length > 2)) {help(); System.exit(-1);}
|
|
|
|
String target;
|
|
|
|
if (s.length == 1) target = s[0] + ".gz"; else target = s[1];
|
|
|
|
gzip.gzipFile((s[0]), target);
|
|
|
|
System.exit(0);
|
|
|
|
}
|
|
|
|
|
|
|
|
}
|