source: josm/trunk/src/org/tukaani/xz/XZOutputStream.java@ 15851

Last change on this file since 15851 was 13350, checked in by stoecker, 7 years ago

see #15816 - add XZ support

File size: 21.6 KB
Line 
1/*
2 * XZOutputStream
3 *
4 * Author: Lasse Collin <lasse.collin@tukaani.org>
5 *
6 * This file has been put into the public domain.
7 * You can do whatever you want with this file.
8 */
9
10package org.tukaani.xz;
11
12import java.io.OutputStream;
13import java.io.IOException;
14import org.tukaani.xz.common.EncoderUtil;
15import org.tukaani.xz.common.StreamFlags;
16import org.tukaani.xz.check.Check;
17import org.tukaani.xz.index.IndexEncoder;
18
19/**
20 * Compresses into the .xz file format.
21 *
22 * <h4>Examples</h4>
23 * <p>
24 * Getting an output stream to compress with LZMA2 using the default
25 * settings and the default integrity check type (CRC64):
26 * <p><blockquote><pre>
27 * FileOutputStream outfile = new FileOutputStream("foo.xz");
28 * XZOutputStream outxz = new XZOutputStream(outfile, new LZMA2Options());
29 * </pre></blockquote>
30 * <p>
31 * Using the preset level <code>8</code> for LZMA2 (the default
32 * is <code>6</code>) and SHA-256 instead of CRC64 for integrity checking:
33 * <p><blockquote><pre>
34 * XZOutputStream outxz = new XZOutputStream(outfile, new LZMA2Options(8),
35 * XZ.CHECK_SHA256);
36 * </pre></blockquote>
37 * <p>
38 * Using the x86 BCJ filter together with LZMA2 to compress x86 executables
39 * and printing the memory usage information before creating the
40 * XZOutputStream:
41 * <p><blockquote><pre>
42 * X86Options x86 = new X86Options();
43 * LZMA2Options lzma2 = new LZMA2Options();
44 * FilterOptions[] options = { x86, lzma2 };
45 * System.out.println("Encoder memory usage: "
46 * + FilterOptions.getEncoderMemoryUsage(options)
47 * + " KiB");
48 * System.out.println("Decoder memory usage: "
49 * + FilterOptions.getDecoderMemoryUsage(options)
50 * + " KiB");
51 * XZOutputStream outxz = new XZOutputStream(outfile, options);
52 * </pre></blockquote>
53 */
54public class XZOutputStream extends FinishableOutputStream {
55 private final ArrayCache arrayCache;
56
57 private OutputStream out;
58 private final StreamFlags streamFlags = new StreamFlags();
59 private final Check check;
60 private final IndexEncoder index = new IndexEncoder();
61
62 private BlockOutputStream blockEncoder = null;
63 private FilterEncoder[] filters;
64
65 /**
66 * True if the current filter chain supports flushing.
67 * If it doesn't support flushing, <code>flush()</code>
68 * will use <code>endBlock()</code> as a fallback.
69 */
70 private boolean filtersSupportFlushing;
71
72 private IOException exception = null;
73 private boolean finished = false;
74
75 private final byte[] tempBuf = new byte[1];
76
77 /**
78 * Creates a new XZ compressor using one filter and CRC64 as
79 * the integrity check. This constructor is equivalent to passing
80 * a single-member FilterOptions array to
81 * <code>XZOutputStream(OutputStream, FilterOptions[])</code>.
82 *
83 * @param out output stream to which the compressed data
84 * will be written
85 *
86 * @param filterOptions
87 * filter options to use
88 *
89 * @throws UnsupportedOptionsException
90 * invalid filter chain
91 *
92 * @throws IOException may be thrown from <code>out</code>
93 */
94 public XZOutputStream(OutputStream out, FilterOptions filterOptions)
95 throws IOException {
96 this(out, filterOptions, XZ.CHECK_CRC64);
97 }
98
99 /**
100 * Creates a new XZ compressor using one filter and CRC64 as
101 * the integrity check. This constructor is equivalent to passing
102 * a single-member FilterOptions array to
103 * <code>XZOutputStream(OutputStream, FilterOptions[], ArrayCache)</code>.
104 *
105 * @param out output stream to which the compressed data
106 * will be written
107 *
108 * @param filterOptions
109 * filter options to use
110 *
111 * @param arrayCache cache to be used for allocating large arrays
112 *
113 * @throws UnsupportedOptionsException
114 * invalid filter chain
115 *
116 * @throws IOException may be thrown from <code>out</code>
117 *
118 * @since 1.7
119 */
120 public XZOutputStream(OutputStream out, FilterOptions filterOptions,
121 ArrayCache arrayCache)
122 throws IOException {
123 this(out, filterOptions, XZ.CHECK_CRC64, arrayCache);
124 }
125
126 /**
127 * Creates a new XZ compressor using one filter and the specified
128 * integrity check type. This constructor is equivalent to
129 * passing a single-member FilterOptions array to
130 * <code>XZOutputStream(OutputStream, FilterOptions[], int)</code>.
131 *
132 * @param out output stream to which the compressed data
133 * will be written
134 *
135 * @param filterOptions
136 * filter options to use
137 *
138 * @param checkType type of the integrity check,
139 * for example XZ.CHECK_CRC32
140 *
141 * @throws UnsupportedOptionsException
142 * invalid filter chain
143 *
144 * @throws IOException may be thrown from <code>out</code>
145 */
146 public XZOutputStream(OutputStream out, FilterOptions filterOptions,
147 int checkType) throws IOException {
148 this(out, new FilterOptions[] { filterOptions }, checkType);
149 }
150
151 /**
152 * Creates a new XZ compressor using one filter and the specified
153 * integrity check type. This constructor is equivalent to
154 * passing a single-member FilterOptions array to
155 * <code>XZOutputStream(OutputStream, FilterOptions[], int,
156 * ArrayCache)</code>.
157 *
158 * @param out output stream to which the compressed data
159 * will be written
160 *
161 * @param filterOptions
162 * filter options to use
163 *
164 * @param checkType type of the integrity check,
165 * for example XZ.CHECK_CRC32
166 *
167 * @param arrayCache cache to be used for allocating large arrays
168 *
169 * @throws UnsupportedOptionsException
170 * invalid filter chain
171 *
172 * @throws IOException may be thrown from <code>out</code>
173 *
174 * @since 1.7
175 */
176 public XZOutputStream(OutputStream out, FilterOptions filterOptions,
177 int checkType, ArrayCache arrayCache)
178 throws IOException {
179 this(out, new FilterOptions[] { filterOptions }, checkType,
180 arrayCache);
181 }
182
183 /**
184 * Creates a new XZ compressor using 1-4 filters and CRC64 as
185 * the integrity check. This constructor is equivalent
186 * <code>XZOutputStream(out, filterOptions, XZ.CHECK_CRC64)</code>.
187 *
188 * @param out output stream to which the compressed data
189 * will be written
190 *
191 * @param filterOptions
192 * array of filter options to use
193 *
194 * @throws UnsupportedOptionsException
195 * invalid filter chain
196 *
197 * @throws IOException may be thrown from <code>out</code>
198 */
199 public XZOutputStream(OutputStream out, FilterOptions[] filterOptions)
200 throws IOException {
201 this(out, filterOptions, XZ.CHECK_CRC64);
202 }
203
204 /**
205 * Creates a new XZ compressor using 1-4 filters and CRC64 as
206 * the integrity check. This constructor is equivalent
207 * <code>XZOutputStream(out, filterOptions, XZ.CHECK_CRC64,
208 * arrayCache)</code>.
209 *
210 * @param out output stream to which the compressed data
211 * will be written
212 *
213 * @param filterOptions
214 * array of filter options to use
215 *
216 * @param arrayCache cache to be used for allocating large arrays
217 *
218 * @throws UnsupportedOptionsException
219 * invalid filter chain
220 *
221 * @throws IOException may be thrown from <code>out</code>
222 *
223 * @since 1.7
224 */
225 public XZOutputStream(OutputStream out, FilterOptions[] filterOptions,
226 ArrayCache arrayCache)
227 throws IOException {
228 this(out, filterOptions, XZ.CHECK_CRC64, arrayCache);
229 }
230
231 /**
232 * Creates a new XZ compressor using 1-4 filters and the specified
233 * integrity check type.
234 *
235 * @param out output stream to which the compressed data
236 * will be written
237 *
238 * @param filterOptions
239 * array of filter options to use
240 *
241 * @param checkType type of the integrity check,
242 * for example XZ.CHECK_CRC32
243 *
244 * @throws UnsupportedOptionsException
245 * invalid filter chain
246 *
247 * @throws IOException may be thrown from <code>out</code>
248 */
249 public XZOutputStream(OutputStream out, FilterOptions[] filterOptions,
250 int checkType) throws IOException {
251 this(out, filterOptions, checkType, ArrayCache.getDefaultCache());
252 }
253
254 /**
255 * Creates a new XZ compressor using 1-4 filters and the specified
256 * integrity check type.
257 *
258 * @param out output stream to which the compressed data
259 * will be written
260 *
261 * @param filterOptions
262 * array of filter options to use
263 *
264 * @param checkType type of the integrity check,
265 * for example XZ.CHECK_CRC32
266 *
267 * @param arrayCache cache to be used for allocating large arrays
268 *
269 * @throws UnsupportedOptionsException
270 * invalid filter chain
271 *
272 * @throws IOException may be thrown from <code>out</code>
273 *
274 * @since 1.7
275 */
276 public XZOutputStream(OutputStream out, FilterOptions[] filterOptions,
277 int checkType, ArrayCache arrayCache)
278 throws IOException {
279 this.arrayCache = arrayCache;
280 this.out = out;
281 updateFilters(filterOptions);
282
283 streamFlags.checkType = checkType;
284 check = Check.getInstance(checkType);
285
286 encodeStreamHeader();
287 }
288
289 /**
290 * Updates the filter chain with a single filter.
291 * This is equivalent to passing a single-member FilterOptions array
292 * to <code>updateFilters(FilterOptions[])</code>.
293 *
294 * @param filterOptions
295 * new filter to use
296 *
297 * @throws UnsupportedOptionsException
298 * unsupported filter chain, or trying to change
299 * the filter chain in the middle of a Block
300 */
301 public void updateFilters(FilterOptions filterOptions)
302 throws XZIOException {
303 FilterOptions[] opts = new FilterOptions[1];
304 opts[0] = filterOptions;
305 updateFilters(opts);
306 }
307
308 /**
309 * Updates the filter chain with 1-4 filters.
310 * <p>
311 * Currently this cannot be used to update e.g. LZMA2 options in the
312 * middle of a XZ Block. Use <code>endBlock()</code> to finish the
313 * current XZ Block before calling this function. The new filter chain
314 * will then be used for the next XZ Block.
315 *
316 * @param filterOptions
317 * new filter chain to use
318 *
319 * @throws UnsupportedOptionsException
320 * unsupported filter chain, or trying to change
321 * the filter chain in the middle of a Block
322 */
323 public void updateFilters(FilterOptions[] filterOptions)
324 throws XZIOException {
325 if (blockEncoder != null)
326 throw new UnsupportedOptionsException("Changing filter options "
327 + "in the middle of a XZ Block not implemented");
328
329 if (filterOptions.length < 1 || filterOptions.length > 4)
330 throw new UnsupportedOptionsException(
331 "XZ filter chain must be 1-4 filters");
332
333 filtersSupportFlushing = true;
334 FilterEncoder[] newFilters = new FilterEncoder[filterOptions.length];
335 for (int i = 0; i < filterOptions.length; ++i) {
336 newFilters[i] = filterOptions[i].getFilterEncoder();
337 filtersSupportFlushing &= newFilters[i].supportsFlushing();
338 }
339
340 RawCoder.validate(newFilters);
341 filters = newFilters;
342 }
343
344 /**
345 * Writes one byte to be compressed.
346 *
347 * @throws XZIOException
348 * XZ Stream has grown too big
349 *
350 * @throws XZIOException
351 * <code>finish()</code> or <code>close()</code>
352 * was already called
353 *
354 * @throws IOException may be thrown by the underlying output stream
355 */
356 public void write(int b) throws IOException {
357 tempBuf[0] = (byte)b;
358 write(tempBuf, 0, 1);
359 }
360
361 /**
362 * Writes an array of bytes to be compressed.
363 * The compressors tend to do internal buffering and thus the written
364 * data won't be readable from the compressed output immediately.
365 * Use <code>flush()</code> to force everything written so far to
366 * be written to the underlaying output stream, but be aware that
367 * flushing reduces compression ratio.
368 *
369 * @param buf buffer of bytes to be written
370 * @param off start offset in <code>buf</code>
371 * @param len number of bytes to write
372 *
373 * @throws XZIOException
374 * XZ Stream has grown too big: total file size
375 * about 8&nbsp;EiB or the Index field exceeds
376 * 16&nbsp;GiB; you shouldn't reach these sizes
377 * in practice
378 *
379 * @throws XZIOException
380 * <code>finish()</code> or <code>close()</code>
381 * was already called and len &gt; 0
382 *
383 * @throws IOException may be thrown by the underlying output stream
384 */
385 public void write(byte[] buf, int off, int len) throws IOException {
386 if (off < 0 || len < 0 || off + len < 0 || off + len > buf.length)
387 throw new IndexOutOfBoundsException();
388
389 if (exception != null)
390 throw exception;
391
392 if (finished)
393 throw new XZIOException("Stream finished or closed");
394
395 try {
396 if (blockEncoder == null)
397 blockEncoder = new BlockOutputStream(out, filters, check,
398 arrayCache);
399
400 blockEncoder.write(buf, off, len);
401 } catch (IOException e) {
402 exception = e;
403 throw e;
404 }
405 }
406
407 /**
408 * Finishes the current XZ Block (but not the whole XZ Stream).
409 * This doesn't flush the stream so it's possible that not all data will
410 * be decompressible from the output stream when this function returns.
411 * Call also <code>flush()</code> if flushing is wanted in addition to
412 * finishing the current XZ Block.
413 * <p>
414 * If there is no unfinished Block open, this function will do nothing.
415 * (No empty XZ Block will be created.)
416 * <p>
417 * This function can be useful, for example, to create
418 * random-accessible .xz files.
419 * <p>
420 * Starting a new XZ Block means that the encoder state is reset.
421 * Doing this very often will increase the size of the compressed
422 * file a lot (more than plain <code>flush()</code> would do).
423 *
424 * @throws XZIOException
425 * XZ Stream has grown too big
426 *
427 * @throws XZIOException
428 * stream finished or closed
429 *
430 * @throws IOException may be thrown by the underlying output stream
431 */
432 public void endBlock() throws IOException {
433 if (exception != null)
434 throw exception;
435
436 if (finished)
437 throw new XZIOException("Stream finished or closed");
438
439 // NOTE: Once there is threading with multiple Blocks, it's possible
440 // that this function will be more like a barrier that returns
441 // before the last Block has been finished.
442 if (blockEncoder != null) {
443 try {
444 blockEncoder.finish();
445 index.add(blockEncoder.getUnpaddedSize(),
446 blockEncoder.getUncompressedSize());
447 blockEncoder = null;
448 } catch (IOException e) {
449 exception = e;
450 throw e;
451 }
452 }
453 }
454
455 /**
456 * Flushes the encoder and calls <code>out.flush()</code>.
457 * All buffered pending data will then be decompressible from
458 * the output stream.
459 * <p>
460 * Calling this function very often may increase the compressed
461 * file size a lot. The filter chain options may affect the size
462 * increase too. For example, with LZMA2 the HC4 match finder has
463 * smaller penalty with flushing than BT4.
464 * <p>
465 * Some filters don't support flushing. If the filter chain has
466 * such a filter, <code>flush()</code> will call <code>endBlock()</code>
467 * before flushing.
468 *
469 * @throws XZIOException
470 * XZ Stream has grown too big
471 *
472 * @throws XZIOException
473 * stream finished or closed
474 *
475 * @throws IOException may be thrown by the underlying output stream
476 */
477 public void flush() throws IOException {
478 if (exception != null)
479 throw exception;
480
481 if (finished)
482 throw new XZIOException("Stream finished or closed");
483
484 try {
485 if (blockEncoder != null) {
486 if (filtersSupportFlushing) {
487 // This will eventually call out.flush() so
488 // no need to do it here again.
489 blockEncoder.flush();
490 } else {
491 endBlock();
492 out.flush();
493 }
494 } else {
495 out.flush();
496 }
497 } catch (IOException e) {
498 exception = e;
499 throw e;
500 }
501 }
502
503 /**
504 * Finishes compression without closing the underlying stream.
505 * No more data can be written to this stream after finishing
506 * (calling <code>write</code> with an empty buffer is OK).
507 * <p>
508 * Repeated calls to <code>finish()</code> do nothing unless
509 * an exception was thrown by this stream earlier. In that case
510 * the same exception is thrown again.
511 * <p>
512 * After finishing, the stream may be closed normally with
513 * <code>close()</code>. If the stream will be closed anyway, there
514 * usually is no need to call <code>finish()</code> separately.
515 *
516 * @throws XZIOException
517 * XZ Stream has grown too big
518 *
519 * @throws IOException may be thrown by the underlying output stream
520 */
521 public void finish() throws IOException {
522 if (!finished) {
523 // This checks for pending exceptions so we don't need to
524 // worry about it here.
525 endBlock();
526
527 try {
528 index.encode(out);
529 encodeStreamFooter();
530 } catch (IOException e) {
531 exception = e;
532 throw e;
533 }
534
535 // Set it to true only if everything goes fine. Setting it earlier
536 // would cause repeated calls to finish() do nothing instead of
537 // throwing an exception to indicate an earlier error.
538 finished = true;
539 }
540 }
541
542 /**
543 * Finishes compression and closes the underlying stream.
544 * The underlying stream <code>out</code> is closed even if finishing
545 * fails. If both finishing and closing fail, the exception thrown
546 * by <code>finish()</code> is thrown and the exception from the failed
547 * <code>out.close()</code> is lost.
548 *
549 * @throws XZIOException
550 * XZ Stream has grown too big
551 *
552 * @throws IOException may be thrown by the underlying output stream
553 */
554 public void close() throws IOException {
555 if (out != null) {
556 // If finish() throws an exception, it stores the exception to
557 // the variable "exception". So we can ignore the possible
558 // exception here.
559 try {
560 finish();
561 } catch (IOException e) {}
562
563 try {
564 out.close();
565 } catch (IOException e) {
566 // Remember the exception but only if there is no previous
567 // pending exception.
568 if (exception == null)
569 exception = e;
570 }
571
572 out = null;
573 }
574
575 if (exception != null)
576 throw exception;
577 }
578
579 private void encodeStreamFlags(byte[] buf, int off) {
580 buf[off] = 0x00;
581 buf[off + 1] = (byte)streamFlags.checkType;
582 }
583
584 private void encodeStreamHeader() throws IOException {
585 out.write(XZ.HEADER_MAGIC);
586
587 byte[] buf = new byte[2];
588 encodeStreamFlags(buf, 0);
589 out.write(buf);
590
591 EncoderUtil.writeCRC32(out, buf);
592 }
593
594 private void encodeStreamFooter() throws IOException {
595 byte[] buf = new byte[6];
596 long backwardSize = index.getIndexSize() / 4 - 1;
597 for (int i = 0; i < 4; ++i)
598 buf[i] = (byte)(backwardSize >>> (i * 8));
599
600 encodeStreamFlags(buf, 4);
601
602 EncoderUtil.writeCRC32(out, buf);
603 out.write(buf);
604 out.write(XZ.FOOTER_MAGIC);
605 }
606}
Note: See TracBrowser for help on using the repository browser.