Skip to content

Commit 07eaea8

Browse files
eirbjojaikiran
andcommittedNov 14, 2023
8303920: Avoid calling out to python in DataDescriptorSignatureMissing test
Co-authored-by: Jaikiran Pai <jpai@openjdk.org> Reviewed-by: jpai, lancea, iris
1 parent fe0ccdf commit 07eaea8

File tree

1 file changed

+120
-106
lines changed

1 file changed

+120
-106
lines changed
 
Original file line numberDiff line numberDiff line change
@@ -1,5 +1,6 @@
11
/*
22
* Copyright 2012 Google, Inc. All Rights Reserved.
3+
* Copyright (c) 2023, Oracle and/or its affiliates. All rights reserved.
34
* DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
45
*
56
* This code is free software; you can redistribute it and/or modify it
@@ -24,124 +25,137 @@
2425
/**
2526
* @test
2627
* @bug 8056934
27-
* @summary Check ability to read zip files created by python zipfile
28-
* implementation, which fails to write optional (but recommended) data
29-
* descriptor signatures. Repro scenario is a Java -> Python -> Java round trip:
30-
* - ZipOutputStream creates zip file with DEFLATED entries and data
31-
* descriptors with optional signature "PK0x0708".
32-
* - Python reads those entries, preserving the 0x08 flag byte
33-
* - Python outputs those entries with data descriptors lacking the
34-
* optional signature.
35-
* - ZipInputStream cannot handle the missing signature
36-
*
28+
* @summary Verify the ability to read zip files whose local header
29+
* data descriptor is missing the optional signature
30+
* <p>
3731
* No way to adapt the technique in this test to get a ZIP64 zip file
3832
* without data descriptors was found.
39-
*
40-
* @ignore 8303920 This test has brittle dependencies on an external working python.
33+
* @run junit DataDescriptorSignatureMissing
4134
*/
4235

36+
37+
import org.junit.jupiter.api.Test;
38+
4339
import java.io.*;
40+
import java.nio.ByteBuffer;
41+
import java.nio.ByteOrder;
42+
import java.nio.charset.StandardCharsets;
4443
import java.util.zip.*;
4544

46-
public class DataDescriptorSignatureMissing {
47-
void printStream(InputStream is) throws IOException {
48-
Reader r = new InputStreamReader(is);
49-
StringBuilder sb = new StringBuilder();
50-
char[] buf = new char[1024];
51-
int n;
52-
while ((n = r.read(buf)) > 0) {
53-
sb.append(buf, 0, n);
54-
}
55-
System.out.print(sb);
56-
}
45+
import static org.junit.jupiter.api.Assertions.*;
46+
47+
public class DataDescriptorSignatureMissing {
48+
49+
/**
50+
* Verify that ZipInputStream correctly parses a ZIP with a Data Descriptor without
51+
* the recommended but optional signature.
52+
*/
53+
@Test
54+
public void shouldParseSignaturelessDescriptor() throws IOException {
55+
// The ZIP with a signature-less descriptor
56+
byte[] zip = makeZipWithSignaturelessDescriptor();
5757

58-
int entryCount(File zipFile) throws IOException {
59-
try (FileInputStream fis = new FileInputStream(zipFile);
60-
ZipInputStream zis = new ZipInputStream(fis)) {
61-
for (int count = 0;; count++)
62-
if (zis.getNextEntry() == null)
63-
return count;
58+
// ZipInputStream should read the signature-less data descriptor
59+
try (ZipInputStream in = new ZipInputStream(
60+
new ByteArrayInputStream(zip))) {
61+
ZipEntry first = in.getNextEntry();
62+
assertNotNull(first, "Zip file is unexpectedly missing first entry");
63+
assertEquals("first", first.getName());
64+
assertArrayEquals("first".getBytes(StandardCharsets.UTF_8), in.readAllBytes());
65+
66+
ZipEntry second = in.getNextEntry();
67+
assertNotNull(second, "Zip file is unexpectedly missing second entry");
68+
assertEquals("second", second.getName());
69+
assertArrayEquals("second".getBytes(StandardCharsets.UTF_8), in.readAllBytes());
6470
}
71+
6572
}
6673

67-
void test(String[] args) throws Throwable {
68-
if (! new File("/usr/bin/python").canExecute())
69-
return;
70-
71-
// Create a java zip file with DEFLATED entries and data
72-
// descriptors with signatures.
73-
final File in = new File("in.zip");
74-
final File out = new File("out.zip");
75-
final int count = 3;
76-
try (FileOutputStream fos = new FileOutputStream(in);
77-
ZipOutputStream zos = new ZipOutputStream(fos)) {
78-
for (int i = 0; i < count; i++) {
79-
ZipEntry ze = new ZipEntry("hello.python" + i);
80-
ze.setMethod(ZipEntry.DEFLATED);
81-
zos.putNextEntry(ze);
82-
zos.write(new byte[10]);
83-
zos.closeEntry();
84-
}
74+
/**
75+
* The 'Data descriptor' record is used to facilitate ZIP streaming. If the size of an
76+
* entry is unknown at the time the LOC header is written, bit 3 of the General Purpose Bit Flag
77+
* is set, and the File data is immediately followed by the 'Data descriptor' record. This record
78+
* then contains the compressed and uncompressed sizes of the entry and also the CRC value.
79+
*
80+
* The 'Data descriptor' record is usually preceded by the recommended, but optional
81+
* signature value 0x08074b50.
82+
*
83+
* A ZIP entry in streaming mode has the following structure:
84+
*
85+
* ------ Local File Header ------
86+
* 000000 signature 0x04034b50
87+
* 000004 version 20
88+
* 000006 flags 0x0808 # Notice bit 3 is set
89+
* [..] Omitted for brevity
90+
*
91+
* ------ File Data ------
92+
* 000035 data 7 bytes
93+
*
94+
* ------ Data Descriptor ------
95+
* 000042 signature 0x08074b50
96+
* 000046 crc 0x3610a686
97+
* 000050 csize 7
98+
* 000054 size 5
99+
*
100+
* A signature-less data descriptor will look like the following:
101+
*
102+
* ------ Data Descriptor ------
103+
* 000042 crc 0x3610a686
104+
* 000046 csize 7
105+
* 000050 size 5
106+
*
107+
* This method produces a ZIP with two entries, where the first entry
108+
* is made signature-less.
109+
*/
110+
private static byte[] makeZipWithSignaturelessDescriptor() throws IOException {
111+
// Offset of the signed data descriptor
112+
int sigOffset;
113+
114+
ByteArrayOutputStream out = new ByteArrayOutputStream();
115+
try (ZipOutputStream zo = new ZipOutputStream(out)) {
116+
// Write a first entry
117+
zo.putNextEntry(new ZipEntry("first"));
118+
zo.write("first".getBytes(StandardCharsets.UTF_8));
119+
// Force the data descriptor to be written out
120+
zo.closeEntry();
121+
// Signed data descriptor starts 16 bytes before current offset
122+
sigOffset = out.size() - 4 * Integer.BYTES;
123+
// Add a second entry
124+
zo.putNextEntry(new ZipEntry("second"));
125+
zo.write("second".getBytes(StandardCharsets.UTF_8));
85126
}
86127

87-
// Copy the zip file using python's zipfile module
88-
String[] python_program_lines = {
89-
"import os",
90-
"import zipfile",
91-
"input_zip = zipfile.ZipFile('in.zip', mode='r')",
92-
"output_zip = zipfile.ZipFile('out.zip', mode='w')",
93-
"count08 = 0",
94-
"for input_info in input_zip.infolist():",
95-
" output_info = input_info",
96-
" if output_info.flag_bits & 0x08 == 0x08:",
97-
" count08 += 1",
98-
" output_zip.writestr(output_info, input_zip.read(input_info))",
99-
"output_zip.close()",
100-
"if count08 == 0:",
101-
" raise ValueError('Expected to see entries with 0x08 flag_bits set')",
102-
};
103-
StringBuilder python_program_builder = new StringBuilder();
104-
for (String line : python_program_lines)
105-
python_program_builder.append(line).append('\n');
106-
String python_program = python_program_builder.toString();
107-
String[] cmdline = { "/usr/bin/python", "-c", python_program };
108-
ProcessBuilder pb = new ProcessBuilder(cmdline);
109-
pb.redirectErrorStream(true);
110-
Process p = pb.start();
111-
printStream(p.getInputStream());
112-
p.waitFor();
113-
equal(p.exitValue(), 0);
114-
115-
File pythonZipFile = new File("out.zip");
116-
check(pythonZipFile.exists());
117-
118-
equal(entryCount(in),
119-
entryCount(out));
120-
121-
// We expect out to be identical to in, except for the removal of
122-
// the optional data descriptor signatures.
123-
final int SIG_LENGTH = 4; // length of a zip signature - PKxx
124-
equal(in.length(),
125-
out.length() + SIG_LENGTH * count);
126-
127-
in.delete();
128-
out.delete();
129-
}
128+
// The generated ZIP file with a signed data descriptor
129+
byte[] sigZip = out.toByteArray();
130+
131+
// The offset of the CRC immediately following the 4-byte signature
132+
int crcOffset = sigOffset + Integer.BYTES;
133+
134+
// Create a ZIP file with a signature-less data descriptor for the first entry
135+
ByteArrayOutputStream sigLess = new ByteArrayOutputStream();
136+
sigLess.write(sigZip, 0, sigOffset);
137+
// Skip the signature
138+
sigLess.write(sigZip, crcOffset, sigZip.length - crcOffset);
139+
140+
byte[] siglessZip = sigLess.toByteArray();
130141

131-
//--------------------- Infrastructure ---------------------------
132-
volatile int passed = 0, failed = 0;
133-
void pass() {passed++;}
134-
void fail() {failed++; Thread.dumpStack();}
135-
void fail(String msg) {System.err.println(msg); fail();}
136-
void unexpected(Throwable t) {failed++; t.printStackTrace();}
137-
void check(boolean cond) {if (cond) pass(); else fail();}
138-
void equal(Object x, Object y) {
139-
if (x == null ? y == null : x.equals(y)) pass();
140-
else fail(x + " not equal to " + y);}
141-
public static void main(String[] args) throws Throwable {
142-
new DataDescriptorSignatureMissing().instanceMain(args);}
143-
public void instanceMain(String[] args) throws Throwable {
144-
try {test(args);} catch (Throwable t) {unexpected(t);}
145-
System.out.printf("%nPassed = %d, failed = %d%n%n", passed, failed);
146-
if (failed > 0) throw new AssertionError("Some tests failed");}
142+
// Adjust the CEN offset in the END header
143+
ByteBuffer buffer = ByteBuffer.wrap(siglessZip).order(ByteOrder.LITTLE_ENDIAN);
144+
// Reduce cenOffset by 4 bytes
145+
int cenOff = siglessZip.length - ZipFile.ENDHDR + ZipFile.ENDOFF;
146+
int realCenOff = buffer.getInt(cenOff) - Integer.BYTES;
147+
buffer.putInt(cenOff, realCenOff);
148+
149+
// Adjust the LOC offset in the second CEN header
150+
int cen = realCenOff;
151+
// Skip past the first CEN header
152+
int nlen = buffer.getShort(cen + ZipFile.CENNAM);
153+
cen += ZipFile.CENHDR + nlen;
154+
155+
// Reduce LOC offset by 4 bytes
156+
int locOff = cen + ZipFile.CENOFF;
157+
buffer.putInt(locOff, buffer.getInt(locOff) - Integer.BYTES);
158+
159+
return siglessZip;
160+
}
147161
}

0 commit comments

Comments
 (0)
Please sign in to comment.