Neal Norwitz | b9ef4ae | 2003-01-05 23:19:43 +0000 | [diff] [blame] | 1 | import sys |
| 2 | import os |
| 3 | import shutil |
Brett Cannon | 455ea53 | 2003-06-12 08:01:06 +0000 | [diff] [blame] | 4 | import tempfile |
Neal Norwitz | b9ef4ae | 2003-01-05 23:19:43 +0000 | [diff] [blame] | 5 | |
| 6 | import unittest |
| 7 | import tarfile |
| 8 | |
| 9 | from test import test_support |
| 10 | |
| 11 | # Check for our compression modules. |
| 12 | try: |
| 13 | import gzip |
Neal Norwitz | ae32319 | 2003-04-14 01:18:32 +0000 | [diff] [blame] | 14 | gzip.GzipFile |
| 15 | except (ImportError, AttributeError): |
Neal Norwitz | b9ef4ae | 2003-01-05 23:19:43 +0000 | [diff] [blame] | 16 | gzip = None |
| 17 | try: |
| 18 | import bz2 |
| 19 | except ImportError: |
| 20 | bz2 = None |
| 21 | |
| 22 | def path(path): |
| 23 | return test_support.findfile(path) |
| 24 | |
Brett Cannon | 455ea53 | 2003-06-12 08:01:06 +0000 | [diff] [blame] | 25 | testtar = path("testtar.tar") |
| 26 | tempdir = os.path.join(tempfile.gettempdir(), "testtar" + os.extsep + "dir") |
| 27 | tempname = test_support.TESTFN |
Neal Norwitz | b9ef4ae | 2003-01-05 23:19:43 +0000 | [diff] [blame] | 28 | membercount = 10 |
| 29 | |
| 30 | def tarname(comp=""): |
| 31 | if not comp: |
| 32 | return testtar |
Brett Cannon | 43e559a | 2003-06-12 19:16:58 +0000 | [diff] [blame] | 33 | return os.path.join(tempdir, "%s%s%s" % (testtar, os.extsep, comp)) |
Neal Norwitz | b9ef4ae | 2003-01-05 23:19:43 +0000 | [diff] [blame] | 34 | |
| 35 | def dirname(): |
| 36 | if not os.path.exists(tempdir): |
| 37 | os.mkdir(tempdir) |
| 38 | return tempdir |
| 39 | |
| 40 | def tmpname(): |
| 41 | return tempname |
| 42 | |
| 43 | |
| 44 | class BaseTest(unittest.TestCase): |
| 45 | comp = '' |
| 46 | mode = 'r' |
| 47 | sep = ':' |
| 48 | |
| 49 | def setUp(self): |
| 50 | mode = self.mode + self.sep + self.comp |
| 51 | self.tar = tarfile.open(tarname(self.comp), mode) |
| 52 | |
| 53 | def tearDown(self): |
| 54 | self.tar.close() |
| 55 | |
| 56 | class ReadTest(BaseTest): |
| 57 | |
| 58 | def test(self): |
| 59 | """Test member extraction. |
| 60 | """ |
| 61 | members = 0 |
| 62 | for tarinfo in self.tar: |
| 63 | members += 1 |
| 64 | if not tarinfo.isreg(): |
| 65 | continue |
| 66 | f = self.tar.extractfile(tarinfo) |
| 67 | self.assert_(len(f.read()) == tarinfo.size, |
| 68 | "size read does not match expected size") |
| 69 | f.close() |
| 70 | |
| 71 | self.assert_(members == membercount, |
| 72 | "could not find all members") |
| 73 | |
| 74 | def test_sparse(self): |
| 75 | """Test sparse member extraction. |
| 76 | """ |
| 77 | if self.sep != "|": |
| 78 | f1 = self.tar.extractfile("S-SPARSE") |
Jack Jansen | 149a899 | 2003-03-07 13:27:53 +0000 | [diff] [blame] | 79 | f2 = self.tar.extractfile("S-SPARSE-WITH-NULLS") |
Neal Norwitz | b9ef4ae | 2003-01-05 23:19:43 +0000 | [diff] [blame] | 80 | self.assert_(f1.read() == f2.read(), |
| 81 | "_FileObject failed on sparse file member") |
| 82 | |
| 83 | def test_readlines(self): |
| 84 | """Test readlines() method of _FileObject. |
| 85 | """ |
| 86 | if self.sep != "|": |
Jack Jansen | 149a899 | 2003-03-07 13:27:53 +0000 | [diff] [blame] | 87 | filename = "0-REGTYPE-TEXT" |
Neal Norwitz | b9ef4ae | 2003-01-05 23:19:43 +0000 | [diff] [blame] | 88 | self.tar.extract(filename, dirname()) |
Jack Jansen | c7fcc2d | 2003-03-07 12:50:45 +0000 | [diff] [blame] | 89 | lines1 = file(os.path.join(dirname(), filename), "rU").readlines() |
Neal Norwitz | b9ef4ae | 2003-01-05 23:19:43 +0000 | [diff] [blame] | 90 | lines2 = self.tar.extractfile(filename).readlines() |
| 91 | self.assert_(lines1 == lines2, |
| 92 | "_FileObject.readline() does not work correctly") |
| 93 | |
Martin v. Löwis | df24153 | 2005-03-03 08:17:42 +0000 | [diff] [blame] | 94 | def test_iter(self): |
| 95 | # Test iteration over ExFileObject. |
| 96 | if self.sep != "|": |
| 97 | filename = "0-REGTYPE-TEXT" |
| 98 | self.tar.extract(filename, dirname()) |
| 99 | lines1 = file(os.path.join(dirname(), filename), "rU").readlines() |
| 100 | lines2 = [line for line in self.tar.extractfile(filename)] |
| 101 | self.assert_(lines1 == lines2, |
| 102 | "ExFileObject iteration does not work correctly") |
| 103 | |
Neal Norwitz | b9ef4ae | 2003-01-05 23:19:43 +0000 | [diff] [blame] | 104 | def test_seek(self): |
| 105 | """Test seek() method of _FileObject, incl. random reading. |
| 106 | """ |
| 107 | if self.sep != "|": |
Jack Jansen | 149a899 | 2003-03-07 13:27:53 +0000 | [diff] [blame] | 108 | filename = "0-REGTYPE" |
Neal Norwitz | b9ef4ae | 2003-01-05 23:19:43 +0000 | [diff] [blame] | 109 | self.tar.extract(filename, dirname()) |
| 110 | data = file(os.path.join(dirname(), filename), "rb").read() |
| 111 | |
| 112 | tarinfo = self.tar.getmember(filename) |
| 113 | fobj = self.tar.extractfile(tarinfo) |
| 114 | |
| 115 | text = fobj.read() |
| 116 | fobj.seek(0) |
| 117 | self.assert_(0 == fobj.tell(), |
| 118 | "seek() to file's start failed") |
| 119 | fobj.seek(2048, 0) |
| 120 | self.assert_(2048 == fobj.tell(), |
| 121 | "seek() to absolute position failed") |
| 122 | fobj.seek(-1024, 1) |
| 123 | self.assert_(1024 == fobj.tell(), |
| 124 | "seek() to negative relative position failed") |
| 125 | fobj.seek(1024, 1) |
| 126 | self.assert_(2048 == fobj.tell(), |
| 127 | "seek() to positive relative position failed") |
| 128 | s = fobj.read(10) |
| 129 | self.assert_(s == data[2048:2058], |
| 130 | "read() after seek failed") |
| 131 | fobj.seek(0, 2) |
| 132 | self.assert_(tarinfo.size == fobj.tell(), |
| 133 | "seek() to file's end failed") |
| 134 | self.assert_(fobj.read() == "", |
| 135 | "read() at file's end did not return empty string") |
| 136 | fobj.seek(-tarinfo.size, 2) |
| 137 | self.assert_(0 == fobj.tell(), |
| 138 | "relative seek() to file's start failed") |
| 139 | fobj.seek(512) |
| 140 | s1 = fobj.readlines() |
| 141 | fobj.seek(512) |
| 142 | s2 = fobj.readlines() |
| 143 | self.assert_(s1 == s2, |
| 144 | "readlines() after seek failed") |
| 145 | fobj.close() |
| 146 | |
| 147 | class ReadStreamTest(ReadTest): |
| 148 | sep = "|" |
| 149 | |
| 150 | def test(self): |
| 151 | """Test member extraction, and for StreamError when |
| 152 | seeking backwards. |
| 153 | """ |
| 154 | ReadTest.test(self) |
| 155 | tarinfo = self.tar.getmembers()[0] |
| 156 | f = self.tar.extractfile(tarinfo) |
| 157 | self.assertRaises(tarfile.StreamError, f.read) |
| 158 | |
| 159 | def test_stream(self): |
| 160 | """Compare the normal tar and the stream tar. |
| 161 | """ |
| 162 | stream = self.tar |
| 163 | tar = tarfile.open(tarname(), 'r') |
| 164 | |
| 165 | while 1: |
| 166 | t1 = tar.next() |
| 167 | t2 = stream.next() |
| 168 | if t1 is None: |
| 169 | break |
| 170 | self.assert_(t2 is not None, "stream.next() failed.") |
| 171 | |
| 172 | if t2.islnk() or t2.issym(): |
| 173 | self.assertRaises(tarfile.StreamError, stream.extractfile, t2) |
| 174 | continue |
| 175 | v1 = tar.extractfile(t1) |
| 176 | v2 = stream.extractfile(t2) |
| 177 | if v1 is None: |
| 178 | continue |
| 179 | self.assert_(v2 is not None, "stream.extractfile() failed") |
| 180 | self.assert_(v1.read() == v2.read(), "stream extraction failed") |
| 181 | |
| 182 | stream.close() |
| 183 | |
Martin v. Löwis | 78be7df | 2005-03-05 12:47:42 +0000 | [diff] [blame] | 184 | class ReadAsteriskTest(ReadTest): |
| 185 | |
| 186 | def setUp(self): |
| 187 | mode = self.mode + self.sep + "*" |
| 188 | self.tar = tarfile.open(tarname(self.comp), mode) |
| 189 | |
| 190 | class ReadStreamAsteriskTest(ReadStreamTest): |
| 191 | |
| 192 | def setUp(self): |
| 193 | mode = self.mode + self.sep + "*" |
| 194 | self.tar = tarfile.open(tarname(self.comp), mode) |
| 195 | |
Neal Norwitz | b9ef4ae | 2003-01-05 23:19:43 +0000 | [diff] [blame] | 196 | class WriteTest(BaseTest): |
| 197 | mode = 'w' |
| 198 | |
| 199 | def setUp(self): |
| 200 | mode = self.mode + self.sep + self.comp |
| 201 | self.src = tarfile.open(tarname(self.comp), 'r') |
Martin v. Löwis | c234a52 | 2004-08-22 21:28:33 +0000 | [diff] [blame] | 202 | self.dstname = tmpname() |
| 203 | self.dst = tarfile.open(self.dstname, mode) |
Neal Norwitz | b9ef4ae | 2003-01-05 23:19:43 +0000 | [diff] [blame] | 204 | |
| 205 | def tearDown(self): |
| 206 | self.src.close() |
| 207 | self.dst.close() |
| 208 | |
| 209 | def test_posix(self): |
| 210 | self.dst.posix = 1 |
| 211 | self._test() |
| 212 | |
| 213 | def test_nonposix(self): |
| 214 | self.dst.posix = 0 |
| 215 | self._test() |
| 216 | |
Martin v. Löwis | c234a52 | 2004-08-22 21:28:33 +0000 | [diff] [blame] | 217 | def test_small(self): |
| 218 | self.dst.add(os.path.join(os.path.dirname(__file__),"cfgparser.1")) |
| 219 | self.dst.close() |
| 220 | self.assertNotEqual(os.stat(self.dstname).st_size, 0) |
| 221 | |
Neal Norwitz | b9ef4ae | 2003-01-05 23:19:43 +0000 | [diff] [blame] | 222 | def _test(self): |
| 223 | for tarinfo in self.src: |
| 224 | if not tarinfo.isreg(): |
| 225 | continue |
| 226 | f = self.src.extractfile(tarinfo) |
| 227 | if self.dst.posix and len(tarinfo.name) > tarfile.LENGTH_NAME: |
| 228 | self.assertRaises(ValueError, self.dst.addfile, |
| 229 | tarinfo, f) |
| 230 | else: |
| 231 | self.dst.addfile(tarinfo, f) |
| 232 | |
| 233 | class WriteStreamTest(WriteTest): |
| 234 | sep = '|' |
| 235 | |
Neal Norwitz | 0662f8a | 2004-07-20 21:54:18 +0000 | [diff] [blame] | 236 | class WriteGNULongTest(unittest.TestCase): |
| 237 | """This testcase checks for correct creation of GNU Longname |
| 238 | and Longlink extensions. |
| 239 | |
| 240 | It creates a tarfile and adds empty members with either |
| 241 | long names, long linknames or both and compares the size |
| 242 | of the tarfile with the expected size. |
| 243 | |
| 244 | It checks for SF bug #812325 in TarFile._create_gnulong(). |
| 245 | |
| 246 | While I was writing this testcase, I noticed a second bug |
| 247 | in the same method: |
| 248 | Long{names,links} weren't null-terminated which lead to |
| 249 | bad tarfiles when their length was a multiple of 512. This |
| 250 | is tested as well. |
| 251 | """ |
| 252 | |
| 253 | def setUp(self): |
| 254 | self.tar = tarfile.open(tmpname(), "w") |
| 255 | self.tar.posix = False |
| 256 | |
| 257 | def tearDown(self): |
| 258 | self.tar.close() |
| 259 | |
| 260 | def _length(self, s): |
| 261 | blocks, remainder = divmod(len(s) + 1, 512) |
| 262 | if remainder: |
| 263 | blocks += 1 |
| 264 | return blocks * 512 |
| 265 | |
| 266 | def _calc_size(self, name, link=None): |
| 267 | # initial tar header |
| 268 | count = 512 |
| 269 | |
| 270 | if len(name) > tarfile.LENGTH_NAME: |
| 271 | # gnu longname extended header + longname |
| 272 | count += 512 |
| 273 | count += self._length(name) |
| 274 | |
| 275 | if link is not None and len(link) > tarfile.LENGTH_LINK: |
| 276 | # gnu longlink extended header + longlink |
| 277 | count += 512 |
| 278 | count += self._length(link) |
| 279 | |
| 280 | return count |
| 281 | |
| 282 | def _test(self, name, link=None): |
| 283 | tarinfo = tarfile.TarInfo(name) |
| 284 | if link: |
| 285 | tarinfo.linkname = link |
| 286 | tarinfo.type = tarfile.LNKTYPE |
| 287 | |
| 288 | self.tar.addfile(tarinfo) |
| 289 | |
| 290 | v1 = self._calc_size(name, link) |
| 291 | v2 = self.tar.offset |
| 292 | self.assertEqual(v1, v2, "GNU longname/longlink creation failed") |
| 293 | |
| 294 | def test_longname_1023(self): |
| 295 | self._test(("longnam/" * 127) + "longnam") |
| 296 | |
| 297 | def test_longname_1024(self): |
| 298 | self._test(("longnam/" * 127) + "longname") |
| 299 | |
| 300 | def test_longname_1025(self): |
| 301 | self._test(("longnam/" * 127) + "longname_") |
| 302 | |
| 303 | def test_longlink_1023(self): |
| 304 | self._test("name", ("longlnk/" * 127) + "longlnk") |
| 305 | |
| 306 | def test_longlink_1024(self): |
| 307 | self._test("name", ("longlnk/" * 127) + "longlink") |
| 308 | |
| 309 | def test_longlink_1025(self): |
| 310 | self._test("name", ("longlnk/" * 127) + "longlink_") |
| 311 | |
| 312 | def test_longnamelink_1023(self): |
| 313 | self._test(("longnam/" * 127) + "longnam", |
| 314 | ("longlnk/" * 127) + "longlnk") |
| 315 | |
| 316 | def test_longnamelink_1024(self): |
| 317 | self._test(("longnam/" * 127) + "longname", |
| 318 | ("longlnk/" * 127) + "longlink") |
| 319 | |
| 320 | def test_longnamelink_1025(self): |
| 321 | self._test(("longnam/" * 127) + "longname_", |
| 322 | ("longlnk/" * 127) + "longlink_") |
| 323 | |
Neal Norwitz | a4f651a | 2004-07-20 22:07:44 +0000 | [diff] [blame] | 324 | class ExtractHardlinkTest(BaseTest): |
| 325 | |
| 326 | def test_hardlink(self): |
| 327 | """Test hardlink extraction (bug #857297) |
| 328 | """ |
| 329 | # Prevent errors from being caught |
| 330 | self.tar.errorlevel = 1 |
| 331 | |
| 332 | self.tar.extract("0-REGTYPE", dirname()) |
| 333 | try: |
| 334 | # Extract 1-LNKTYPE which is a hardlink to 0-REGTYPE |
| 335 | self.tar.extract("1-LNKTYPE", dirname()) |
| 336 | except EnvironmentError, e: |
| 337 | import errno |
| 338 | if e.errno == errno.ENOENT: |
| 339 | self.fail("hardlink not extracted properly") |
| 340 | |
| 341 | |
Neal Norwitz | b9ef4ae | 2003-01-05 23:19:43 +0000 | [diff] [blame] | 342 | # Gzip TestCases |
| 343 | class ReadTestGzip(ReadTest): |
| 344 | comp = "gz" |
| 345 | class ReadStreamTestGzip(ReadStreamTest): |
| 346 | comp = "gz" |
| 347 | class WriteTestGzip(WriteTest): |
| 348 | comp = "gz" |
| 349 | class WriteStreamTestGzip(WriteStreamTest): |
| 350 | comp = "gz" |
Martin v. Löwis | 78be7df | 2005-03-05 12:47:42 +0000 | [diff] [blame] | 351 | class ReadAsteriskTestGzip(ReadAsteriskTest): |
| 352 | comp = "gz" |
| 353 | class ReadStreamAsteriskTestGzip(ReadStreamAsteriskTest): |
| 354 | comp = "gz" |
| 355 | |
Neal Norwitz | b9ef4ae | 2003-01-05 23:19:43 +0000 | [diff] [blame] | 356 | |
Andrew M. Kuchling | d4f2552 | 2004-10-20 11:47:01 +0000 | [diff] [blame] | 357 | # Filemode test cases |
| 358 | |
| 359 | class FileModeTest(unittest.TestCase): |
| 360 | def test_modes(self): |
| 361 | self.assertEqual(tarfile.filemode(0755), '-rwxr-xr-x') |
| 362 | self.assertEqual(tarfile.filemode(07111), '---s--s--t') |
| 363 | |
Tim Peters | 8ceefc5 | 2004-10-25 03:19:41 +0000 | [diff] [blame] | 364 | |
Neal Norwitz | b9ef4ae | 2003-01-05 23:19:43 +0000 | [diff] [blame] | 365 | if bz2: |
| 366 | # Bzip2 TestCases |
| 367 | class ReadTestBzip2(ReadTestGzip): |
| 368 | comp = "bz2" |
| 369 | class ReadStreamTestBzip2(ReadStreamTestGzip): |
| 370 | comp = "bz2" |
| 371 | class WriteTestBzip2(WriteTest): |
| 372 | comp = "bz2" |
| 373 | class WriteStreamTestBzip2(WriteStreamTestGzip): |
| 374 | comp = "bz2" |
Martin v. Löwis | 78be7df | 2005-03-05 12:47:42 +0000 | [diff] [blame] | 375 | class ReadAsteriskTestBzip2(ReadAsteriskTest): |
| 376 | comp = "bz2" |
| 377 | class ReadStreamAsteriskTestBzip2(ReadStreamAsteriskTest): |
| 378 | comp = "bz2" |
Neal Norwitz | b9ef4ae | 2003-01-05 23:19:43 +0000 | [diff] [blame] | 379 | |
| 380 | # If importing gzip failed, discard the Gzip TestCases. |
| 381 | if not gzip: |
| 382 | del ReadTestGzip |
| 383 | del ReadStreamTestGzip |
| 384 | del WriteTestGzip |
| 385 | del WriteStreamTestGzip |
| 386 | |
Neal Norwitz | 996acf1 | 2003-02-17 14:51:41 +0000 | [diff] [blame] | 387 | def test_main(): |
Neal Norwitz | b9ef4ae | 2003-01-05 23:19:43 +0000 | [diff] [blame] | 388 | if gzip: |
| 389 | # create testtar.tar.gz |
| 390 | gzip.open(tarname("gz"), "wb").write(file(tarname(), "rb").read()) |
| 391 | if bz2: |
| 392 | # create testtar.tar.bz2 |
| 393 | bz2.BZ2File(tarname("bz2"), "wb").write(file(tarname(), "rb").read()) |
| 394 | |
Walter Dörwald | 21d3a32 | 2003-05-01 17:45:56 +0000 | [diff] [blame] | 395 | tests = [ |
Andrew M. Kuchling | d4f2552 | 2004-10-20 11:47:01 +0000 | [diff] [blame] | 396 | FileModeTest, |
Walter Dörwald | 21d3a32 | 2003-05-01 17:45:56 +0000 | [diff] [blame] | 397 | ReadTest, |
| 398 | ReadStreamTest, |
Martin v. Löwis | 78be7df | 2005-03-05 12:47:42 +0000 | [diff] [blame] | 399 | ReadAsteriskTest, |
| 400 | ReadStreamAsteriskTest, |
Walter Dörwald | 21d3a32 | 2003-05-01 17:45:56 +0000 | [diff] [blame] | 401 | WriteTest, |
Neal Norwitz | 0662f8a | 2004-07-20 21:54:18 +0000 | [diff] [blame] | 402 | WriteStreamTest, |
| 403 | WriteGNULongTest, |
Walter Dörwald | 21d3a32 | 2003-05-01 17:45:56 +0000 | [diff] [blame] | 404 | ] |
| 405 | |
Neal Norwitz | a4f651a | 2004-07-20 22:07:44 +0000 | [diff] [blame] | 406 | if hasattr(os, "link"): |
| 407 | tests.append(ExtractHardlinkTest) |
| 408 | |
Walter Dörwald | 21d3a32 | 2003-05-01 17:45:56 +0000 | [diff] [blame] | 409 | if gzip: |
| 410 | tests.extend([ |
| 411 | ReadTestGzip, ReadStreamTestGzip, |
Martin v. Löwis | 78be7df | 2005-03-05 12:47:42 +0000 | [diff] [blame] | 412 | WriteTestGzip, WriteStreamTestGzip, |
| 413 | ReadAsteriskTestGzip, ReadStreamAsteriskTestGzip |
Walter Dörwald | 21d3a32 | 2003-05-01 17:45:56 +0000 | [diff] [blame] | 414 | ]) |
| 415 | |
| 416 | if bz2: |
| 417 | tests.extend([ |
| 418 | ReadTestBzip2, ReadStreamTestBzip2, |
Martin v. Löwis | 78be7df | 2005-03-05 12:47:42 +0000 | [diff] [blame] | 419 | WriteTestBzip2, WriteStreamTestBzip2, |
| 420 | ReadAsteriskTestBzip2, ReadStreamAsteriskTestBzip2 |
Walter Dörwald | 21d3a32 | 2003-05-01 17:45:56 +0000 | [diff] [blame] | 421 | ]) |
Neal Norwitz | b9ef4ae | 2003-01-05 23:19:43 +0000 | [diff] [blame] | 422 | try: |
Walter Dörwald | 21d3a32 | 2003-05-01 17:45:56 +0000 | [diff] [blame] | 423 | test_support.run_unittest(*tests) |
Neal Norwitz | b9ef4ae | 2003-01-05 23:19:43 +0000 | [diff] [blame] | 424 | finally: |
| 425 | if gzip: |
| 426 | os.remove(tarname("gz")) |
| 427 | if bz2: |
| 428 | os.remove(tarname("bz2")) |
Brett Cannon | 455ea53 | 2003-06-12 08:01:06 +0000 | [diff] [blame] | 429 | if os.path.exists(dirname()): |
| 430 | shutil.rmtree(dirname()) |
| 431 | if os.path.exists(tmpname()): |
| 432 | os.remove(tmpname()) |
Neal Norwitz | b9ef4ae | 2003-01-05 23:19:43 +0000 | [diff] [blame] | 433 | |
Neal Norwitz | 996acf1 | 2003-02-17 14:51:41 +0000 | [diff] [blame] | 434 | if __name__ == "__main__": |
| 435 | test_main() |