Allow comment characters (#) to be escaped:
[python/dscho.git] / Lib / chunk.py
blob231a59caff0423d9325385e66818f711b578d1ff
1 """Simple class to read IFF chunks.
3 An IFF chunk (used in formats such as AIFF, TIFF, RMFF (RealMedia File
4 Format)) has the following structure:
6 +----------------+
7 | ID (4 bytes) |
8 +----------------+
9 | size (4 bytes) |
10 +----------------+
11 | data |
12 | ... |
13 +----------------+
15 The ID is a 4-byte string which identifies the type of chunk.
17 The size field (a 32-bit value, encoded using big-endian byte order)
18 gives the size of the whole chunk, including the 8-byte header.
20 Usually an IFF-type file consists of one or more chunks. The proposed
21 usage of the Chunk class defined here is to instantiate an instance at
22 the start of each chunk and read from the instance until it reaches
23 the end, after which a new instance can be instantiated. At the end
24 of the file, creating a new instance will fail with an EOFError
25 exception.
27 Usage:
28 while 1:
29 try:
30 chunk = Chunk(file)
31 except EOFError:
32 break
33 chunktype = chunk.getname()
34 while 1:
35 data = chunk.read(nbytes)
36 if not data:
37 break
38 # do something with data
40 The interface is file-like. The implemented methods are:
41 read, close, seek, tell, isatty.
42 Extra methods are: skip() (called by close, skips to the end of the chunk),
43 getname() (returns the name (ID) of the chunk)
45 The __init__ method has one required argument, a file-like object
46 (including a chunk instance), and one optional argument, a flag which
47 specifies whether or not chunks are aligned on 2-byte boundaries. The
48 default is 1, i.e. aligned.
49 """
class Chunk:
    """File-like, read-only view of one IFF chunk inside an open file.

    The 8-byte header (4-byte ID followed by a 4-byte big-endian size) is
    consumed by the constructor; the read/seek/tell methods then operate
    on the chunk's data only, with positions measured from the start of
    the data.

    Instance attributes set by the constructor:
        closed     -- true once close() has been called
        align      -- true if chunks are padded to 2-byte boundaries
        file       -- the underlying file-like object
        chunkname  -- the 4-byte chunk ID
        chunksize  -- number of data bytes (size field minus the header)
        size_read  -- current position within the chunk data
        seekable   -- true if file.tell() worked on the underlying file
        offset     -- file position of the first data byte (only set
                      when the file is seekable)
    """

    def __init__(self, file, align = 1):
        """Read a chunk header from file and position at the chunk data.

        file is any object with a read() method (including another
        Chunk instance); align says whether chunks are aligned on 2-byte
        boundaries.  Raises EOFError if a complete 8-byte header cannot
        be read.
        """
        import struct
        self.closed = 0
        self.align = align      # whether to align to word (2-byte) boundaries
        self.file = file
        self.chunkname = file.read(4)
        if len(self.chunkname) < 4:
            raise EOFError
        try:
            self.chunksize = struct.unpack('>l', file.read(4))[0]
        except struct.error:
            # fewer than 4 bytes were available for the size field
            raise EOFError
        self.chunksize = self.chunksize - 8 # subtract header
        self.size_read = 0
        # The file counts as seekable if it can report its position.
        # Only the failures that mean "no tell()" or "tell() unsupported"
        # are caught, so unrelated errors are not hidden.
        try:
            self.offset = self.file.tell()
        except (AttributeError, IOError):
            self.seekable = 0
        else:
            self.seekable = 1

    def getname(self):
        """Return the name (ID) of the current chunk."""
        return self.chunkname

    def close(self):
        """Skip to the end of the chunk and mark it closed.

        The underlying file is not closed.  Calling close() more than
        once is harmless.
        """
        if not self.closed:
            self.skip()
            self.closed = 1

    def isatty(self):
        """Return 0; a chunk is never a tty.

        Raises ValueError if the chunk has been closed.
        """
        if self.closed:
            raise ValueError("I/O operation on closed file")
        return 0

    def seek(self, pos, whence = 0):
        """Seek to specified position into the chunk.

        Default position is 0 (start of chunk).  whence is 0 for a
        position relative to the start of the chunk data, 1 for relative
        to the current position and 2 for relative to the end of the
        chunk data.

        Raises ValueError if the chunk is closed, IOError if the
        underlying file is not seekable, and RuntimeError if the
        resulting position lies outside the chunk.
        """
        if self.closed:
            raise ValueError("I/O operation on closed file")
        if not self.seekable:
            raise IOError("cannot seek")
        if whence == 1:
            pos = pos + self.size_read
        elif whence == 2:
            pos = pos + self.chunksize
        if pos < 0 or pos > self.chunksize:
            raise RuntimeError
        self.file.seek(self.offset + pos, 0)
        self.size_read = pos

    def tell(self):
        """Return the current position within the chunk.

        Raises ValueError if the chunk has been closed.
        """
        if self.closed:
            raise ValueError("I/O operation on closed file")
        return self.size_read

    def read(self, size = -1):
        """Read at most size bytes from the chunk.

        If size is omitted or negative, read until the end
        of the chunk.  Returns an empty string once the end of the
        chunk has been reached.  Raises ValueError if the chunk has
        been closed.
        """
        if self.closed:
            raise ValueError("I/O operation on closed file")
        if self.size_read >= self.chunksize:
            return ''
        remaining = self.chunksize - self.size_read
        if size < 0 or size > remaining:
            # never read past the end of this chunk
            size = remaining
        data = self.file.read(size)
        self.size_read = self.size_read + len(data)
        if self.size_read == self.chunksize and \
           self.align and \
           (self.chunksize & 1):
            # odd-sized chunk: consume the pad byte so that the file is
            # left at the start of the next chunk
            dummy = self.file.read(1)
            self.size_read = self.size_read + len(dummy)
        return data

    def skip(self):
        """Skip the rest of the chunk.

        If you are not interested in the contents of the chunk,
        this method should be called so that the file points to
        the start of the next chunk.

        Raises ValueError if the chunk has been closed and EOFError if
        the underlying file ends before the end of the chunk.
        """
        if self.closed:
            raise ValueError("I/O operation on closed file")
        if self.seekable:
            try:
                n = self.chunksize - self.size_read
                # maybe fix alignment
                if self.align and (self.chunksize & 1):
                    n = n + 1
                self.file.seek(n, 1)
                self.size_read = self.size_read + n
                return
            except (AttributeError, IOError):
                # seeking failed after all; fall back to reading
                pass
        while self.size_read < self.chunksize:
            n = min(8192, self.chunksize - self.size_read)
            dummy = self.read(n)
            if not dummy:
                raise EOFError