blob: 839b37aac4e4d31a1aff8967ee261ac9c5284bc6 [file] [log] [blame]
Russ Coxad17a9c2012-02-18 21:02:41 -05001// Copyright 2009 The Go Authors. All rights reserved.
2// Use of this source code is governed by a BSD-style
3// license that can be found in the LICENSE file.
4
// Parse "zoneinfo" time zone file.
// This is a fairly standard file format used on OS X, Linux, BSD, Sun, and others.
// See tzfile(5), http://en.wikipedia.org/wiki/Zoneinfo,
// and ftp://munnari.oz.au/pub/oldtz/
9
10package time
11
Florian Uekermann7340d132017-09-18 19:22:29 +020012import (
13 "errors"
14 "syscall"
15)
Russ Coxad17a9c2012-02-18 21:02:41 -050016
// maxFileSize is the largest file, in bytes, that readFile will return.
// For reference, the zoneinfo.zip distributed by Go is ~350 KB,
// so 10 MB leaves a very generous margin.
const maxFileSize = 10 * 1024 * 1024
21
// fileSizeError is the error readFile returns for a file that is larger
// than maxFileSize. Its value is the name of the offending file.
type fileSizeError string

// Error implements the error interface.
func (f fileSizeError) Error() string {
	name := string(f)
	return "time: file " + name + " is too large"
}
27
// Copies of the io.Seek* constants, kept here to avoid importing "io".
const (
	seekStart   = iota // 0
	seekCurrent        // 1
	seekEnd            // 2
)
34
// dataIO is a simple sequential reader over a binary blob of data.
// p holds the bytes that have not been consumed yet; error is set once
// any read has asked for more data than was available.
type dataIO struct {
	p     []byte
	error bool
}

// read consumes and returns the next n bytes of d.
// If n is negative or fewer than n bytes remain, read discards the
// remaining data, sets d.error and returns nil. A negative n can be
// produced by callers that convert an unsigned 32-bit count to int on a
// platform with 32-bit ints; it is treated like a short read instead of
// being allowed to panic in the slice expression below.
func (d *dataIO) read(n int) []byte {
	if n < 0 || len(d.p) < n {
		d.p = nil
		d.error = true
		return nil
	}
	p := d.p[:n]
	d.p = d.p[n:]
	return p
}

// big4 consumes four bytes and returns them as a big-endian uint32.
// ok is false, and d.error is set, if fewer than four bytes remain.
func (d *dataIO) big4() (n uint32, ok bool) {
	p := d.read(4)
	if len(p) < 4 {
		d.error = true
		return 0, false
	}
	return uint32(p[3]) | uint32(p[2])<<8 | uint32(p[1])<<16 | uint32(p[0])<<24, true
}

// byte consumes and returns a single byte.
// ok is false, and d.error is set, if no data remains.
func (d *dataIO) byte() (n byte, ok bool) {
	p := d.read(1)
	if len(p) < 1 {
		d.error = true
		return 0, false
	}
	return p[0], true
}
69
// byteString returns the bytes of p that precede the first NUL byte as a
// string, or all of p if it contains no NUL.
func byteString(p []byte) string {
	for i, c := range p {
		if c == 0 {
			return string(p[:i])
		}
	}
	return string(p)
}
79
// badData is the error LoadLocationFromTZData returns when the time zone
// data it is given is truncated or otherwise malformed.
var badData = errors.New("malformed time zone information")
81
Florian Uekermann2951f902017-10-06 17:16:43 +020082// LoadLocationFromTZData returns a Location with the given name
83// initialized from the IANA Time Zone database-formatted data.
84// The data should be in the format of a standard IANA time zone file
85// (for example, the content of /etc/localtime on Unix systems).
86func LoadLocationFromTZData(name string, data []byte) (*Location, error) {
87 d := dataIO{data, false}
Russ Coxad17a9c2012-02-18 21:02:41 -050088
89 // 4-byte magic "TZif"
90 if magic := d.read(4); string(magic) != "TZif" {
91 return nil, badData
92 }
93
94 // 1-byte version, then 15 bytes of padding
95 var p []byte
Brad Fitzpatrick14a75ec2014-06-03 11:44:17 +090096 if p = d.read(16); len(p) != 16 || p[0] != 0 && p[0] != '2' && p[0] != '3' {
Russ Coxad17a9c2012-02-18 21:02:41 -050097 return nil, badData
98 }
99
100 // six big-endian 32-bit integers:
101 // number of UTC/local indicators
102 // number of standard/wall indicators
103 // number of leap seconds
104 // number of transition times
105 // number of local time zones
106 // number of characters of time zone abbrev strings
107 const (
108 NUTCLocal = iota
109 NStdWall
110 NLeap
111 NTime
112 NZone
113 NChar
114 )
115 var n [6]int
116 for i := 0; i < 6; i++ {
117 nn, ok := d.big4()
118 if !ok {
119 return nil, badData
120 }
121 n[i] = int(nn)
122 }
123
124 // Transition times.
Russ Cox225a2e12017-11-21 10:09:05 -0500125 txtimes := dataIO{d.read(n[NTime] * 4), false}
Russ Coxad17a9c2012-02-18 21:02:41 -0500126
127 // Time zone indices for transition times.
128 txzones := d.read(n[NTime])
129
130 // Zone info structures
Russ Cox225a2e12017-11-21 10:09:05 -0500131 zonedata := dataIO{d.read(n[NZone] * 6), false}
Russ Coxad17a9c2012-02-18 21:02:41 -0500132
133 // Time zone abbreviations.
134 abbrev := d.read(n[NChar])
135
136 // Leap-second time pairs
137 d.read(n[NLeap] * 8)
138
139 // Whether tx times associated with local time types
140 // are specified as standard time or wall time.
141 isstd := d.read(n[NStdWall])
142
143 // Whether tx times associated with local time types
144 // are specified as UTC or local time.
145 isutc := d.read(n[NUTCLocal])
146
147 if d.error { // ran out of data
148 return nil, badData
149 }
150
Brad Fitzpatrick14a75ec2014-06-03 11:44:17 +0900151 // If version == 2 or 3, the entire file repeats, this time using
Russ Coxad17a9c2012-02-18 21:02:41 -0500152 // 8-byte ints for txtimes and leap seconds.
153 // We won't need those until 2106.
154
155 // Now we can build up a useful data structure.
156 // First the zone information.
157 // utcoff[4] isdst[1] nameindex[1]
158 zone := make([]zone, n[NZone])
159 for i := range zone {
160 var ok bool
161 var n uint32
162 if n, ok = zonedata.big4(); !ok {
163 return nil, badData
164 }
Russ Coxedce6342012-09-23 23:04:28 -0400165 zone[i].offset = int(int32(n))
Russ Coxad17a9c2012-02-18 21:02:41 -0500166 var b byte
167 if b, ok = zonedata.byte(); !ok {
168 return nil, badData
169 }
170 zone[i].isDST = b != 0
171 if b, ok = zonedata.byte(); !ok || int(b) >= len(abbrev) {
172 return nil, badData
173 }
174 zone[i].name = byteString(abbrev[b:])
175 }
176
177 // Now the transition time info.
178 tx := make([]zoneTrans, n[NTime])
179 for i := range tx {
180 var ok bool
181 var n uint32
182 if n, ok = txtimes.big4(); !ok {
183 return nil, badData
184 }
185 tx[i].when = int64(int32(n))
186 if int(txzones[i]) >= len(zone) {
187 return nil, badData
188 }
189 tx[i].index = txzones[i]
190 if i < len(isstd) {
191 tx[i].isstd = isstd[i] != 0
192 }
193 if i < len(isutc) {
194 tx[i].isutc = isutc[i] != 0
195 }
196 }
197
Russ Cox6a003d72013-02-03 22:41:00 -0500198 if len(tx) == 0 {
199 // Build fake transition to cover all time.
200 // This happens in fixed locations like "Etc/GMT0".
Ian Lance Taylorfabd2612014-01-31 17:22:10 -0800201 tx = append(tx, zoneTrans{when: alpha, index: 0})
Russ Cox6a003d72013-02-03 22:41:00 -0500202 }
203
Shenghou Mad1ef9b52012-12-19 03:04:09 +0800204 // Committed to succeed.
Florian Uekermann7340d132017-09-18 19:22:29 +0200205 l := &Location{zone: zone, tx: tx, name: name}
Russ Coxad17a9c2012-02-18 21:02:41 -0500206
207 // Fill in the cache with information about right now,
208 // since that will be the most common lookup.
Russ Cox0e335592017-02-02 16:20:58 -0500209 sec, _, _ := now()
Russ Coxad17a9c2012-02-18 21:02:41 -0500210 for i := range tx {
211 if tx[i].when <= sec && (i+1 == len(tx) || sec < tx[i+1].when) {
212 l.cacheStart = tx[i].when
Ian Lance Taylorfabd2612014-01-31 17:22:10 -0800213 l.cacheEnd = omega
Russ Coxad17a9c2012-02-18 21:02:41 -0500214 if i+1 < len(tx) {
215 l.cacheEnd = tx[i+1].when
216 }
217 l.cacheZone = &l.zone[tx[i].index]
218 }
219 }
220
221 return l, nil
222}
223
Russ Cox02298ae2017-11-15 17:53:30 +0000224// loadTzinfoFromDirOrZip returns the contents of the file with the given name
225// in dir. dir can either be an uncompressed zip file, or a directory.
226func loadTzinfoFromDirOrZip(dir, name string) ([]byte, error) {
227 if len(dir) > 4 && dir[len(dir)-4:] == ".zip" {
228 return loadTzinfoFromZip(dir, name)
229 }
230 if dir != "" {
231 name = dir + "/" + name
232 }
233 return readFile(name)
234}
235
// There are 500+ zoneinfo files. Rather than distribute them all
// individually, we ship them in an uncompressed zip file.
// Used this way, the zip file format serves as a commonly readable
// container for the individual small files. We choose zip over tar
// because zip files have a contiguous table of contents, making
// individual file lookups faster, and because the per-file overhead
// in a zip file is considerably less than tar's 512 bytes.
243
// get4 decodes the first four bytes of b as a little-endian 32-bit value.
// It returns 0 if b holds fewer than four bytes.
func get4(b []byte) int {
	if len(b) < 4 {
		return 0
	}
	v := 0
	// Fold from the most significant byte down to the least significant.
	for i := 3; i >= 0; i-- {
		v = v<<8 | int(b[i])
	}
	return v
}
251
// get2 decodes the first two bytes of b as a little-endian 16-bit value.
// It returns 0 if b holds fewer than two bytes.
func get2(b []byte) int {
	if len(b) >= 2 {
		lo, hi := int(b[0]), int(b[1])
		return hi<<8 | lo
	}
	return 0
}
259
Florian Uekermann7340d132017-09-18 19:22:29 +0200260// loadTzinfoFromZip returns the contents of the file with the given name
261// in the given uncompressed zip file.
262func loadTzinfoFromZip(zipfile, name string) ([]byte, error) {
Russ Coxcb5e1812012-02-19 03:16:20 -0500263 fd, err := open(zipfile)
264 if err != nil {
265 return nil, errors.New("open " + zipfile + ": " + err.Error())
266 }
267 defer closefd(fd)
268
269 const (
270 zecheader = 0x06054b50
271 zcheader = 0x02014b50
272 ztailsize = 22
273
274 zheadersize = 30
275 zheader = 0x04034b50
276 )
277
278 buf := make([]byte, ztailsize)
279 if err := preadn(fd, buf, -ztailsize); err != nil || get4(buf) != zecheader {
280 return nil, errors.New("corrupt zip file " + zipfile)
281 }
282 n := get2(buf[10:])
283 size := get4(buf[12:])
284 off := get4(buf[16:])
285
286 buf = make([]byte, size)
287 if err := preadn(fd, buf, off); err != nil {
288 return nil, errors.New("corrupt zip file " + zipfile)
289 }
290
291 for i := 0; i < n; i++ {
292 // zip entry layout:
293 // 0 magic[4]
294 // 4 madevers[1]
295 // 5 madeos[1]
296 // 6 extvers[1]
297 // 7 extos[1]
298 // 8 flags[2]
299 // 10 meth[2]
300 // 12 modtime[2]
301 // 14 moddate[2]
302 // 16 crc[4]
303 // 20 csize[4]
304 // 24 uncsize[4]
305 // 28 namelen[2]
306 // 30 xlen[2]
307 // 32 fclen[2]
308 // 34 disknum[2]
309 // 36 iattr[2]
310 // 38 eattr[4]
311 // 42 off[4]
312 // 46 name[namelen]
313 // 46+namelen+xlen+fclen - next header
Robert Griesemer465b9c32012-10-30 13:38:01 -0700314 //
Russ Coxcb5e1812012-02-19 03:16:20 -0500315 if get4(buf) != zcheader {
316 break
317 }
318 meth := get2(buf[10:])
319 size := get4(buf[24:])
320 namelen := get2(buf[28:])
321 xlen := get2(buf[30:])
322 fclen := get2(buf[32:])
323 off := get4(buf[42:])
324 zname := buf[46 : 46+namelen]
325 buf = buf[46+namelen+xlen+fclen:]
326 if string(zname) != name {
327 continue
328 }
329 if meth != 0 {
330 return nil, errors.New("unsupported compression for " + name + " in " + zipfile)
331 }
332
333 // zip per-file header layout:
334 // 0 magic[4]
335 // 4 extvers[1]
336 // 5 extos[1]
337 // 6 flags[2]
338 // 8 meth[2]
339 // 10 modtime[2]
340 // 12 moddate[2]
341 // 14 crc[4]
342 // 18 csize[4]
343 // 22 uncsize[4]
344 // 26 namelen[2]
345 // 28 xlen[2]
346 // 30 name[namelen]
347 // 30+namelen+xlen - file data
348 //
349 buf = make([]byte, zheadersize+namelen)
350 if err := preadn(fd, buf, off); err != nil ||
351 get4(buf) != zheader ||
352 get2(buf[8:]) != meth ||
353 get2(buf[26:]) != namelen ||
354 string(buf[30:30+namelen]) != name {
355 return nil, errors.New("corrupt zip file " + zipfile)
356 }
357 xlen = get2(buf[28:])
358
359 buf = make([]byte, size)
360 if err := preadn(fd, buf, off+30+namelen+xlen); err != nil {
361 return nil, errors.New("corrupt zip file " + zipfile)
362 }
363
Florian Uekermann7340d132017-09-18 19:22:29 +0200364 return buf, nil
Russ Coxcb5e1812012-02-19 03:16:20 -0500365 }
366
Russ Cox02298ae2017-11-15 17:53:30 +0000367 return nil, errors.New("cannot find " + name + " in zip file " + zipfile)
Russ Coxcb5e1812012-02-19 03:16:20 -0500368}
Florian Uekermann7340d132017-09-18 19:22:29 +0200369
// loadTzinfoFromTzdata returns the time zone information of the time zone
// with the given name, from a tzdata database file as they are typically
// found on android.
//
// It is a function variable with no value assigned in this file, so it is
// nil unless some other code sets it (presumably platform-specific code
// elsewhere in the package; verify against the android build).
var loadTzinfoFromTzdata func(file, name string) ([]byte, error)
Florian Uekermann7340d132017-09-18 19:22:29 +0200374
375// loadTzinfo returns the time zone information of the time zone
376// with the given name, from a given source. A source may be a
377// timezone database directory, tzdata database file or an uncompressed
378// zip file, containing the contents of such a directory.
379func loadTzinfo(name string, source string) ([]byte, error) {
380 if len(source) >= 6 && source[len(source)-6:] == "tzdata" {
381 return loadTzinfoFromTzdata(source, name)
382 }
Russ Cox02298ae2017-11-15 17:53:30 +0000383 return loadTzinfoFromDirOrZip(source, name)
Florian Uekermann7340d132017-09-18 19:22:29 +0200384}
385
386// loadLocation returns the Location with the given name from one of
387// the specified sources. See loadTzinfo for a list of supported sources.
388// The first timezone data matching the given name that is successfully loaded
389// and parsed is returned as a Location.
390func loadLocation(name string, sources []string) (z *Location, firstErr error) {
391 for _, source := range sources {
392 var zoneData, err = loadTzinfo(name, source)
393 if err == nil {
Florian Uekermann2951f902017-10-06 17:16:43 +0200394 if z, err = LoadLocationFromTZData(name, zoneData); err == nil {
Florian Uekermann7340d132017-09-18 19:22:29 +0200395 return z, nil
396 }
397 }
398 if firstErr == nil && err != syscall.ENOENT {
399 firstErr = err
400 }
401 }
402 if firstErr != nil {
403 return nil, firstErr
404 }
405 return nil, errors.New("unknown time zone " + name)
406}
Ian Lance Taylor71d08322017-09-26 10:50:57 -0700407
408// readFile reads and returns the content of the named file.
409// It is a trivial implementation of ioutil.ReadFile, reimplemented
410// here to avoid depending on io/ioutil or os.
411// It returns an error if name exceeds maxFileSize bytes.
412func readFile(name string) ([]byte, error) {
413 f, err := open(name)
414 if err != nil {
415 return nil, err
416 }
417 defer closefd(f)
418 var (
419 buf [4096]byte
420 ret []byte
421 n int
422 )
423 for {
424 n, err = read(f, buf[:])
425 if n > 0 {
426 ret = append(ret, buf[:n]...)
427 }
428 if n == 0 || err != nil {
429 break
430 }
431 if len(ret) > maxFileSize {
432 return nil, fileSizeError(name)
433 }
434 }
435 return ret, err
436}