Adam Langley | fd74a83 | 2009-10-21 17:53:50 -0700 | [diff] [blame] | 1 | // Copyright 2009 The Go Authors. All rights reserved. |
| 2 | // Use of this source code is governed by a BSD-style |
| 3 | // license that can be found in the LICENSE file. |
| 4 | |
Nigel Tao | 6a186d3 | 2011-04-20 09:57:05 +1000 | [diff] [blame] | 5 | // Package pem implements the PEM data encoding, which originated in Privacy |
Adam Langley | fd74a83 | 2009-10-21 17:53:50 -0700 | [diff] [blame] | 6 | // Enhanced Mail. The most common use of PEM encoding today is in TLS keys and |
| 7 | // certificates. See RFC 1421. |
| 8 | package pem |
| 9 | |
| 10 | import ( |
Robert Griesemer | 1c72959 | 2009-12-15 15:27:16 -0800 | [diff] [blame] | 11 | "bytes" |
| 12 | "encoding/base64" |
Adam Langley | d5841ca | 2010-02-07 15:22:36 -0500 | [diff] [blame] | 13 | "io" |
Adam Langley | fd74a83 | 2009-10-21 17:53:50 -0700 | [diff] [blame] | 14 | ) |
| 15 | |
// A Block represents a PEM encoded structure.
//
// The encoded form is:
//
//	-----BEGIN Type-----
//	Headers
//	base64-encoded Bytes
//	-----END Type-----
//
// where Headers is a possibly empty sequence of Key: Value lines.
type Block struct {
	Type    string            // The type, taken from the preamble (e.g. "RSA PRIVATE KEY").
	Headers map[string]string // Optional headers.
	Bytes   []byte            // The decoded bytes of the contents. Typically a DER encoded ASN.1 structure.
}
| 29 | |
// getLine splits data at its first line terminator. It returns the first
// line, without its trailing \n or \r\n, and everything that follows the
// terminator. When data contains no \n at all, the whole input is returned
// as the line and the remainder is empty. For any non-empty input the
// remainder is strictly shorter than data, which is what lets callers loop
// on it safely.
func getLine(data []byte) (line, rest []byte) {
	nl := bytes.IndexByte(data, '\n')
	if nl < 0 {
		// No terminator: the entire input is a single line.
		return data[:len(data)], data[len(data):]
	}

	end := nl
	if end > 0 && data[end-1] == '\r' {
		// Drop the carriage return of a \r\n pair from the line.
		end--
	}
	return data[:end], data[nl+1:]
}
| 48 | |
// removeWhitespace returns a freshly allocated copy of data from which every
// space, tab, carriage return and newline byte has been dropped. The input
// slice is left untouched.
func removeWhitespace(data []byte) []byte {
	stripped := make([]byte, 0, len(data))
	for _, c := range data {
		switch c {
		case ' ', '\t', '\r', '\n':
			// Whitespace: skip.
		default:
			stripped = append(stripped, c)
		}
	}
	return stripped
}
| 65 | |
// Markers that delimit a PEM block in its textual form.
var (
	// pemStart opens a BEGIN line; it includes the newline that precedes
	// the line so that it only matches at the start of a line.
	pemStart = []byte("\n-----BEGIN ")
	// pemEnd opens an END line; it includes the preceding newline as well.
	pemEnd = []byte("\n-----END ")
	// pemEndOfLine is the dash run that closes both BEGIN and END lines.
	pemEndOfLine = []byte("-----")
)
Adam Langley | fd74a83 | 2009-10-21 17:53:50 -0700 | [diff] [blame] | 69 | |
| 70 | // Decode will find the next PEM formatted block (certificate, private key |
| 71 | // etc) in the input. It returns that block and the remainder of the input. If |
Adam Langley | 7d68093 | 2009-10-21 19:47:52 -0700 | [diff] [blame] | 72 | // no PEM data is found, p is nil and the whole of the input is returned in |
| 73 | // rest. |
Adam Langley | fd74a83 | 2009-10-21 17:53:50 -0700 | [diff] [blame] | 74 | func Decode(data []byte) (p *Block, rest []byte) { |
| 75 | // pemStart begins with a newline. However, at the very beginning of |
| 76 | // the byte array, we'll accept the start string without it. |
Robert Griesemer | 1c72959 | 2009-12-15 15:27:16 -0800 | [diff] [blame] | 77 | rest = data |
Russ Cox | 9ac4449 | 2009-11-20 11:45:05 -0800 | [diff] [blame] | 78 | if bytes.HasPrefix(data, pemStart[1:]) { |
Robert Griesemer | 40621d5 | 2009-11-09 12:07:39 -0800 | [diff] [blame] | 79 | rest = rest[len(pemStart)-1 : len(data)] |
Adam Langley | fd74a83 | 2009-10-21 17:53:50 -0700 | [diff] [blame] | 80 | } else if i := bytes.Index(data, pemStart); i >= 0 { |
Robert Griesemer | 40621d5 | 2009-11-09 12:07:39 -0800 | [diff] [blame] | 81 | rest = rest[i+len(pemStart) : len(data)] |
Adam Langley | fd74a83 | 2009-10-21 17:53:50 -0700 | [diff] [blame] | 82 | } else { |
Robert Griesemer | 40621d5 | 2009-11-09 12:07:39 -0800 | [diff] [blame] | 83 | return nil, data |
Adam Langley | fd74a83 | 2009-10-21 17:53:50 -0700 | [diff] [blame] | 84 | } |
| 85 | |
Robert Griesemer | 1c72959 | 2009-12-15 15:27:16 -0800 | [diff] [blame] | 86 | typeLine, rest := getLine(rest) |
Adam Langley | fd74a83 | 2009-10-21 17:53:50 -0700 | [diff] [blame] | 87 | if !bytes.HasSuffix(typeLine, pemEndOfLine) { |
Russ Cox | 21e75da | 2011-06-17 06:07:13 -0400 | [diff] [blame] | 88 | return decodeError(data, rest) |
Adam Langley | fd74a83 | 2009-10-21 17:53:50 -0700 | [diff] [blame] | 89 | } |
Robert Griesemer | 1c72959 | 2009-12-15 15:27:16 -0800 | [diff] [blame] | 90 | typeLine = typeLine[0 : len(typeLine)-len(pemEndOfLine)] |
Adam Langley | fd74a83 | 2009-10-21 17:53:50 -0700 | [diff] [blame] | 91 | |
| 92 | p = &Block{ |
| 93 | Headers: make(map[string]string), |
Robert Griesemer | f44fa9b | 2010-03-02 13:46:51 -0800 | [diff] [blame] | 94 | Type: string(typeLine), |
Robert Griesemer | 1c72959 | 2009-12-15 15:27:16 -0800 | [diff] [blame] | 95 | } |
Adam Langley | fd74a83 | 2009-10-21 17:53:50 -0700 | [diff] [blame] | 96 | |
| 97 | for { |
| 98 | // This loop terminates because getLine's second result is |
Brad Fitzpatrick | dcdaeeb | 2011-07-13 10:54:51 -0700 | [diff] [blame] | 99 | // always smaller than its argument. |
Adam Langley | fd74a83 | 2009-10-21 17:53:50 -0700 | [diff] [blame] | 100 | if len(rest) == 0 { |
Robert Griesemer | 40621d5 | 2009-11-09 12:07:39 -0800 | [diff] [blame] | 101 | return nil, data |
Adam Langley | fd74a83 | 2009-10-21 17:53:50 -0700 | [diff] [blame] | 102 | } |
Robert Griesemer | 1c72959 | 2009-12-15 15:27:16 -0800 | [diff] [blame] | 103 | line, next := getLine(rest) |
Adam Langley | fd74a83 | 2009-10-21 17:53:50 -0700 | [diff] [blame] | 104 | |
Robert Griesemer | 1c72959 | 2009-12-15 15:27:16 -0800 | [diff] [blame] | 105 | i := bytes.Index(line, []byte{':'}) |
Adam Langley | fd74a83 | 2009-10-21 17:53:50 -0700 | [diff] [blame] | 106 | if i == -1 { |
Robert Griesemer | 40621d5 | 2009-11-09 12:07:39 -0800 | [diff] [blame] | 107 | break |
Adam Langley | fd74a83 | 2009-10-21 17:53:50 -0700 | [diff] [blame] | 108 | } |
| 109 | |
| 110 | // TODO(agl): need to cope with values that spread across lines. |
Robert Griesemer | 1c72959 | 2009-12-15 15:27:16 -0800 | [diff] [blame] | 111 | key, val := line[0:i], line[i+1:] |
| 112 | key = bytes.TrimSpace(key) |
| 113 | val = bytes.TrimSpace(val) |
| 114 | p.Headers[string(key)] = string(val) |
| 115 | rest = next |
Adam Langley | fd74a83 | 2009-10-21 17:53:50 -0700 | [diff] [blame] | 116 | } |
| 117 | |
Robert Griesemer | 1c72959 | 2009-12-15 15:27:16 -0800 | [diff] [blame] | 118 | i := bytes.Index(rest, pemEnd) |
Adam Langley | fd74a83 | 2009-10-21 17:53:50 -0700 | [diff] [blame] | 119 | if i < 0 { |
Russ Cox | 21e75da | 2011-06-17 06:07:13 -0400 | [diff] [blame] | 120 | return decodeError(data, rest) |
Adam Langley | fd74a83 | 2009-10-21 17:53:50 -0700 | [diff] [blame] | 121 | } |
Robert Griesemer | 1c72959 | 2009-12-15 15:27:16 -0800 | [diff] [blame] | 122 | base64Data := removeWhitespace(rest[0:i]) |
Adam Langley | fd74a83 | 2009-10-21 17:53:50 -0700 | [diff] [blame] | 123 | |
Robert Griesemer | 1c72959 | 2009-12-15 15:27:16 -0800 | [diff] [blame] | 124 | p.Bytes = make([]byte, base64.StdEncoding.DecodedLen(len(base64Data))) |
| 125 | n, err := base64.StdEncoding.Decode(p.Bytes, base64Data) |
Adam Langley | fd74a83 | 2009-10-21 17:53:50 -0700 | [diff] [blame] | 126 | if err != nil { |
Russ Cox | 21e75da | 2011-06-17 06:07:13 -0400 | [diff] [blame] | 127 | return decodeError(data, rest) |
Adam Langley | fd74a83 | 2009-10-21 17:53:50 -0700 | [diff] [blame] | 128 | } |
Robert Griesemer | 1c72959 | 2009-12-15 15:27:16 -0800 | [diff] [blame] | 129 | p.Bytes = p.Bytes[0:n] |
Adam Langley | fd74a83 | 2009-10-21 17:53:50 -0700 | [diff] [blame] | 130 | |
Robert Griesemer | 1c72959 | 2009-12-15 15:27:16 -0800 | [diff] [blame] | 131 | _, rest = getLine(rest[i+len(pemEnd):]) |
Adam Langley | fd74a83 | 2009-10-21 17:53:50 -0700 | [diff] [blame] | 132 | |
Robert Griesemer | 1c72959 | 2009-12-15 15:27:16 -0800 | [diff] [blame] | 133 | return |
Russ Cox | 21e75da | 2011-06-17 06:07:13 -0400 | [diff] [blame] | 134 | } |
Adam Langley | fd74a83 | 2009-10-21 17:53:50 -0700 | [diff] [blame] | 135 | |
Russ Cox | 21e75da | 2011-06-17 06:07:13 -0400 | [diff] [blame] | 136 | func decodeError(data, rest []byte) (*Block, []byte) { |
Adam Langley | fd74a83 | 2009-10-21 17:53:50 -0700 | [diff] [blame] | 137 | // If we get here then we have rejected a likely looking, but |
| 138 | // ultimately invalid PEM block. We need to start over from a new |
| 139 | // position. We have consumed the preamble line and will have consumed |
| 140 | // any lines which could be header lines. However, a valid preamble |
| 141 | // line is not a valid header line, therefore we cannot have consumed |
| 142 | // the preamble line for the any subsequent block. Thus, we will always |
Robert Hencke | c8727c8 | 2011-05-18 13:14:56 -0400 | [diff] [blame] | 143 | // find any valid block, no matter what bytes precede it. |
Adam Langley | fd74a83 | 2009-10-21 17:53:50 -0700 | [diff] [blame] | 144 | // |
| 145 | // For example, if the input is |
| 146 | // |
| 147 | // -----BEGIN MALFORMED BLOCK----- |
| 148 | // junk that may look like header lines |
| 149 | // or data lines, but no END line |
| 150 | // |
| 151 | // -----BEGIN ACTUAL BLOCK----- |
| 152 | // realdata |
| 153 | // -----END ACTUAL BLOCK----- |
| 154 | // |
| 155 | // we've failed to parse using the first BEGIN line |
| 156 | // and now will try again, using the second BEGIN line. |
Russ Cox | 21e75da | 2011-06-17 06:07:13 -0400 | [diff] [blame] | 157 | p, rest := Decode(rest) |
Adam Langley | fd74a83 | 2009-10-21 17:53:50 -0700 | [diff] [blame] | 158 | if p == nil { |
Robert Griesemer | 40621d5 | 2009-11-09 12:07:39 -0800 | [diff] [blame] | 159 | rest = data |
Adam Langley | fd74a83 | 2009-10-21 17:53:50 -0700 | [diff] [blame] | 160 | } |
Russ Cox | 21e75da | 2011-06-17 06:07:13 -0400 | [diff] [blame] | 161 | return p, rest |
Adam Langley | fd74a83 | 2009-10-21 17:53:50 -0700 | [diff] [blame] | 162 | } |
Adam Langley | d5841ca | 2010-02-07 15:22:36 -0500 | [diff] [blame] | 163 | |
// pemLineLength is the number of bytes written per output line before a
// newline is inserted.
const pemLineLength = 64

// lineBreaker is an io.Writer that forwards everything written to it to out,
// inserting a '\n' after every pemLineLength bytes. Data that does not yet
// complete a line is held in line until more data arrives or Close is called.
type lineBreaker struct {
	line [pemLineLength]byte // bytes of the current, incomplete line
	used int                 // number of valid bytes in line; always < pemLineLength
	out  io.Writer           // destination for completed lines
}

// Write buffers b and emits every line that b completes, each followed by a
// newline. On success it returns len(b), as the io.Writer contract requires.
// If the underlying writer fails, it returns that error together with the
// number of bytes of b that were emitted as part of completed lines.
func (l *lineBreaker) Write(b []byte) (n int, err error) {
	// Each iteration completes exactly one output line.
	for l.used+len(b) >= pemLineLength {
		if l.used > 0 {
			if _, err = l.out.Write(l.line[:l.used]); err != nil {
				return n, err
			}
		}
		// excess is how many bytes of b are needed to fill the line.
		excess := pemLineLength - l.used
		l.used = 0

		if _, err = l.out.Write(b[:excess]); err != nil {
			return n, err
		}
		if _, err = l.out.Write([]byte{'\n'}); err != nil {
			return n, err
		}

		n += excess
		b = b[excess:]
	}

	// What remains is shorter than a full line; keep it for later.
	copy(l.line[l.used:], b)
	l.used += len(b)
	return n + len(b), nil
}

// Close flushes any buffered partial line, followed by a newline. It writes
// nothing if no partial line is pending, and it does not close the
// underlying writer.
func (l *lineBreaker) Close() (err error) {
	if l.used == 0 {
		return nil
	}
	if _, err = l.out.Write(l.line[:l.used]); err != nil {
		return err
	}
	_, err = l.out.Write([]byte{'\n'})
	return err
}
| 210 | |
Russ Cox | c2049d2 | 2011-11-01 22:04:37 -0400 | [diff] [blame^] | 211 | func Encode(out io.Writer, b *Block) (err error) { |
Adam Langley | d5841ca | 2010-02-07 15:22:36 -0500 | [diff] [blame] | 212 | _, err = out.Write(pemStart[1:]) |
| 213 | if err != nil { |
| 214 | return |
| 215 | } |
Russ Cox | 9750adb | 2010-02-25 16:01:29 -0800 | [diff] [blame] | 216 | _, err = out.Write([]byte(b.Type + "-----\n")) |
Adam Langley | d5841ca | 2010-02-07 15:22:36 -0500 | [diff] [blame] | 217 | if err != nil { |
| 218 | return |
| 219 | } |
| 220 | |
Russ Cox | 36560d2 | 2010-07-12 16:48:49 -0700 | [diff] [blame] | 221 | if len(b.Headers) > 0 { |
| 222 | for k, v := range b.Headers { |
| 223 | _, err = out.Write([]byte(k + ": " + v + "\n")) |
| 224 | if err != nil { |
| 225 | return |
| 226 | } |
Adam Langley | d5841ca | 2010-02-07 15:22:36 -0500 | [diff] [blame] | 227 | } |
Adam Langley | d5841ca | 2010-02-07 15:22:36 -0500 | [diff] [blame] | 228 | _, err = out.Write([]byte{'\n'}) |
| 229 | if err != nil { |
| 230 | return |
| 231 | } |
| 232 | } |
| 233 | |
| 234 | var breaker lineBreaker |
| 235 | breaker.out = out |
| 236 | |
| 237 | b64 := base64.NewEncoder(base64.StdEncoding, &breaker) |
| 238 | _, err = b64.Write(b.Bytes) |
| 239 | if err != nil { |
| 240 | return |
| 241 | } |
| 242 | b64.Close() |
| 243 | breaker.Close() |
| 244 | |
| 245 | _, err = out.Write(pemEnd[1:]) |
| 246 | if err != nil { |
| 247 | return |
| 248 | } |
Russ Cox | 9750adb | 2010-02-25 16:01:29 -0800 | [diff] [blame] | 249 | _, err = out.Write([]byte(b.Type + "-----\n")) |
Adam Langley | d5841ca | 2010-02-07 15:22:36 -0500 | [diff] [blame] | 250 | return |
| 251 | } |
| 252 | |
| 253 | func EncodeToMemory(b *Block) []byte { |
| 254 | buf := bytes.NewBuffer(nil) |
| 255 | Encode(buf, b) |
| 256 | return buf.Bytes() |
| 257 | } |