Russ Cox | 10c7d19 | 2009-10-12 10:09:35 -0700 | [diff] [blame] | 1 | // Copyright 2009 The Go Authors. All rights reserved. |
| 2 | // Use of this source code is governed by a BSD-style |
| 3 | // license that can be found in the LICENSE file. |
| 4 | |
| 5 | package strings |
| 6 | |
Kyle Consalus | d7b4851 | 2010-04-20 22:18:26 -0700 | [diff] [blame] | 7 | import ( |
Russ Cox | eb69292 | 2011-11-01 22:05:34 -0400 | [diff] [blame] | 8 | "errors" |
| 9 | "io" |
Rob Pike | 45e3bcb | 2011-11-08 15:41:54 -0800 | [diff] [blame] | 10 | "unicode/utf8" |
Kyle Consalus | d7b4851 | 2010-04-20 22:18:26 -0700 | [diff] [blame] | 11 | ) |
Russ Cox | 10c7d19 | 2009-10-12 10:09:35 -0700 | [diff] [blame] | 12 | |
// Reader reads from an in-memory string. It provides the io.Reader,
// io.ReaderAt, io.Seeker, io.WriterTo, io.ByteScanner, and io.RuneScanner
// interfaces.
type Reader struct {
	s        string // text being read
	i        int64  // offset of the next byte to read
	prevRune int    // offset at which the last ReadRune started; negative if none
}
Russ Cox | 10c7d19 | 2009-10-12 10:09:35 -0700 | [diff] [blame] | 21 | |
Brad Fitzpatrick | 2198050 | 2011-05-31 08:47:03 -0700 | [diff] [blame] | 22 | // Len returns the number of bytes of the unread portion of the |
| 23 | // string. |
| 24 | func (r *Reader) Len() int { |
Brad Fitzpatrick | f074565 | 2014-03-28 12:23:51 -0700 | [diff] [blame] | 25 | if r.i >= int64(len(r.s)) { |
Brad Fitzpatrick | 396170d | 2012-02-09 17:28:41 +1100 | [diff] [blame] | 26 | return 0 |
| 27 | } |
Brad Fitzpatrick | f074565 | 2014-03-28 12:23:51 -0700 | [diff] [blame] | 28 | return int(int64(len(r.s)) - r.i) |
Brad Fitzpatrick | 2198050 | 2011-05-31 08:47:03 -0700 | [diff] [blame] | 29 | } |
| 30 | |
Brad Fitzpatrick | c264c87 | 2015-01-22 14:15:47 -0800 | [diff] [blame] | 31 | // Size returns the original length of the underlying string. |
| 32 | // Size is the number of bytes available for reading via ReadAt. |
| 33 | // The returned value is always the same and is not affected by calls |
| 34 | // to any other method. |
| 35 | func (r *Reader) Size() int64 { return int64(len(r.s)) } |
| 36 | |
Russ Cox | eb69292 | 2011-11-01 22:05:34 -0400 | [diff] [blame] | 37 | func (r *Reader) Read(b []byte) (n int, err error) { |
Brad Fitzpatrick | 396170d | 2012-02-09 17:28:41 +1100 | [diff] [blame] | 38 | if len(b) == 0 { |
| 39 | return 0, nil |
| 40 | } |
Brad Fitzpatrick | f074565 | 2014-03-28 12:23:51 -0700 | [diff] [blame] | 41 | if r.i >= int64(len(r.s)) { |
Russ Cox | eb69292 | 2011-11-01 22:05:34 -0400 | [diff] [blame] | 42 | return 0, io.EOF |
Russ Cox | 10c7d19 | 2009-10-12 10:09:35 -0700 | [diff] [blame] | 43 | } |
Brad Fitzpatrick | 13ea1fd | 2014-04-25 06:44:51 -0700 | [diff] [blame] | 44 | r.prevRune = -1 |
Robert Griesemer | 9cd3372 | 2011-05-26 11:02:07 -0700 | [diff] [blame] | 45 | n = copy(b, r.s[r.i:]) |
Brad Fitzpatrick | f074565 | 2014-03-28 12:23:51 -0700 | [diff] [blame] | 46 | r.i += int64(n) |
Robert Griesemer | d65a5cc | 2009-12-15 15:40:16 -0800 | [diff] [blame] | 47 | return |
Russ Cox | 10c7d19 | 2009-10-12 10:09:35 -0700 | [diff] [blame] | 48 | } |
| 49 | |
Brad Fitzpatrick | 7127b6f | 2012-02-15 12:58:00 +1100 | [diff] [blame] | 50 | func (r *Reader) ReadAt(b []byte, off int64) (n int, err error) { |
Brad Fitzpatrick | 2dbc5d2 | 2014-04-10 15:46:07 -0700 | [diff] [blame] | 51 | // cannot modify state - see io.ReaderAt |
Brad Fitzpatrick | 7127b6f | 2012-02-15 12:58:00 +1100 | [diff] [blame] | 52 | if off < 0 { |
Robert Griesemer | 08d8eca | 2014-04-10 21:45:41 -0700 | [diff] [blame] | 53 | return 0, errors.New("strings.Reader.ReadAt: negative offset") |
Brad Fitzpatrick | 7127b6f | 2012-02-15 12:58:00 +1100 | [diff] [blame] | 54 | } |
| 55 | if off >= int64(len(r.s)) { |
| 56 | return 0, io.EOF |
| 57 | } |
Brad Fitzpatrick | f074565 | 2014-03-28 12:23:51 -0700 | [diff] [blame] | 58 | n = copy(b, r.s[off:]) |
Brad Fitzpatrick | 7127b6f | 2012-02-15 12:58:00 +1100 | [diff] [blame] | 59 | if n < len(b) { |
| 60 | err = io.EOF |
| 61 | } |
| 62 | return |
| 63 | } |
| 64 | |
Russ Cox | eb69292 | 2011-11-01 22:05:34 -0400 | [diff] [blame] | 65 | func (r *Reader) ReadByte() (b byte, err error) { |
Rui Ueyama | a509026 | 2014-03-19 09:00:58 -0700 | [diff] [blame] | 66 | r.prevRune = -1 |
Brad Fitzpatrick | f074565 | 2014-03-28 12:23:51 -0700 | [diff] [blame] | 67 | if r.i >= int64(len(r.s)) { |
Russ Cox | eb69292 | 2011-11-01 22:05:34 -0400 | [diff] [blame] | 68 | return 0, io.EOF |
Russ Cox | 10c7d19 | 2009-10-12 10:09:35 -0700 | [diff] [blame] | 69 | } |
Robert Griesemer | 9cd3372 | 2011-05-26 11:02:07 -0700 | [diff] [blame] | 70 | b = r.s[r.i] |
| 71 | r.i++ |
Robert Griesemer | d65a5cc | 2009-12-15 15:40:16 -0800 | [diff] [blame] | 72 | return |
Russ Cox | 10c7d19 | 2009-10-12 10:09:35 -0700 | [diff] [blame] | 73 | } |
| 74 | |
Russ Cox | eb69292 | 2011-11-01 22:05:34 -0400 | [diff] [blame] | 75 | func (r *Reader) UnreadByte() error { |
Robert Griesemer | 08d8eca | 2014-04-10 21:45:41 -0700 | [diff] [blame] | 76 | r.prevRune = -1 |
Robert Griesemer | 9cd3372 | 2011-05-26 11:02:07 -0700 | [diff] [blame] | 77 | if r.i <= 0 { |
Robert Griesemer | 08d8eca | 2014-04-10 21:45:41 -0700 | [diff] [blame] | 78 | return errors.New("strings.Reader.UnreadByte: at beginning of string") |
Robert Griesemer | 9cd3372 | 2011-05-26 11:02:07 -0700 | [diff] [blame] | 79 | } |
| 80 | r.i-- |
Robert Griesemer | 9cd3372 | 2011-05-26 11:02:07 -0700 | [diff] [blame] | 81 | return nil |
| 82 | } |
| 83 | |
Russ Cox | eb69292 | 2011-11-01 22:05:34 -0400 | [diff] [blame] | 84 | func (r *Reader) ReadRune() (ch rune, size int, err error) { |
Brad Fitzpatrick | f074565 | 2014-03-28 12:23:51 -0700 | [diff] [blame] | 85 | if r.i >= int64(len(r.s)) { |
Rui Ueyama | a509026 | 2014-03-19 09:00:58 -0700 | [diff] [blame] | 86 | r.prevRune = -1 |
Russ Cox | eb69292 | 2011-11-01 22:05:34 -0400 | [diff] [blame] | 87 | return 0, 0, io.EOF |
Kyle Consalus | d7b4851 | 2010-04-20 22:18:26 -0700 | [diff] [blame] | 88 | } |
Brad Fitzpatrick | f074565 | 2014-03-28 12:23:51 -0700 | [diff] [blame] | 89 | r.prevRune = int(r.i) |
Robert Griesemer | 9cd3372 | 2011-05-26 11:02:07 -0700 | [diff] [blame] | 90 | if c := r.s[r.i]; c < utf8.RuneSelf { |
| 91 | r.i++ |
Russ Cox | 8f57181 | 2011-10-25 22:22:09 -0700 | [diff] [blame] | 92 | return rune(c), 1, nil |
Kyle Consalus | d7b4851 | 2010-04-20 22:18:26 -0700 | [diff] [blame] | 93 | } |
Russ Cox | 8f57181 | 2011-10-25 22:22:09 -0700 | [diff] [blame] | 94 | ch, size = utf8.DecodeRuneInString(r.s[r.i:]) |
Brad Fitzpatrick | f074565 | 2014-03-28 12:23:51 -0700 | [diff] [blame] | 95 | r.i += int64(size) |
Kyle Consalus | d7b4851 | 2010-04-20 22:18:26 -0700 | [diff] [blame] | 96 | return |
| 97 | } |
| 98 | |
Russ Cox | eb69292 | 2011-11-01 22:05:34 -0400 | [diff] [blame] | 99 | func (r *Reader) UnreadRune() error { |
Robert Griesemer | 9cd3372 | 2011-05-26 11:02:07 -0700 | [diff] [blame] | 100 | if r.prevRune < 0 { |
Robert Griesemer | 08d8eca | 2014-04-10 21:45:41 -0700 | [diff] [blame] | 101 | return errors.New("strings.Reader.UnreadRune: previous operation was not ReadRune") |
Robert Griesemer | 9cd3372 | 2011-05-26 11:02:07 -0700 | [diff] [blame] | 102 | } |
Brad Fitzpatrick | f074565 | 2014-03-28 12:23:51 -0700 | [diff] [blame] | 103 | r.i = int64(r.prevRune) |
Robert Griesemer | 9cd3372 | 2011-05-26 11:02:07 -0700 | [diff] [blame] | 104 | r.prevRune = -1 |
| 105 | return nil |
| 106 | } |
| 107 | |
Brad Fitzpatrick | 396170d | 2012-02-09 17:28:41 +1100 | [diff] [blame] | 108 | // Seek implements the io.Seeker interface. |
| 109 | func (r *Reader) Seek(offset int64, whence int) (int64, error) { |
Rui Ueyama | a509026 | 2014-03-19 09:00:58 -0700 | [diff] [blame] | 110 | r.prevRune = -1 |
Brad Fitzpatrick | 396170d | 2012-02-09 17:28:41 +1100 | [diff] [blame] | 111 | var abs int64 |
| 112 | switch whence { |
| 113 | case 0: |
| 114 | abs = offset |
| 115 | case 1: |
| 116 | abs = int64(r.i) + offset |
| 117 | case 2: |
| 118 | abs = int64(len(r.s)) + offset |
| 119 | default: |
Robert Griesemer | 08d8eca | 2014-04-10 21:45:41 -0700 | [diff] [blame] | 120 | return 0, errors.New("strings.Reader.Seek: invalid whence") |
Brad Fitzpatrick | 396170d | 2012-02-09 17:28:41 +1100 | [diff] [blame] | 121 | } |
| 122 | if abs < 0 { |
Robert Griesemer | 08d8eca | 2014-04-10 21:45:41 -0700 | [diff] [blame] | 123 | return 0, errors.New("strings.Reader.Seek: negative position") |
Brad Fitzpatrick | 396170d | 2012-02-09 17:28:41 +1100 | [diff] [blame] | 124 | } |
Brad Fitzpatrick | f074565 | 2014-03-28 12:23:51 -0700 | [diff] [blame] | 125 | r.i = abs |
Brad Fitzpatrick | 396170d | 2012-02-09 17:28:41 +1100 | [diff] [blame] | 126 | return abs, nil |
| 127 | } |
| 128 | |
Evan Shaw | eae25d4 | 2012-10-12 14:43:50 +1100 | [diff] [blame] | 129 | // WriteTo implements the io.WriterTo interface. |
| 130 | func (r *Reader) WriteTo(w io.Writer) (n int64, err error) { |
| 131 | r.prevRune = -1 |
Brad Fitzpatrick | f074565 | 2014-03-28 12:23:51 -0700 | [diff] [blame] | 132 | if r.i >= int64(len(r.s)) { |
Brad Fitzpatrick | c8fa7dc | 2012-11-25 09:04:13 -0800 | [diff] [blame] | 133 | return 0, nil |
Evan Shaw | eae25d4 | 2012-10-12 14:43:50 +1100 | [diff] [blame] | 134 | } |
| 135 | s := r.s[r.i:] |
| 136 | m, err := io.WriteString(w, s) |
| 137 | if m > len(s) { |
| 138 | panic("strings.Reader.WriteTo: invalid WriteString count") |
| 139 | } |
Brad Fitzpatrick | f074565 | 2014-03-28 12:23:51 -0700 | [diff] [blame] | 140 | r.i += int64(m) |
Evan Shaw | eae25d4 | 2012-10-12 14:43:50 +1100 | [diff] [blame] | 141 | n = int64(m) |
| 142 | if m != len(s) && err == nil { |
| 143 | err = io.ErrShortWrite |
| 144 | } |
| 145 | return |
| 146 | } |
| 147 | |
Russ Cox | 10c7d19 | 2009-10-12 10:09:35 -0700 | [diff] [blame] | 148 | // NewReader returns a new Reader reading from s. |
| 149 | // It is similar to bytes.NewBufferString but more efficient and read-only. |
Robert Griesemer | 9cd3372 | 2011-05-26 11:02:07 -0700 | [diff] [blame] | 150 | func NewReader(s string) *Reader { return &Reader{s, 0, -1} } |