Russ Cox | 10c7d19 | 2009-10-12 10:09:35 -0700 | [diff] [blame] | 1 | // Copyright 2009 The Go Authors. All rights reserved. |
| 2 | // Use of this source code is governed by a BSD-style |
| 3 | // license that can be found in the LICENSE file. |
| 4 | |
| 5 | package strings |
| 6 | |
Kyle Consalus | d7b4851 | 2010-04-20 22:18:26 -0700 | [diff] [blame] | 7 | import ( |
Russ Cox | eb69292 | 2011-11-01 22:05:34 -0400 | [diff] [blame] | 8 | "errors" |
| 9 | "io" |
Rob Pike | 45e3bcb | 2011-11-08 15:41:54 -0800 | [diff] [blame] | 10 | "unicode/utf8" |
Kyle Consalus | d7b4851 | 2010-04-20 22:18:26 -0700 | [diff] [blame] | 11 | ) |
Russ Cox | 10c7d19 | 2009-10-12 10:09:35 -0700 | [diff] [blame] | 12 | |
// A Reader implements the io.Reader, io.ReaderAt, io.Seeker, io.WriterTo,
// io.ByteScanner, and io.RuneScanner interfaces by reading
// from a string.
type Reader struct {
	s        string // string being read
	i        int64  // current reading index
	prevRune int    // index of previous rune; or < 0
}
Russ Cox | 10c7d19 | 2009-10-12 10:09:35 -0700 | [diff] [blame] | 21 | |
Brad Fitzpatrick | 2198050 | 2011-05-31 08:47:03 -0700 | [diff] [blame] | 22 | // Len returns the number of bytes of the unread portion of the |
| 23 | // string. |
| 24 | func (r *Reader) Len() int { |
Brad Fitzpatrick | f074565 | 2014-03-28 12:23:51 -0700 | [diff] [blame] | 25 | if r.i >= int64(len(r.s)) { |
Brad Fitzpatrick | 396170d | 2012-02-09 17:28:41 +1100 | [diff] [blame] | 26 | return 0 |
| 27 | } |
Brad Fitzpatrick | f074565 | 2014-03-28 12:23:51 -0700 | [diff] [blame] | 28 | return int(int64(len(r.s)) - r.i) |
Brad Fitzpatrick | 2198050 | 2011-05-31 08:47:03 -0700 | [diff] [blame] | 29 | } |
| 30 | |
Russ Cox | eb69292 | 2011-11-01 22:05:34 -0400 | [diff] [blame] | 31 | func (r *Reader) Read(b []byte) (n int, err error) { |
Rui Ueyama | a509026 | 2014-03-19 09:00:58 -0700 | [diff] [blame] | 32 | r.prevRune = -1 |
Brad Fitzpatrick | 396170d | 2012-02-09 17:28:41 +1100 | [diff] [blame] | 33 | if len(b) == 0 { |
| 34 | return 0, nil |
| 35 | } |
Brad Fitzpatrick | f074565 | 2014-03-28 12:23:51 -0700 | [diff] [blame] | 36 | if r.i >= int64(len(r.s)) { |
Russ Cox | eb69292 | 2011-11-01 22:05:34 -0400 | [diff] [blame] | 37 | return 0, io.EOF |
Russ Cox | 10c7d19 | 2009-10-12 10:09:35 -0700 | [diff] [blame] | 38 | } |
Robert Griesemer | 9cd3372 | 2011-05-26 11:02:07 -0700 | [diff] [blame] | 39 | n = copy(b, r.s[r.i:]) |
Brad Fitzpatrick | f074565 | 2014-03-28 12:23:51 -0700 | [diff] [blame] | 40 | r.i += int64(n) |
Robert Griesemer | d65a5cc | 2009-12-15 15:40:16 -0800 | [diff] [blame] | 41 | return |
Russ Cox | 10c7d19 | 2009-10-12 10:09:35 -0700 | [diff] [blame] | 42 | } |
| 43 | |
Brad Fitzpatrick | 7127b6f | 2012-02-15 12:58:00 +1100 | [diff] [blame] | 44 | func (r *Reader) ReadAt(b []byte, off int64) (n int, err error) { |
Brad Fitzpatrick | 2dbc5d2 | 2014-04-10 15:46:07 -0700 | [diff] [blame] | 45 | // cannot modify state - see io.ReaderAt |
Brad Fitzpatrick | 7127b6f | 2012-02-15 12:58:00 +1100 | [diff] [blame] | 46 | if off < 0 { |
Robert Griesemer | 08d8eca | 2014-04-10 21:45:41 -0700 | [diff] [blame^] | 47 | return 0, errors.New("strings.Reader.ReadAt: negative offset") |
Brad Fitzpatrick | 7127b6f | 2012-02-15 12:58:00 +1100 | [diff] [blame] | 48 | } |
| 49 | if off >= int64(len(r.s)) { |
| 50 | return 0, io.EOF |
| 51 | } |
Brad Fitzpatrick | f074565 | 2014-03-28 12:23:51 -0700 | [diff] [blame] | 52 | n = copy(b, r.s[off:]) |
Brad Fitzpatrick | 7127b6f | 2012-02-15 12:58:00 +1100 | [diff] [blame] | 53 | if n < len(b) { |
| 54 | err = io.EOF |
| 55 | } |
| 56 | return |
| 57 | } |
| 58 | |
Russ Cox | eb69292 | 2011-11-01 22:05:34 -0400 | [diff] [blame] | 59 | func (r *Reader) ReadByte() (b byte, err error) { |
Rui Ueyama | a509026 | 2014-03-19 09:00:58 -0700 | [diff] [blame] | 60 | r.prevRune = -1 |
Brad Fitzpatrick | f074565 | 2014-03-28 12:23:51 -0700 | [diff] [blame] | 61 | if r.i >= int64(len(r.s)) { |
Russ Cox | eb69292 | 2011-11-01 22:05:34 -0400 | [diff] [blame] | 62 | return 0, io.EOF |
Russ Cox | 10c7d19 | 2009-10-12 10:09:35 -0700 | [diff] [blame] | 63 | } |
Robert Griesemer | 9cd3372 | 2011-05-26 11:02:07 -0700 | [diff] [blame] | 64 | b = r.s[r.i] |
| 65 | r.i++ |
Robert Griesemer | d65a5cc | 2009-12-15 15:40:16 -0800 | [diff] [blame] | 66 | return |
Russ Cox | 10c7d19 | 2009-10-12 10:09:35 -0700 | [diff] [blame] | 67 | } |
| 68 | |
Russ Cox | eb69292 | 2011-11-01 22:05:34 -0400 | [diff] [blame] | 69 | func (r *Reader) UnreadByte() error { |
Robert Griesemer | 08d8eca | 2014-04-10 21:45:41 -0700 | [diff] [blame^] | 70 | r.prevRune = -1 |
Robert Griesemer | 9cd3372 | 2011-05-26 11:02:07 -0700 | [diff] [blame] | 71 | if r.i <= 0 { |
Robert Griesemer | 08d8eca | 2014-04-10 21:45:41 -0700 | [diff] [blame^] | 72 | return errors.New("strings.Reader.UnreadByte: at beginning of string") |
Robert Griesemer | 9cd3372 | 2011-05-26 11:02:07 -0700 | [diff] [blame] | 73 | } |
| 74 | r.i-- |
Robert Griesemer | 9cd3372 | 2011-05-26 11:02:07 -0700 | [diff] [blame] | 75 | return nil |
| 76 | } |
| 77 | |
Russ Cox | eb69292 | 2011-11-01 22:05:34 -0400 | [diff] [blame] | 78 | func (r *Reader) ReadRune() (ch rune, size int, err error) { |
Brad Fitzpatrick | f074565 | 2014-03-28 12:23:51 -0700 | [diff] [blame] | 79 | if r.i >= int64(len(r.s)) { |
Rui Ueyama | a509026 | 2014-03-19 09:00:58 -0700 | [diff] [blame] | 80 | r.prevRune = -1 |
Russ Cox | eb69292 | 2011-11-01 22:05:34 -0400 | [diff] [blame] | 81 | return 0, 0, io.EOF |
Kyle Consalus | d7b4851 | 2010-04-20 22:18:26 -0700 | [diff] [blame] | 82 | } |
Brad Fitzpatrick | f074565 | 2014-03-28 12:23:51 -0700 | [diff] [blame] | 83 | r.prevRune = int(r.i) |
Robert Griesemer | 9cd3372 | 2011-05-26 11:02:07 -0700 | [diff] [blame] | 84 | if c := r.s[r.i]; c < utf8.RuneSelf { |
| 85 | r.i++ |
Russ Cox | 8f57181 | 2011-10-25 22:22:09 -0700 | [diff] [blame] | 86 | return rune(c), 1, nil |
Kyle Consalus | d7b4851 | 2010-04-20 22:18:26 -0700 | [diff] [blame] | 87 | } |
Russ Cox | 8f57181 | 2011-10-25 22:22:09 -0700 | [diff] [blame] | 88 | ch, size = utf8.DecodeRuneInString(r.s[r.i:]) |
Brad Fitzpatrick | f074565 | 2014-03-28 12:23:51 -0700 | [diff] [blame] | 89 | r.i += int64(size) |
Kyle Consalus | d7b4851 | 2010-04-20 22:18:26 -0700 | [diff] [blame] | 90 | return |
| 91 | } |
| 92 | |
Russ Cox | eb69292 | 2011-11-01 22:05:34 -0400 | [diff] [blame] | 93 | func (r *Reader) UnreadRune() error { |
Robert Griesemer | 9cd3372 | 2011-05-26 11:02:07 -0700 | [diff] [blame] | 94 | if r.prevRune < 0 { |
Robert Griesemer | 08d8eca | 2014-04-10 21:45:41 -0700 | [diff] [blame^] | 95 | return errors.New("strings.Reader.UnreadRune: previous operation was not ReadRune") |
Robert Griesemer | 9cd3372 | 2011-05-26 11:02:07 -0700 | [diff] [blame] | 96 | } |
Brad Fitzpatrick | f074565 | 2014-03-28 12:23:51 -0700 | [diff] [blame] | 97 | r.i = int64(r.prevRune) |
Robert Griesemer | 9cd3372 | 2011-05-26 11:02:07 -0700 | [diff] [blame] | 98 | r.prevRune = -1 |
| 99 | return nil |
| 100 | } |
| 101 | |
Brad Fitzpatrick | 396170d | 2012-02-09 17:28:41 +1100 | [diff] [blame] | 102 | // Seek implements the io.Seeker interface. |
| 103 | func (r *Reader) Seek(offset int64, whence int) (int64, error) { |
Rui Ueyama | a509026 | 2014-03-19 09:00:58 -0700 | [diff] [blame] | 104 | r.prevRune = -1 |
Brad Fitzpatrick | 396170d | 2012-02-09 17:28:41 +1100 | [diff] [blame] | 105 | var abs int64 |
| 106 | switch whence { |
| 107 | case 0: |
| 108 | abs = offset |
| 109 | case 1: |
| 110 | abs = int64(r.i) + offset |
| 111 | case 2: |
| 112 | abs = int64(len(r.s)) + offset |
| 113 | default: |
Robert Griesemer | 08d8eca | 2014-04-10 21:45:41 -0700 | [diff] [blame^] | 114 | return 0, errors.New("strings.Reader.Seek: invalid whence") |
Brad Fitzpatrick | 396170d | 2012-02-09 17:28:41 +1100 | [diff] [blame] | 115 | } |
| 116 | if abs < 0 { |
Robert Griesemer | 08d8eca | 2014-04-10 21:45:41 -0700 | [diff] [blame^] | 117 | return 0, errors.New("strings.Reader.Seek: negative position") |
Brad Fitzpatrick | 396170d | 2012-02-09 17:28:41 +1100 | [diff] [blame] | 118 | } |
Brad Fitzpatrick | f074565 | 2014-03-28 12:23:51 -0700 | [diff] [blame] | 119 | r.i = abs |
Brad Fitzpatrick | 396170d | 2012-02-09 17:28:41 +1100 | [diff] [blame] | 120 | return abs, nil |
| 121 | } |
| 122 | |
Evan Shaw | eae25d4 | 2012-10-12 14:43:50 +1100 | [diff] [blame] | 123 | // WriteTo implements the io.WriterTo interface. |
| 124 | func (r *Reader) WriteTo(w io.Writer) (n int64, err error) { |
| 125 | r.prevRune = -1 |
Brad Fitzpatrick | f074565 | 2014-03-28 12:23:51 -0700 | [diff] [blame] | 126 | if r.i >= int64(len(r.s)) { |
Brad Fitzpatrick | c8fa7dc | 2012-11-25 09:04:13 -0800 | [diff] [blame] | 127 | return 0, nil |
Evan Shaw | eae25d4 | 2012-10-12 14:43:50 +1100 | [diff] [blame] | 128 | } |
| 129 | s := r.s[r.i:] |
| 130 | m, err := io.WriteString(w, s) |
| 131 | if m > len(s) { |
| 132 | panic("strings.Reader.WriteTo: invalid WriteString count") |
| 133 | } |
Brad Fitzpatrick | f074565 | 2014-03-28 12:23:51 -0700 | [diff] [blame] | 134 | r.i += int64(m) |
Evan Shaw | eae25d4 | 2012-10-12 14:43:50 +1100 | [diff] [blame] | 135 | n = int64(m) |
| 136 | if m != len(s) && err == nil { |
| 137 | err = io.ErrShortWrite |
| 138 | } |
| 139 | return |
| 140 | } |
| 141 | |
Russ Cox | 10c7d19 | 2009-10-12 10:09:35 -0700 | [diff] [blame] | 142 | // NewReader returns a new Reader reading from s. |
| 143 | // It is similar to bytes.NewBufferString but more efficient and read-only. |
Robert Griesemer | 9cd3372 | 2011-05-26 11:02:07 -0700 | [diff] [blame] | 144 | func NewReader(s string) *Reader { return &Reader{s, 0, -1} } |