| // Copyright 2020 The Go Authors. All rights reserved. |
| // Use of this source code is governed by a BSD-style |
| // license that can be found in the LICENSE file. |
| |
| package netip_test |
| |
| import ( |
| "fmt" |
| . "net/netip" |
| "strconv" |
| "strings" |
| ) |
| |
| // zeros is a slice of eight stringified zeros. It's used in |
| // parseIPSlow to construct slices of specific amounts of zero fields, |
| // from 1 to 8. |
| var zeros = []string{"0", "0", "0", "0", "0", "0", "0", "0"} |
| |
| // parseIPSlow is like ParseIP, but aims for readability above |
| // speed. It's the reference implementation for correctness checking |
| // and against which we measure optimized parsers. |
| // |
| // parseIPSlow understands the following forms of IP addresses: |
| // - Regular IPv4: 1.2.3.4 |
| // - IPv4 with many leading zeros: 0000001.0000002.0000003.0000004 |
| // - Regular IPv6: 1111:2222:3333:4444:5555:6666:7777:8888 |
| // - IPv6 with many leading zeros: 00000001:0000002:0000003:0000004:0000005:0000006:0000007:0000008 |
| // - IPv6 with zero blocks elided: 1111:2222::7777:8888 |
| // - IPv6 with trailing 32 bits expressed as IPv4: 1111:2222:3333:4444:5555:6666:77.77.88.88 |
| // |
| // It does not process the following IP address forms, which have been |
| // varyingly accepted by some programs due to an under-specification |
| // of the shapes of IPv4 addresses: |
| // |
| // - IPv4 as a single 32-bit uint: 4660 (same as "1.2.3.4") |
| // - IPv4 with octal numbers: 0300.0250.0.01 (same as "192.168.0.1") |
| // - IPv4 with hex numbers: 0xc0.0xa8.0x0.0x1 (same as "192.168.0.1") |
| // - IPv4 in "class-B style": 1.2.52 (same as "1.2.3.4") |
| // - IPv4 in "class-A style": 1.564 (same as "1.2.3.4") |
| func parseIPSlow(s string) (Addr, error) { |
| // Identify and strip out the zone, if any. There should be 0 or 1 |
| // '%' in the string. |
| var zone string |
| fs := strings.Split(s, "%") |
| switch len(fs) { |
| case 1: |
| // No zone, that's fine. |
| case 2: |
| s, zone = fs[0], fs[1] |
| if zone == "" { |
| return Addr{}, fmt.Errorf("netaddr.ParseIP(%q): no zone after zone specifier", s) |
| } |
| default: |
| return Addr{}, fmt.Errorf("netaddr.ParseIP(%q): too many zone specifiers", s) // TODO: less specific? |
| } |
| |
| // IPv4 by itself is easy to do in a helper. |
| if strings.Count(s, ":") == 0 { |
| if zone != "" { |
| return Addr{}, fmt.Errorf("netaddr.ParseIP(%q): IPv4 addresses cannot have a zone", s) |
| } |
| return parseIPv4Slow(s) |
| } |
| |
| normal, err := normalizeIPv6Slow(s) |
| if err != nil { |
| return Addr{}, err |
| } |
| |
| // At this point, we've normalized the address back into 8 hex |
| // fields of 16 bits each. Parse that. |
| fs = strings.Split(normal, ":") |
| if len(fs) != 8 { |
| return Addr{}, fmt.Errorf("netaddr.ParseIP(%q): wrong size address", s) |
| } |
| var ret [16]byte |
| for i, f := range fs { |
| a, b, err := parseWord(f) |
| if err != nil { |
| return Addr{}, err |
| } |
| ret[i*2] = a |
| ret[i*2+1] = b |
| } |
| |
| return AddrFrom16(ret).WithZone(zone), nil |
| } |
| |
| // normalizeIPv6Slow expands s, which is assumed to be an IPv6 |
| // address, to its canonical text form. |
| // |
| // The canonical form of an IPv6 address is 8 colon-separated fields, |
| // where each field should be a hex value from 0 to ffff. This |
| // function does not verify the contents of each field. |
| // |
| // This function performs two transformations: |
| // - The last 32 bits of an IPv6 address may be represented in |
| // IPv4-style dotted quad form, as in 1:2:3:4:5:6:7.8.9.10. That |
| // address is transformed to its hex equivalent, |
| // e.g. 1:2:3:4:5:6:708:90a. |
| // - An address may contain one "::", which expands into as many |
| // 16-bit blocks of zeros as needed to make the address its correct |
| // full size. For example, fe80::1:2 expands to fe80:0:0:0:0:0:1:2. |
| // |
| // Both short forms may be present in a single address, |
| // e.g. fe80::1.2.3.4. |
| func normalizeIPv6Slow(orig string) (string, error) { |
| s := orig |
| |
| // Find and convert an IPv4 address in the final field, if any. |
| i := strings.LastIndex(s, ":") |
| if i == -1 { |
| return "", fmt.Errorf("netaddr.ParseIP(%q): invalid IP address", orig) |
| } |
| if strings.Contains(s[i+1:], ".") { |
| ip, err := parseIPv4Slow(s[i+1:]) |
| if err != nil { |
| return "", err |
| } |
| a4 := ip.As4() |
| s = fmt.Sprintf("%s:%02x%02x:%02x%02x", s[:i], a4[0], a4[1], a4[2], a4[3]) |
| } |
| |
| // Find and expand a ::, if any. |
| fs := strings.Split(s, "::") |
| switch len(fs) { |
| case 1: |
| // No ::, nothing to do. |
| case 2: |
| lhs, rhs := fs[0], fs[1] |
| // Found a ::, figure out how many zero blocks need to be |
| // inserted. |
| nblocks := strings.Count(lhs, ":") + strings.Count(rhs, ":") |
| if lhs != "" { |
| nblocks++ |
| } |
| if rhs != "" { |
| nblocks++ |
| } |
| if nblocks > 7 { |
| return "", fmt.Errorf("netaddr.ParseIP(%q): address too long", orig) |
| } |
| fs = nil |
| // Either side of the :: can be empty. We don't want empty |
| // fields to feature in the final normalized address. |
| if lhs != "" { |
| fs = append(fs, lhs) |
| } |
| fs = append(fs, zeros[:8-nblocks]...) |
| if rhs != "" { |
| fs = append(fs, rhs) |
| } |
| s = strings.Join(fs, ":") |
| default: |
| // Too many :: |
| return "", fmt.Errorf("netaddr.ParseIP(%q): invalid IP address", orig) |
| } |
| |
| return s, nil |
| } |
| |
| // parseIPv4Slow parses and returns an IPv4 address in dotted quad |
| // form, e.g. "192.168.0.1". It is slow but easy to read, and the |
| // reference implementation against which we compare faster |
| // implementations for correctness. |
| func parseIPv4Slow(s string) (Addr, error) { |
| fs := strings.Split(s, ".") |
| if len(fs) != 4 { |
| return Addr{}, fmt.Errorf("netaddr.ParseIP(%q): invalid IP address", s) |
| } |
| var ret [4]byte |
| for i := range ret { |
| val, err := strconv.ParseUint(fs[i], 10, 8) |
| if err != nil { |
| return Addr{}, err |
| } |
| ret[i] = uint8(val) |
| } |
| return AddrFrom4([4]byte{ret[0], ret[1], ret[2], ret[3]}), nil |
| } |
| |
| // parseWord converts a 16-bit hex string into its corresponding |
| // two-byte value. |
| func parseWord(s string) (byte, byte, error) { |
| ret, err := strconv.ParseUint(s, 16, 16) |
| if err != nil { |
| return 0, 0, err |
| } |
| return uint8(ret >> 8), uint8(ret), nil |
| } |