// Source: src/pkg/go/doc/comment.go - go - Git at Google

 // Copyright 2009 The Go Authors. All rights reserved.
 // Use of this source code is governed by a BSD-style
 // license that can be found in the LICENSE file.

 // Godoc comment extraction and comment -> HTML formatting.

 package doc

 import (
 	"fmt";
 	"io";
 	"once";
 	"regexp";
 	"strings";
 	"template";	// for htmlEscape
 )

 // Comment extraction

 // Regular expressions used by commentText.
 // They are left nil here and compiled by setupRegexps.
 var (
 	// matches a leading "//" or "/*" marker and one optional space
 	comment_markers *regexp.Regexp;
 	// matches a run of spaces, tabs or carriage returns at the end of a line
 	trailing_whitespace *regexp.Regexp;
 	// matches a line holding only "/*" or "*/", optionally surrounded by blanks
 	comment_junk *regexp.Regexp;
 )

 func makeRex(s string) *regexp.Regexp {
 	re, err := regexp.Compile(s);
 	if err != nil {
 		panic("MakeRegexp ", s, " ", err.String());
 	}
 	return re;
 }

 // setupRegexps compiles the regular expressions that commentText
 // relies on and stores them in the package-level variables.
 //
 // TODO(rsc): Cannot use var initialization for regexps,
 // because Regexp constructor needs threads.
 func setupRegexps() {
 	// a line holding only "/*" or "*/", optionally surrounded by blanks
 	comment_junk = makeRex("^[ \t]*(/\\*|\\*/)[ \t]*$");

 	// a run of spaces, tabs or carriage returns at the end of a line
 	trailing_whitespace = makeRex("[ \t\r]+$");

 	// a leading "//" or "/*" followed by at most one space
 	comment_markers = makeRex("^/(/|\\*) ?");
 }

 // commentText aggregates the text of comments into one string,
 // with the comment markers removed.
 //
 // Each comment is split into lines. Lines holding only a "/*" or "*/"
 // marker are dropped; trailing white space and a leading "//" or "/*"
 // marker are stripped from the others; blank lines at the start and
 // end of each comment are thrown away. The remaining lines of all
 // comments are joined with "\n", and a final empty entry is appended
 // so that non-empty output ends in a newline.
 func commentText(comments []string) string {
 	once.Do(setupRegexps);
 	lines := make([]string, 0, 20);
 	for ci := range comments {
 		// split on newlines
 		cl := strings.Split(comments[ci], "\n", 0);

 		// walk lines, stripping comment markers;
 		// the lines that are kept are compacted into cl[0:w]
 		w := 0;
 		for k := range cl {
 			l := cl[k];

 			// remove /* and */ lines
 			if comment_junk.Match(l) {
 				continue;
 			}

 			// strip trailing white space: the match starts at m[0]
 			// and runs to the end of the line, so keep what precedes it
 			m := trailing_whitespace.Execute(l);
 			if len(m) > 0 {
 				l = l[0 : m[0]];
 			}

 			// strip leading comment markers: the match starts at the
 			// beginning of the line and ends at m[1]
 			m = comment_markers.Execute(l);
 			if len(m) > 0 {
 				l = l[m[1] : len(l)];
 			}

 			// throw away leading blank lines
 			if w == 0 && l == "" {
 				continue;
 			}

 			cl[w] = l;
 			w++;
 		}

 		// throw away trailing blank lines
 		for w > 0 && cl[w-1] == "" {
 			w--;
 		}
 		cl = cl[0 : w];

 		// add this comment to total list
 		// TODO: maybe separate with a single blank line
 		// if there is already a comment and len(cl) > 0?
 		for k := range cl {
 			n := len(lines);
 			if n+1 >= cap(lines) {
 				// grow early so that one spare slot always remains
 				newlines := make([]string, n, 2*cap(lines));
 				for x := range newlines {
 					newlines[x] = lines[x];
 				}
 				lines = newlines;
 			}
 			lines = lines[0 : n+1];
 			lines[n] = cl[k];
 		}
 	}

 	// add final "" entry to get trailing newline.
 	// loop always leaves room for one more.
 	n := len(lines);
 	lines = lines[0 : n+1];

 	return strings.Join(lines, "\n");
 }

 // split cuts text into lines. Every line keeps its terminating '\n';
 // a final piece without a newline becomes a line of its own.
 // The returned slices share storage with text.
 func split(text []byte) [][]byte {
 	// first pass: one line per newline, plus one for an unterminated tail
 	count := 0;
 	for i := 0; i < len(text); i++ {
 		if text[i] == '\n' {
 			count++;
 		}
 	}
 	if len(text) > 0 && text[len(text)-1] != '\n' {
 		count++;
 	}

 	// second pass: slice out each line, newline included
 	out := make([][]byte, count);
 	start := 0;
 	k := 0;
 	for i := 0; i < len(text); i++ {
 		if text[i] == '\n' {
 			out[k] = text[start : i+1];
 			start = i+1;
 			k++;
 		}
 	}
 	if start < len(text) {
 		out[k] = text[start : len(text)];
 	}

 	return out;
 }


 // HTML entities that commentEscape writes in place of `` and ''.
 var (
 	// left double quotation mark, written for ``
 	ldquo = io.StringBytes("&ldquo;");
 	// right double quotation mark, written for ''
 	rdquo = io.StringBytes("&rdquo;");
 )

 // commentEscape writes s to w, escaped for HTML.
 // Along the way each `` becomes &ldquo; and each '' becomes &rdquo;.
 func commentEscape(w io.Writer, s []byte) {
 	start := 0;	// first byte of s not yet written
 	i := 0;
 	for i+1 < len(s) {
 		c := s[i];
 		if c != s[i+1] || (c != '`' && c != '\'') {
 			// not a doubled quote character; keep scanning
 			i++;
 			continue;
 		}

 		// flush the plain text before the pair, then emit the entity
 		template.HtmlEscape(w, s[start : i]);
 		if c == '`' {
 			w.Write(ldquo);
 		} else {
 			w.Write(rdquo);
 		}

 		// step over both characters of the pair
 		i += 2;
 		start = i;
 	}
 	template.HtmlEscape(w, s[start : len(s)]);
 }


 // HTML tags written by ToHtml around paragraphs and preformatted blocks.
 var (
 	// opens a paragraph
 	html_p = io.StringBytes("<p>\n");
 	// closes a paragraph
 	html_endp = io.StringBytes("</p>\n");
 	// opens a preformatted block; no newline, so the first line follows directly
 	html_pre = io.StringBytes("<pre>");
 	// closes a preformatted block
 	html_endpre = io.StringBytes("</pre>\n");
 )


 // indentLen returns the number of leading spaces and tabs in s.
 func indentLen(s []byte) int {
 	for i := 0; i < len(s); i++ {
 		if s[i] != ' ' && s[i] != '\t' {
 			return i;
 		}
 	}
 	// s is empty or consists of nothing but spaces and tabs
 	return len(s);
 }


 // isBlank reports whether s is empty or is a lone newline.
 func isBlank(s []byte) bool {
 	switch len(s) {
 	case 0:
 		return true;
 	case 1:
 		return s[0] == '\n';
 	}
 	return false;
 }


 // commonPrefix returns the longest prefix shared by a and b.
 // The result is a slice of a.
 func commonPrefix(a, b []byte) []byte {
 	// the prefix cannot be longer than the shorter argument
 	limit := len(a);
 	if len(b) < limit {
 		limit = len(b);
 	}
 	for i := 0; i < limit; i++ {
 		if a[i] != b[i] {
 			return a[0 : i];
 		}
 	}
 	return a[0 : limit];
 }


 // unindent removes, in place, the leading white space that all
 // non-blank lines of block have in common. Blank lines are left alone.
 func unindent(block [][]byte) {
 	if len(block) == 0 {
 		return;
 	}

 	// start from the first line's indentation and narrow it down
 	// to what every non-blank line shares
 	first := block[0];
 	common := first[0 : indentLen(first)];
 	for i := range block {
 		ln := block[i];
 		if isBlank(ln) {
 			continue;
 		}
 		common = commonPrefix(common, ln[0 : indentLen(ln)]);
 	}
 	width := len(common);

 	// cut that many bytes off the front of each non-blank line
 	for i := range block {
 		ln := block[i];
 		if isBlank(ln) {
 			continue;
 		}
 		block[i] = ln[width : len(ln)];
 	}
 }


 // ToHtml writes the comment text s to w as formatted HTML.
 // The comment was prepared by DocReader, so it is known to have
 // no leading or trailing blank lines, no trailing spaces at the
 // end of lines, and no comment markers.
 //
 // Runs of unindented lines become paragraphs (<p> ... </p>), with
 // blank lines separating one paragraph from the next.
 // Runs of indented lines become <pre> blocks with the indent removed.
 //
 // TODO(rsc): I'd like to pass in an array of variable names []string
 // and then italicize those strings when they appear as words.
 func ToHtml(w io.Writer, s []byte) {
 	// TODO(rsc): opening and closing a paragraph would read better
 	// as local closures, but 6g cant generate code for these.
 	inpara := false;

 	lines := split(s);
 	unindent(lines);
 	i := 0;
 	for i < len(lines) {
 		cur := lines[i];
 		blank := isBlank(cur);
 		indented := !blank && indentLen(cur) > 0;

 		// a blank or indented line ends the paragraph in progress
 		if (blank || indented) && inpara {
 			w.Write(html_endp);
 			inpara = false;
 		}

 		if blank {
 			i++;
 			continue;
 		}

 		if !indented {
 			// ordinary text: open a paragraph if none is open
 			if !inpara {
 				w.Write(html_p);
 				inpara = true;
 			}
 			commentEscape(w, cur);
 			i++;
 			continue;
 		}

 		// indented text: take the following indented or blank lines ...
 		end := i+1;
 		for end < len(lines) && (isBlank(lines[end]) || indentLen(lines[end]) > 0) {
 			end++;
 		}
 		// ... but not trailing blank lines
 		for end > i && isBlank(lines[end-1]) {
 			end--;
 		}
 		block := lines[i : end];
 		i = end;

 		unindent(block);

 		// those lines go in a pre block.
 		// they don't get the nice text formatting,
 		// just html escaping
 		w.Write(html_pre);
 		for k := range block {
 			template.HtmlEscape(w, block[k]);
 		}
 		w.Write(html_endpre);
 	}
 	if inpara {
 		w.Write(html_endp);
 	}
 }
	// Copyright 2009 The Go Authors. All rights reserved.
	// Use of this source code is governed by a BSD-style
	// license that can be found in the LICENSE file.

	// Godoc comment extraction and comment -> HTML formatting.

	package doc

	import (
	"fmt";
	"io";
	"once";
	"regexp";
	"strings";
	"template"; // for htmlEscape
	)

	// Comment extraction

	// Regular expressions used by commentText.
	// They are left nil here and compiled by setupRegexps.
	var (
	// matches a leading comment marker and one optional space
	comment_markers *regexp.Regexp;
	// matches a run of spaces, tabs or carriage returns at the end of a line
	trailing_whitespace *regexp.Regexp;
	// matches the marker-only lines that commentText drops
	comment_junk *regexp.Regexp;
	)

	func makeRex(s string) *regexp.Regexp {
	re, err := regexp.Compile(s);
	if err != nil {
	panic("MakeRegexp ", s, " ", err.String());
	}
	return re;
	}

	// TODO(rsc): Cannot use var initialization for regexps,
	// because Regexp constructor needs threads.
	func setupRegexps() {
	comment_markers = makeRex("^/(/\|\\*) ?");
	trailing_whitespace = makeRex("[ \t\r]+$");
	comment_junk = makeRex("^[ \t](/\\\|\\/)[ \t]$");
	}

	// commentText aggregates the text of comments into one string,
	// with the comment markers removed.
	//
	// Each comment is split into lines. Lines matching comment_junk
	// are dropped; trailing white space and a leading comment marker
	// are stripped from the others; blank lines at the start and
	// end of each comment are thrown away. The remaining lines of all
	// comments are joined with "\n", and a final empty entry is appended
	// so that non-empty output ends in a newline.
	func commentText(comments []string) string {
		once.Do(setupRegexps);
		lines := make([]string, 0, 20);
		for ci := range comments {
			// split on newlines
			cl := strings.Split(comments[ci], "\n", 0);

			// walk lines, stripping comment markers;
			// the lines that are kept are compacted into cl[0:w]
			w := 0;
			for k := range cl {
				l := cl[k];

				// remove /* and */ lines
				if comment_junk.Match(l) {
					continue;
				}

				// strip trailing white space: the match starts at m[0]
				// and runs to the end of the line, so keep what precedes it
				m := trailing_whitespace.Execute(l);
				if len(m) > 0 {
					l = l[0 : m[0]];
				}

				// strip leading comment markers: the match starts at the
				// beginning of the line and ends at m[1]
				m = comment_markers.Execute(l);
				if len(m) > 0 {
					l = l[m[1] : len(l)];
				}

				// throw away leading blank lines
				if w == 0 && l == "" {
					continue;
				}

				cl[w] = l;
				w++;
			}

			// throw away trailing blank lines
			for w > 0 && cl[w-1] == "" {
				w--;
			}
			cl = cl[0 : w];

			// add this comment to total list
			// TODO: maybe separate with a single blank line
			// if there is already a comment and len(cl) > 0?
			for k := range cl {
				n := len(lines);
				if n+1 >= cap(lines) {
					// grow early so that one spare slot always remains
					newlines := make([]string, n, 2*cap(lines));
					for x := range newlines {
						newlines[x] = lines[x];
					}
					lines = newlines;
				}
				lines = lines[0 : n+1];
				lines[n] = cl[k];
			}
		}

		// add final "" entry to get trailing newline.
		// loop always leaves room for one more.
		n := len(lines);
		lines = lines[0 : n+1];

		return strings.Join(lines, "\n");
	}

	// split cuts text into lines. Every line keeps its terminating '\n';
	// a final piece without a newline becomes a line of its own.
	// The returned slices share storage with text.
	func split(text []byte) [][]byte {
		// first pass: one line per newline, plus one for an unterminated tail
		count := 0;
		for i := 0; i < len(text); i++ {
			if text[i] == '\n' {
				count++;
			}
		}
		if len(text) > 0 && text[len(text)-1] != '\n' {
			count++;
		}

		// second pass: slice out each line, newline included
		out := make([][]byte, count);
		start := 0;
		k := 0;
		for i := 0; i < len(text); i++ {
			if text[i] == '\n' {
				out[k] = text[start : i+1];
				start = i+1;
				k++;
			}
		}
		if start < len(text) {
			out[k] = text[start : len(text)];
		}

		return out;
	}


	// HTML entities that commentEscape writes in place of `` and ''.
	// They are spelled as entity references rather than raw quote
	// characters, so the output does not depend on the page encoding.
	var (
		// left double quotation mark, written for ``
		ldquo = io.StringBytes("&ldquo;");
		// right double quotation mark, written for ''
		rdquo = io.StringBytes("&rdquo;");
	)

	// Escape comment text for HTML.
	// Also, turn `` into “ and '' into ”.
	func commentEscape(w io.Writer, s []byte) {
	last := 0;
	for i := 0; i < len(s)-1; i++ {
	if s[i] == s[i+1] && (s[i] == '`' \|\| s[i] == '\'') {
	template.HtmlEscape(w, s[last : i]);
	last = i+2;
	switch s[i] {
	case '`':
	w.Write(ldquo);
	case '\'':
	w.Write(rdquo);
	}
	i++; // loop will add one more
	}
	}
	template.HtmlEscape(w, s[last : len(s)]);
	}


	// HTML tags written by ToHtml around paragraphs and preformatted blocks.
	var (
	// opens a paragraph
	html_p = io.StringBytes("<p>\n");
	// closes a paragraph
	html_endp = io.StringBytes("</p>\n");
	// opens a preformatted block; no newline, so the first line follows directly
	html_pre = io.StringBytes("<pre>");
	// closes a preformatted block
	html_endpre = io.StringBytes("</pre>\n");
	)


	// indentLen returns the number of leading spaces and tabs in s.
	func indentLen(s []byte) int {
		i := 0;
		for i < len(s) && (s[i] == ' ' || s[i] == '\t') {
			i++;
		}
		return i;
	}


	// isBlank reports whether s is empty or is a lone newline.
	func isBlank(s []byte) bool {
		return len(s) == 0 || (len(s) == 1 && s[0] == '\n')
	}


	// commonPrefix returns the longest prefix shared by a and b.
	// The result is a slice of a.
	func commonPrefix(a, b []byte) []byte {
		// the prefix cannot be longer than the shorter argument
		limit := len(a);
		if len(b) < limit {
			limit = len(b);
		}
		for i := 0; i < limit; i++ {
			if a[i] != b[i] {
				return a[0 : i];
			}
		}
		return a[0 : limit];
	}


	// unindent removes, in place, the leading white space that all
	// non-blank lines of block have in common. Blank lines are left alone.
	func unindent(block [][]byte) {
		if len(block) == 0 {
			return;
		}

		// start from the first line's indentation and narrow it down
		// to what every non-blank line shares
		first := block[0];
		common := first[0 : indentLen(first)];
		for i := range block {
			ln := block[i];
			if isBlank(ln) {
				continue;
			}
			common = commonPrefix(common, ln[0 : indentLen(ln)]);
		}
		width := len(common);

		// cut that many bytes off the front of each non-blank line
		for i := range block {
			ln := block[i];
			if isBlank(ln) {
				continue;
			}
			block[i] = ln[width : len(ln)];
		}
	}


	// Convert comment text to formatted HTML.
	// The comment was prepared by DocReader,
	// so it is known not to have leading, trailing blank lines
	// nor to have trailing spaces at the end of lines.
	// The comment markers have already been removed.
	//
	// Turn each run of multiple \n into </p><p>
	// Turn each run of indented lines into <pre> without indent.
	//
	// TODO(rsc): I'd like to pass in an array of variable names []string
	// and then italicize those strings when they appear as words.
	func ToHtml(w io.Writer, s []byte) {
	inpara := false;

	/* TODO(rsc): 6g cant generate code for these
	close := func() {
	if inpara {
	w.Write(html_endp);
	inpara = false;
	}
	};
	open := func() {
	if !inpara {
	w.Write(html_p);
	inpara = true;
	}
	};
	*/

	lines := split(s);
	unindent(lines);
	for i := 0; i < len(lines); {
	line := lines[i];
	if isBlank(line) {
	// close paragraph
	if inpara {
	w.Write(html_endp);
	inpara = false;
	}
	i++;
	continue;
	}
	if indentLen(line) > 0 {
	// close paragraph
	if inpara {
	w.Write(html_endp);
	inpara = false;
	}

	// count indented or blank lines
	j := i+1;
	for j < len(lines) && (isBlank(lines[j]) \|\| indentLen(lines[j]) > 0) {
	j++;
	}
	// but not trailing blank lines
	for j > i && isBlank(lines[j-1]) {
	j--;
	}
	block := lines[i : j];
	i = j;

	unindent(block);

	// put those lines in a pre block.
	// they don't get the nice text formatting,
	// just html escaping
	w.Write(html_pre);
	for k, line := range block {
	template.HtmlEscape(w, line);
	}
	w.Write(html_endpre);
	continue;
	}
	// open paragraph
	if !inpara {
	w.Write(html_p);
	inpara = true;
	}
	commentEscape(w, lines[i]);
	i++;
	}
	if inpara {
	w.Write(html_endp);
	inpara = false;
	}
	}