go/doc: convert to unicode quotes for ToText and Synopsis

We refactor the conversion of quotes to their Unicode equivalents into a separate function so that it can be called from ToText and Synopsis. We also introduce a temporary buffer to hold the escaped HTML, and then convert the Unicode quotes back to HTML-escaped entities. This simplifies the logic and removes the need to track the index of the escaped text. Fixes #27759 Change-Id: I71cf47ddcd4c6794ccdf2898ac25539388b393c1 Reviewed-on: https://go-review.googlesource.com/c/150377 Run-TryBot: Robert Griesemer <gri@golang.org> Reviewed-by: Robert Griesemer <gri@golang.org>

go/doc: convert to unicode quotes for ToText and Synopsis
We refactor the conversion of quotes to their Unicode equivalents into a separate function so that it can be called from ToText and Synopsis. We also introduce a temporary buffer to hold the escaped HTML, and then convert the Unicode quotes back to HTML-escaped entities. This simplifies the logic and removes the need to track the index of the escaped text. Fixes #27759 Change-Id: I71cf47ddcd4c6794ccdf2898ac25539388b393c1 Reviewed-on: https://go-review.googlesource.com/c/150377 Run-TryBot: Robert Griesemer <gri@golang.org> Reviewed-by: Robert Griesemer <gri@golang.org>
81a5c9c3 · Agniva De Sarker · Robert Griesemer · 689fae2d · 81a5c9c3 · 81a5c9c3
Commit 81a5c9c3 authored Nov 20, 2018 by Agniva De Sarker Committed by Robert Griesemer Nov 29, 2018
4 changed files
--- a/src/go/doc/comment.go
+++ b/src/go/doc/comment.go
@@ -7,6 +7,7 @@
 package doc
 import (
+	"bytes"
 	"io"
 	"strings"
 	"text/template" // for HTMLEscape
@@ -14,32 +15,38 @@ import (
 	"unicode/utf8"
 )
+const (
+	// HTML entities for the left and right double quotation marks.
+	ldquo = "&ldquo;"
+	rdquo = "&rdquo;"
+	// Unicode left and right double quotation marks.
+	ulquo = "“"
+	urquo = "”"
+)
 var (
-	ldquo = []byte("&ldquo;")
+	// htmlQuoteReplacer rewrites Unicode double quotes as their HTML entities.
+	htmlQuoteReplacer    = strings.NewReplacer(ulquo, ldquo, urquo, rdquo)
-	rdquo = []byte("&rdquo;")
+	// unicodeQuoteReplacer rewrites `` and '' as Unicode double quotes.
+	unicodeQuoteReplacer = strings.NewReplacer("``", ulquo, "''", urquo)
 )
 // Escape comment text for HTML. If nice is set,
 // also turn `` into &ldquo; and '' into &rdquo;.
 func commentEscape(w io.Writer, text string, nice bool) {
-	last := 0
 	if nice {
-		for i := 0; i < len(text)-1; i++ {
+		// In the first pass, we convert `` and '' into their unicode equivalents.
-			ch := text[i]
+		// This prevents them from being escaped in HTMLEscape.
-			if ch == text[i+1] && (ch == '`' || ch == '\'') {
+		text = convertQuotes(text)
-				template.HTMLEscape(w, []byte(text[last:i]))
+		var buf bytes.Buffer
-				last = i + 2
+		template.HTMLEscape(&buf, []byte(text))
-				switch ch {
+		// Now we convert the unicode quotes to their HTML escaped entities to maintain old behavior.
-				case '`':
+		// We need to use a temp buffer to read the string back and do the conversion,
-					w.Write(ldquo)
+		// otherwise HTMLEscape will escape & to &amp;
+		// The replacer runs over the whole buffer, so Unicode quotes that were
+		// already present in text are written as entities too.
+		// The result of WriteString is discarded.
-				case '\'':
+		htmlQuoteReplacer.WriteString(w, buf.String())
-					w.Write(rdquo)
+		return
-				}
-				i++ // loop will add one more
-			}
-		}
 	}
-	template.HTMLEscape(w, []byte(text[last:]))
+	template.HTMLEscape(w, []byte(text))
+}
+// convertQuotes returns text with each `` replaced by the Unicode left
+// double quote and each '' replaced by the Unicode right double quote.
+func convertQuotes(text string) string {
+	return unicodeQuoteReplacer.Replace(text)
 }
 const (
@@ -248,7 +255,7 @@ func heading(line string) string {
 	}
 	// allow "." when followed by non-space
-	for b := line;; {
+	for b := line; ; {
 		i := strings.IndexRune(b, '.')
 		if i < 0 {
 			break
@@ -429,12 +436,14 @@ func ToText(w io.Writer, text string, indent, preIndent string, width int) {
 		case opPara:
 			// l.write will add leading newline if required
 			for _, line := range b.lines {
+				line = convertQuotes(line)
 				l.write(line)
 			}
 			l.flush()
 		case opHead:
 			w.Write(nl)
 			for _, line := range b.lines {
+				line = convertQuotes(line)
 				l.write(line + "\n")
 			}
 			l.flush()
@@ -445,6 +454,7 @@ func ToText(w io.Writer, text string, indent, preIndent string, width int) {
 					w.Write([]byte("\n"))
 				} else {
 					w.Write([]byte(preIndent))
+					line = convertQuotes(line)
 					w.Write([]byte(line))
 				}
 			}

--- a/src/go/doc/comment_test.go
+++ b/src/go/doc/comment_test.go
@@ -7,6 +7,7 @@ package doc
 import (
 	"bytes"
 	"reflect"
+	"strings"
 	"testing"
 )
@@ -212,3 +213,20 @@ func TestPairedParensPrefixLen(t *testing.T) {
 		}
 	}
 }
+// TestCommentEscape checks that commentEscape, called with nice set,
+// turns ``...'' pairs into the &ldquo; and &rdquo; HTML entities.
+func TestCommentEscape(t *testing.T) {
+	commentTests := []struct {
+		// in is the raw comment text; out is the expected escaped output.
+		in, out string
+	}{
+		{"typically invoked as ``go tool asm'',", "typically invoked as " + ldquo + "go tool asm" + rdquo + ","},
+		{"For more detail, run ``go help test'' and ``go help testflag''", "For more detail, run " + ldquo + "go help test" + rdquo + " and " + ldquo + "go help testflag" + rdquo},
+	}
+	for i, tt := range commentTests {
+		var buf strings.Builder
+		commentEscape(&buf, tt.in, true)
+		out := buf.String()
+		if out != tt.out {
+			t.Errorf("#%d: mismatch\nhave: %q\nwant: %q", i, out, tt.out)
+		}
+	}
+}
--- a/src/go/doc/synopsis.go
+++ b/src/go/doc/synopsis.go
@@ -72,6 +72,7 @@ func Synopsis(s string) string {
 			return ""
 		}
 	}
+	s = convertQuotes(s)
 	return s
 }

--- a/src/go/doc/synopsis_test.go
+++ b/src/go/doc/synopsis_test.go
@@ -35,6 +35,7 @@ var tests = []struct {
 	{"All Rights reserved. Package foo does bar.", 20, ""},
 	{"All rights reserved. Package foo does bar.", 20, ""},
 	{"Authors: foo@bar.com. Package foo does bar.", 21, ""},
+	{"typically invoked as ``go tool asm'',", 37, "typically invoked as " + ulquo + "go tool asm" + urquo + ","},
 }
 func TestSynopsis(t *testing.T) {