Commit 20430f03 authored by Robert Griesemer's avatar Robert Griesemer

go/scanner: treat EOF like a newline for purposes of semicolon insertion

R=rsc
CC=golang-dev
https://golang.org/cl/2216054
parent b4e358d7
...@@ -196,26 +196,27 @@ func (S *Scanner) scanComment(pos token.Position) { ...@@ -196,26 +196,27 @@ func (S *Scanner) scanComment(pos token.Position) {
} }
func (S *Scanner) findNewline(pos token.Position) bool { func (S *Scanner) findLineEnd(pos token.Position) bool {
// first '/' already consumed; assume S.ch == '/' || S.ch == '*' // first '/' already consumed; assume S.ch == '/' || S.ch == '*'
// read ahead until a newline or non-comment token is found // read ahead until a newline, EOF, or non-comment token is found
newline := false lineend := false
for pos1 := pos; S.ch >= 0; { for pos1 := pos; S.ch >= 0; {
if S.ch == '/' { if S.ch == '/' {
//-style comment always contains a newline //-style comment always contains a newline
newline = true lineend = true
break break
} }
S.scanComment(pos1) S.scanComment(pos1)
if pos1.Line < S.pos.Line { if pos1.Line < S.pos.Line {
/*-style comment contained a newline */ /*-style comment contained a newline */
newline = true lineend = true
break break
} }
S.skipWhitespace() // S.insertSemi is set S.skipWhitespace() // S.insertSemi is set
if S.ch == '\n' { if S.ch < 0 || S.ch == '\n' {
newline = true // line end
lineend = true
break break
} }
if S.ch != '/' { if S.ch != '/' {
...@@ -230,12 +231,12 @@ func (S *Scanner) findNewline(pos token.Position) bool { ...@@ -230,12 +231,12 @@ func (S *Scanner) findNewline(pos token.Position) bool {
} }
} }
// reset position to where it was upon calling findNewline // reset position to where it was upon calling findLineEnd
S.pos = pos S.pos = pos
S.offset = pos.Offset + 1 S.offset = pos.Offset + 1
S.next() S.next()
return newline return lineend
} }
...@@ -507,7 +508,8 @@ var newline = []byte{'\n'} ...@@ -507,7 +508,8 @@ var newline = []byte{'\n'}
// //
// If the returned token is token.SEMICOLON, the corresponding // If the returned token is token.SEMICOLON, the corresponding
// literal value is ";" if the semicolon was present in the source, // literal value is ";" if the semicolon was present in the source,
// and "\n" if the semicolon was inserted because of a newline. // and "\n" if the semicolon was inserted because of a newline or
// at EOF.
// //
// For more tolerant parsing, Scan will return a valid token if // For more tolerant parsing, Scan will return a valid token if
// possible even if a syntax error was encountered. Thus, even // possible even if a syntax error was encountered. Thus, even
...@@ -539,6 +541,10 @@ scanAgain: ...@@ -539,6 +541,10 @@ scanAgain:
S.next() // always make progress S.next() // always make progress
switch ch { switch ch {
case -1: case -1:
if S.insertSemi {
S.insertSemi = false // EOF consumed
return pos, token.SEMICOLON, newline
}
tok = token.EOF tok = token.EOF
case '\n': case '\n':
// we only reach here if S.insertSemi was // we only reach here if S.insertSemi was
...@@ -607,7 +613,7 @@ scanAgain: ...@@ -607,7 +613,7 @@ scanAgain:
case '/': case '/':
if S.ch == '/' || S.ch == '*' { if S.ch == '/' || S.ch == '*' {
// comment // comment
if S.insertSemi && S.findNewline(pos) { if S.insertSemi && S.findLineEnd(pos) {
// reset position to the beginning of the comment // reset position to the beginning of the comment
S.pos = pos S.pos = pos
S.offset = pos.Offset + 1 S.offset = pos.Offset + 1
......
...@@ -403,11 +403,10 @@ var lines = []string{ ...@@ -403,11 +403,10 @@ var lines = []string{
"foo $/*comment*/\n", "foo $/*comment*/\n",
"foo $/*\n*/", "foo $/*\n*/",
"foo $/*comment*/\n",
"foo $/*0*/ /*1*/ /*2*/\n", "foo $/*0*/ /*1*/ /*2*/\n",
"foo $/*comment*/ \n", "foo $/*comment*/ \n",
"foo $/*0*/ /*1*/ /*2*/ \n", "foo $/*0*/ /*1*/ /*2*/ \n",
"foo $/**/ /*-------------*/ /*----\n*/bar $/* \n*/baa", "foo $/**/ /*-------------*/ /*----\n*/bar $/* \n*/baa$\n",
"package main$\n\nfunc main() {\n\tif {\n\t\treturn /* */ }$\n}$\n", "package main$\n\nfunc main() {\n\tif {\n\t\treturn /* */ }$\n}$\n",
} }
...@@ -416,9 +415,14 @@ var lines = []string{ ...@@ -416,9 +415,14 @@ var lines = []string{
func TestSemis(t *testing.T) { func TestSemis(t *testing.T) {
for _, line := range lines { for _, line := range lines {
checkSemi(t, line, AllowIllegalChars|InsertSemis) checkSemi(t, line, AllowIllegalChars|InsertSemis)
}
for _, line := range lines {
checkSemi(t, line, AllowIllegalChars|InsertSemis|ScanComments) checkSemi(t, line, AllowIllegalChars|InsertSemis|ScanComments)
// if the input ended in newlines, the input must tokenize the
// same with or without those newlines
for i := len(line) - 1; i >= 0 && line[i] == '\n'; i-- {
checkSemi(t, line[0:i], AllowIllegalChars|InsertSemis)
checkSemi(t, line[0:i], AllowIllegalChars|InsertSemis|ScanComments)
}
} }
} }
......
Markdown is supported
0%
or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment