tool/src/test/java/org/antlr/test/TestLexer.java - platform/external/antlr - Git at Google

 /*
  * [The "BSD license"]
  *  Copyright (c) 2010 Terence Parr
  *  All rights reserved.
  *
  *  Redistribution and use in source and binary forms, with or without
  *  modification, are permitted provided that the following conditions
  *  are met:
  *  1. Redistributions of source code must retain the above copyright
  *      notice, this list of conditions and the following disclaimer.
  *  2. Redistributions in binary form must reproduce the above copyright
  *      notice, this list of conditions and the following disclaimer in the
  *      documentation and/or other materials provided with the distribution.
  *  3. The name of the author may not be used to endorse or promote products
  *      derived from this software without specific prior written permission.
  *
  *  THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS OR
  *  IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES
  *  OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED.
  *  IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY DIRECT, INDIRECT,
  *  INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT
  *  NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
  *  DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
  *  THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
  *  (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF
  *  THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
  */
 package org.antlr.test;

 import org.antlr.Tool;
 import org.antlr.codegen.CodeGenerator;
 import org.stringtemplate.v4.ST;
 import org.antlr.tool.Grammar;
 import org.junit.Test;

 import static org.junit.Assert.*;

 public class TestLexer extends BaseTest {
 	protected boolean debug = false;

 	/** Public default constructor used by TestRig */
 	public TestLexer() {
 	}

 	@Test public void testSetText() throws Exception {
 		// this must return A not I to the parser; calling a nonfragment rule
 		// from a nonfragment rule does not set the overall token.
 		String grammar =
 			"grammar P;\n"+
 			"a : A {System.out.println(input);} ;\n"+
 			"A : '\\\\' 't' {setText(\"\t\");} ;\n" +
 			"WS : (' '|'\\n') {$channel=HIDDEN;} ;";
 		String found = execParser("P.g", grammar, "PParser", "PLexer",
 				    "a", "\\t", debug);
 		assertEquals("\t\n", found);
 	}

 	@Test public void testRefToRuleDoesNotSetTokenNorEmitAnother() throws Exception {
 		// this must return A not I to the parser; calling a nonfragment rule
 		// from a nonfragment rule does not set the overall token.
 		String grammar =
 			"grammar P;\n"+
 			"a : A EOF {System.out.println(input);} ;\n"+
 			"A : '-' I ;\n" +
 			"I : '0'..'9'+ ;\n"+
 			"WS : (' '|'\\n') {$channel=HIDDEN;} ;";
 		String found = execParser("P.g", grammar, "PParser", "PLexer",
 				    "a", "-34", debug);
 		assertEquals("-34\n", found);
 	}

 	@Test public void testRefToRuleDoesNotSetChannel() throws Exception {
 		// this must set channel of A to HIDDEN.  $channel is local to rule
 		// like $type.
 		String grammar =
 			"grammar P;\n"+
 			"a : A EOF {System.out.println($A.text+\", channel=\"+$A.channel);} ;\n"+
 			"A : '-' WS I ;\n" +
 			"I : '0'..'9'+ ;\n"+
 			"WS : (' '|'\\n') {$channel=HIDDEN;} ;";
 		String found = execParser("P.g", grammar, "PParser", "PLexer",
 				    "a", "- 34", debug);
 		assertEquals("- 34, channel=0\n", found);
 	}

 	@Test public void testWeCanSetType() throws Exception {
 		String grammar =
 			"grammar P;\n"+
 			"tokens {X;}\n" +
 			"a : X EOF {System.out.println(input);} ;\n"+
 			"A : '-' I {$type = X;} ;\n" +
 			"I : '0'..'9'+ ;\n"+
 			"WS : (' '|'\\n') {$channel=HIDDEN;} ;";
 		String found = execParser("P.g", grammar, "PParser", "PLexer",
 				    "a", "-34", debug);
 		assertEquals("-34\n", found);
 	}

 	@Test public void testRefToFragment() throws Exception {
 		// this must return A not I to the parser; calling a nonfragment rule
 		// from a nonfragment rule does not set the overall token.
 		String grammar =
 			"grammar P;\n"+
 			"a : A {System.out.println(input);} ;\n"+
 			"A : '-' I ;\n" +
 			"fragment I : '0'..'9'+ ;\n"+
 			"WS : (' '|'\\n') {$channel=HIDDEN;} ;";
 		String found = execParser("P.g", grammar, "PParser", "PLexer",
 				    "a", "-34", debug);
 		assertEquals("-34\n", found);
 	}

 	@Test public void testMultipleRefToFragment() throws Exception {
 		// this must return A not I to the parser; calling a nonfragment rule
 		// from a nonfragment rule does not set the overall token.
 		String grammar =
 			"grammar P;\n"+
 			"a : A EOF {System.out.println(input);} ;\n"+
 			"A : I '.' I ;\n" +
 			"fragment I : '0'..'9'+ ;\n"+
 			"WS : (' '|'\\n') {$channel=HIDDEN;} ;";
 		String found = execParser("P.g", grammar, "PParser", "PLexer",
 				    "a", "3.14159", debug);
 		assertEquals("3.14159\n", found);
 	}

 	@Test public void testLabelInSubrule() throws Exception {
 		// can we see v outside?
 		String grammar =
 			"grammar P;\n"+
 			"a : A EOF ;\n"+
 			"A : 'hi' WS (v=I)? {$channel=0; System.out.println($v.text);} ;\n" +
 			"fragment I : '0'..'9'+ ;\n"+
 			"WS : (' '|'\\n') {$channel=HIDDEN;} ;";
 		String found = execParser("P.g", grammar, "PParser", "PLexer",
 				    "a", "hi 342", debug);
 		assertEquals("342\n", found);
 	}

 	@Test public void testRefToTokenInLexer() throws Exception {
 		String grammar =
 			"grammar P;\n"+
 			"a : A EOF ;\n"+
 			"A : I {System.out.println($I.text);} ;\n" +
 			"fragment I : '0'..'9'+ ;\n"+
 			"WS : (' '|'\\n') {$channel=HIDDEN;} ;";
 		String found = execParser("P.g", grammar, "PParser", "PLexer",
 				    "a", "342", debug);
 		assertEquals("342\n", found);
 	}

 	@Test public void testListLabelInLexer() throws Exception {
 		String grammar =
 			"grammar P;\n"+
 			"a : A ;\n"+
 			"A : i+=I+ {for (Object t : $i) System.out.print(\" \"+((Token)t).getText());} ;\n" +
 			"fragment I : '0'..'9'+ ;\n"+
 			"WS : (' '|'\\n') {$channel=HIDDEN;} ;";
 		String found = execParser("P.g", grammar, "PParser", "PLexer",
 				    "a", "33 297", debug);
 		assertEquals(" 33 297\n", found);
 	}

 	@Test public void testDupListRefInLexer() throws Exception {
 		String grammar =
 			"grammar P;\n"+
 			"a : A ;\n"+
 			"A : i+=I WS i+=I {$channel=0; for (Object t : $i) System.out.print(\" \"+((Token)t).getText());} ;\n" +
 			"fragment I : '0'..'9'+ ;\n"+
 			"WS : (' '|'\\n') {$channel=HIDDEN;} ;";
 		String found = execParser("P.g", grammar, "PParser", "PLexer",
 				    "a", "33 297", debug);
 		assertEquals(" 33 297\n", found);
 	}

 	@Test public void testCharLabelInLexer() {
 		String grammar =
 			"grammar T;\n" +
 			"a : B ;\n" +
 			"B : x='a' {System.out.println((char)$x);} ;\n" ;
 		String found = execParser("T.g", grammar, "TParser", "TLexer",
 								  "a", "a", debug);
 		assertEquals("a\n", found);
 	}

 	@Test public void testRepeatedLabelInLexer() {
 		String grammar =
 			"lexer grammar T;\n" +
 			"B : x='a' x='b' ;\n" ;
 		boolean found =
 			rawGenerateAndBuildRecognizer(
 				"T.g", grammar, null, "T", false);
 		boolean expecting = true; // should be ok
 		assertEquals(expecting, found);
 	}

 	@Test public void testRepeatedRuleLabelInLexer() {
 		String grammar =
 			"lexer grammar T;\n" +
 			"B : x=A x=A ;\n" +
 			"fragment A : 'a' ;\n" ;
 		boolean found =
 			rawGenerateAndBuildRecognizer(
 				"T.g", grammar, null, "T", false);
 		boolean expecting = true; // should be ok
 		assertEquals(expecting, found);
 	}

 	@Test public void testIsolatedEOTEdge() {
 		String grammar =
 			"lexer grammar T;\n" +
 			"QUOTED_CONTENT \n" +
 			"        : 'q' (~'q')* (('x' 'q') )* 'q' ; \n";
 		boolean found =
 			rawGenerateAndBuildRecognizer(
 				"T.g", grammar, null, "T", false);
 		boolean expecting = true; // should be ok
 		assertEquals(expecting, found);
 	}

 	@Test public void testEscapedLiterals() {
 		/* Grammar:
 			A : '\"' ;  should match a single double-quote: "
 			B : '\\\"' ; should match input \"
 		*/
 		String grammar =
 			"lexer grammar T;\n" +
 			"A : '\\\"' ;\n" +
 			"B : '\\\\\\\"' ;\n" ; // '\\\"'
 		boolean found =
 			rawGenerateAndBuildRecognizer(
 				"T.g", grammar, null, "T", false);
 		boolean expecting = true; // should be ok
 		assertEquals(expecting, found);
 	}

     @Test public void testNewlineLiterals() throws Exception {
         Grammar g = new Grammar(
             "lexer grammar T;\n" +
             "A : '\\n\\n' ;\n"  // ANTLR sees '\n\n'
         );
         String expecting = "match(\"\\n\\n\")";

         Tool antlr = newTool();
         antlr.setOutputDirectory(null); // write to /dev/null
         CodeGenerator generator = new CodeGenerator(antlr, g, "Java");
         g.setCodeGenerator(generator);
         generator.genRecognizer(); // codegen phase sets some vars we need
         ST codeST = generator.getRecognizerST();
         String code = codeST.render();
         int m = code.indexOf("match(\"");
         String found = code.substring(m,m+expecting.length());

         assertEquals(expecting, found);
     }
 }
	/*
	* [The "BSD license"]
	* Copyright (c) 2010 Terence Parr
	* All rights reserved.
	*
	* Redistribution and use in source and binary forms, with or without
	* modification, are permitted provided that the following conditions
	* are met:
	* 1. Redistributions of source code must retain the above copyright
	* notice, this list of conditions and the following disclaimer.
	* 2. Redistributions in binary form must reproduce the above copyright
	* notice, this list of conditions and the following disclaimer in the
	* documentation and/or other materials provided with the distribution.
	* 3. The name of the author may not be used to endorse or promote products
	* derived from this software without specific prior written permission.
	*
	* THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS OR
	* IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES
	* OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED.
	* IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY DIRECT, INDIRECT,
	* INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT
	* NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
	* DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
	* THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
	* (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF
	* THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
	*/
	package org.antlr.test;

	import org.antlr.Tool;
	import org.antlr.codegen.CodeGenerator;
	import org.stringtemplate.v4.ST;
	import org.antlr.tool.Grammar;
	import org.junit.Test;

	import static org.junit.Assert.*;

	public class TestLexer extends BaseTest {
	protected boolean debug = false;

	/** Public default constructor used by TestRig */
	public TestLexer() {
	}

	@Test public void testSetText() throws Exception {
	// this must return A not I to the parser; calling a nonfragment rule
	// from a nonfragment rule does not set the overall token.
	String grammar =
	"grammar P;\n"+
	"a : A {System.out.println(input);} ;\n"+
	"A : '\\\\' 't' {setText(\"\t\");} ;\n" +
	"WS : (' '\|'\\n') {$channel=HIDDEN;} ;";
	String found = execParser("P.g", grammar, "PParser", "PLexer",
	"a", "\\t", debug);
	assertEquals("\t\n", found);
	}

	@Test public void testRefToRuleDoesNotSetTokenNorEmitAnother() throws Exception {
	// this must return A not I to the parser; calling a nonfragment rule
	// from a nonfragment rule does not set the overall token.
	String grammar =
	"grammar P;\n"+
	"a : A EOF {System.out.println(input);} ;\n"+
	"A : '-' I ;\n" +
	"I : '0'..'9'+ ;\n"+
	"WS : (' '\|'\\n') {$channel=HIDDEN;} ;";
	String found = execParser("P.g", grammar, "PParser", "PLexer",
	"a", "-34", debug);
	assertEquals("-34\n", found);
	}

	@Test public void testRefToRuleDoesNotSetChannel() throws Exception {
	// this must set channel of A to HIDDEN. $channel is local to rule
	// like $type.
	String grammar =
	"grammar P;\n"+
	"a : A EOF {System.out.println($A.text+\", channel=\"+$A.channel);} ;\n"+
	"A : '-' WS I ;\n" +
	"I : '0'..'9'+ ;\n"+
	"WS : (' '\|'\\n') {$channel=HIDDEN;} ;";
	String found = execParser("P.g", grammar, "PParser", "PLexer",
	"a", "- 34", debug);
	assertEquals("- 34, channel=0\n", found);
	}

	@Test public void testWeCanSetType() throws Exception {
	String grammar =
	"grammar P;\n"+
	"tokens {X;}\n" +
	"a : X EOF {System.out.println(input);} ;\n"+
	"A : '-' I {$type = X;} ;\n" +
	"I : '0'..'9'+ ;\n"+
	"WS : (' '\|'\\n') {$channel=HIDDEN;} ;";
	String found = execParser("P.g", grammar, "PParser", "PLexer",
	"a", "-34", debug);
	assertEquals("-34\n", found);
	}

	@Test public void testRefToFragment() throws Exception {
	// this must return A not I to the parser; calling a nonfragment rule
	// from a nonfragment rule does not set the overall token.
	String grammar =
	"grammar P;\n"+
	"a : A {System.out.println(input);} ;\n"+
	"A : '-' I ;\n" +
	"fragment I : '0'..'9'+ ;\n"+
	"WS : (' '\|'\\n') {$channel=HIDDEN;} ;";
	String found = execParser("P.g", grammar, "PParser", "PLexer",
	"a", "-34", debug);
	assertEquals("-34\n", found);
	}

	@Test public void testMultipleRefToFragment() throws Exception {
	// this must return A not I to the parser; calling a nonfragment rule
	// from a nonfragment rule does not set the overall token.
	String grammar =
	"grammar P;\n"+
	"a : A EOF {System.out.println(input);} ;\n"+
	"A : I '.' I ;\n" +
	"fragment I : '0'..'9'+ ;\n"+
	"WS : (' '\|'\\n') {$channel=HIDDEN;} ;";
	String found = execParser("P.g", grammar, "PParser", "PLexer",
	"a", "3.14159", debug);
	assertEquals("3.14159\n", found);
	}

	@Test public void testLabelInSubrule() throws Exception {
	// can we see v outside?
	String grammar =
	"grammar P;\n"+
	"a : A EOF ;\n"+
	"A : 'hi' WS (v=I)? {$channel=0; System.out.println($v.text);} ;\n" +
	"fragment I : '0'..'9'+ ;\n"+
	"WS : (' '\|'\\n') {$channel=HIDDEN;} ;";
	String found = execParser("P.g", grammar, "PParser", "PLexer",
	"a", "hi 342", debug);
	assertEquals("342\n", found);
	}

	@Test public void testRefToTokenInLexer() throws Exception {
	String grammar =
	"grammar P;\n"+
	"a : A EOF ;\n"+
	"A : I {System.out.println($I.text);} ;\n" +
	"fragment I : '0'..'9'+ ;\n"+
	"WS : (' '\|'\\n') {$channel=HIDDEN;} ;";
	String found = execParser("P.g", grammar, "PParser", "PLexer",
	"a", "342", debug);
	assertEquals("342\n", found);
	}

	@Test public void testListLabelInLexer() throws Exception {
	String grammar =
	"grammar P;\n"+
	"a : A ;\n"+
	"A : i+=I+ {for (Object t : $i) System.out.print(\" \"+((Token)t).getText());} ;\n" +
	"fragment I : '0'..'9'+ ;\n"+
	"WS : (' '\|'\\n') {$channel=HIDDEN;} ;";
	String found = execParser("P.g", grammar, "PParser", "PLexer",
	"a", "33 297", debug);
	assertEquals(" 33 297\n", found);
	}

	@Test public void testDupListRefInLexer() throws Exception {
	String grammar =
	"grammar P;\n"+
	"a : A ;\n"+
	"A : i+=I WS i+=I {$channel=0; for (Object t : $i) System.out.print(\" \"+((Token)t).getText());} ;\n" +
	"fragment I : '0'..'9'+ ;\n"+
	"WS : (' '\|'\\n') {$channel=HIDDEN;} ;";
	String found = execParser("P.g", grammar, "PParser", "PLexer",
	"a", "33 297", debug);
	assertEquals(" 33 297\n", found);
	}

	@Test public void testCharLabelInLexer() {
	String grammar =
	"grammar T;\n" +
	"a : B ;\n" +
	"B : x='a' {System.out.println((char)$x);} ;\n" ;
	String found = execParser("T.g", grammar, "TParser", "TLexer",
	"a", "a", debug);
	assertEquals("a\n", found);
	}

	@Test public void testRepeatedLabelInLexer() {
	String grammar =
	"lexer grammar T;\n" +
	"B : x='a' x='b' ;\n" ;
	boolean found =
	rawGenerateAndBuildRecognizer(
	"T.g", grammar, null, "T", false);
	boolean expecting = true; // should be ok
	assertEquals(expecting, found);
	}

	@Test public void testRepeatedRuleLabelInLexer() {
	String grammar =
	"lexer grammar T;\n" +
	"B : x=A x=A ;\n" +
	"fragment A : 'a' ;\n" ;
	boolean found =
	rawGenerateAndBuildRecognizer(
	"T.g", grammar, null, "T", false);
	boolean expecting = true; // should be ok
	assertEquals(expecting, found);
	}

	@Test public void testIsolatedEOTEdge() {
	String grammar =
	"lexer grammar T;\n" +
	"QUOTED_CONTENT \n" +
	" : 'q' (~'q')* (('x' 'q') )* 'q' ; \n";
	boolean found =
	rawGenerateAndBuildRecognizer(
	"T.g", grammar, null, "T", false);
	boolean expecting = true; // should be ok
	assertEquals(expecting, found);
	}

	@Test public void testEscapedLiterals() {
	/* Grammar:
	A : '\"' ; should match a single double-quote: "
	B : '\\\"' ; should match input \"
	*/
	String grammar =
	"lexer grammar T;\n" +
	"A : '\\\"' ;\n" +
	"B : '\\\\\\\"' ;\n" ; // '\\\"'
	boolean found =
	rawGenerateAndBuildRecognizer(
	"T.g", grammar, null, "T", false);
	boolean expecting = true; // should be ok
	assertEquals(expecting, found);
	}

	@Test public void testNewlineLiterals() throws Exception {
	Grammar g = new Grammar(
	"lexer grammar T;\n" +
	"A : '\\n\\n' ;\n" // ANTLR sees '\n\n'
	);
	String expecting = "match(\"\\n\\n\")";

	Tool antlr = newTool();
	antlr.setOutputDirectory(null); // write to /dev/null
	CodeGenerator generator = new CodeGenerator(antlr, g, "Java");
	g.setCodeGenerator(generator);
	generator.genRecognizer(); // codegen phase sets some vars we need
	ST codeST = generator.getRecognizerST();
	String code = codeST.render();
	int m = code.indexOf("match(\"");
	String found = code.substring(m,m+expecting.length());

	assertEquals(expecting, found);
	}
	}