src/jdk.scripting.nashorn/share/classes/jdk/nashorn/internal/parser/JSONParser.java - toolchain/jdk/jdk9_nashorn - Git at Google

 /*
  * Copyright (c) 2010, 2013, Oracle and/or its affiliates. All rights reserved.
  * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
  *
  * This code is free software; you can redistribute it and/or modify it
  * under the terms of the GNU General Public License version 2 only, as
  * published by the Free Software Foundation.  Oracle designates this
  * particular file as subject to the "Classpath" exception as provided
  * by Oracle in the LICENSE file that accompanied this code.
  *
  * This code is distributed in the hope that it will be useful, but WITHOUT
  * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
  * FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License
  * version 2 for more details (a copy is included in the LICENSE file that
  * accompanied this code).
  *
  * You should have received a copy of the GNU General Public License version
  * 2 along with this work; if not, write to the Free Software Foundation,
  * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA.
  *
  * Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA
  * or visit www.oracle.com if you need additional information or have any
  * questions.
  */

 package jdk.nashorn.internal.parser;

 import static jdk.nashorn.internal.parser.TokenType.COLON;
 import static jdk.nashorn.internal.parser.TokenType.COMMARIGHT;
 import static jdk.nashorn.internal.parser.TokenType.EOF;
 import static jdk.nashorn.internal.parser.TokenType.ESCSTRING;
 import static jdk.nashorn.internal.parser.TokenType.RBRACE;
 import static jdk.nashorn.internal.parser.TokenType.RBRACKET;
 import static jdk.nashorn.internal.parser.TokenType.STRING;

 import java.util.ArrayList;
 import java.util.List;
 import jdk.nashorn.internal.ir.Expression;
 import jdk.nashorn.internal.ir.LiteralNode;
 import jdk.nashorn.internal.ir.Node;
 import jdk.nashorn.internal.ir.ObjectNode;
 import jdk.nashorn.internal.ir.PropertyNode;
 import jdk.nashorn.internal.ir.UnaryNode;
 import jdk.nashorn.internal.runtime.ErrorManager;
 import jdk.nashorn.internal.runtime.Source;

 /**
  * Parses JSON text and returns the corresponding IR node. This is derived from the objectLiteral production of the main parser.
  *
  * See: 15.12.1.2 The JSON Syntactic Grammar
  */
 public class JSONParser extends AbstractParser {

     /**
      * Creates a parser for the given JSON source.
      *
      * @param source  the source
      * @param errors  the error manager
      */
     public JSONParser(final Source source, final ErrorManager errors) {
         super(source, errors, false, 0);
     }

     /**
      * Implementation of the Quote(value) operation as defined in the ECMAScript spec.
      * It wraps a String value in double quotes and escapes the characters within it:
      * backslash and double quote are backslash-escaped; backspace, form feed, line feed,
      * carriage return and tab use their short escapes; every other character below
      * U+0020 is emitted through {@code Lexer.unicodeEscape}. All other characters are
      * copied unchanged.
      *
      * @param value string to quote
      *
      * @return quoted and escaped string
      */
     public static String quote(final String value) {
         final int length = value.length();
         // Room for the text plus the two surrounding quotes; escapes grow the buffer on demand.
         final StringBuilder product = new StringBuilder(length + 2);

         product.append('"');

         for (int i = 0; i < length; i++) {
             final char ch = value.charAt(i);

             switch (ch) {
             case '\\':
                 product.append("\\\\");
                 break;
             case '"':
                 product.append("\\\"");
                 break;
             case '\b':
                 product.append("\\b");
                 break;
             case '\f':
                 product.append("\\f");
                 break;
             case '\n':
                 product.append("\\n");
                 break;
             case '\r':
                 product.append("\\r");
                 break;
             case '\t':
                 product.append("\\t");
                 break;
             default:
                 if (ch < ' ') {
                     // Remaining control characters have no short escape form.
                     product.append(Lexer.unicodeEscape(ch));
                 } else {
                     product.append(ch);
                 }
                 break;
             }
         }

         product.append('"');

         return product.toString();
     }

     /**
      * Public parse method - starts lexing a new token stream for a JSON script,
      * parses one JSON literal and requires it to be followed by end of input.
      *
      * @return the JSON literal
      */
     public Node parse() {
         stream = new TokenStream();

         // Lexer specialised for the JSON lexical grammar (ECMA 15.12.1.1).
         lexer = new Lexer(source, stream) {

             // Always reports false: this lexer never consumes comments.
             @Override
             protected boolean skipComments() {
                 return false;
             }

             // Only the double quote delimits strings in JSON.
             @Override
             protected boolean isStringDelimiter(final char ch) {
                 return ch == '\"';
             }

             // ECMA 15.12.1.1 The JSON Lexical Grammar - JSONWhiteSpace
             @Override
             protected boolean isWhitespace(final char ch) {
                 return Lexer.isJsonWhitespace(ch);
             }

             @Override
             protected boolean isEOL(final char ch) {
                 return Lexer.isJsonEOL(ch);
             }

             /**
              * Skips a (possibly empty) run of decimal digits at the current position.
              *
              * @return true if at least one digit was skipped
              */
             private boolean skipJsonDigits() {
                 boolean seen = false;
                 while (convertDigit(ch0, 10) != -1) {
                     seen = true;
                     skip(1);
                 }
                 return seen;
             }

             // ECMA 15.12.1.1 The JSON Lexical Grammar - JSONNumber
             @Override
             protected void scanNumber() {
                 // Record beginning of number.
                 final int startPosition = position;
                 // Assume value is a decimal.
                 TokenType valueType = TokenType.DECIMAL;

                 // floating point can't start with a "." with no leading digit before
                 if (ch0 == '.') {
                     error(Lexer.message("json.invalid.number"), STRING, position, limit);
                 }

                 // First digit of number.
                 final int digit = convertDigit(ch0, 10);

                 // skip first digit
                 skip(1);

                 // A leading zero stands alone: further integer digits are only
                 // consumed when the first digit is not 0.
                 if (digit != 0) {
                     skipJsonDigits();
                 }

                 if (ch0 == '.' || ch0 == 'E' || ch0 == 'e') {
                     // Must be a double.
                     if (ch0 == '.') {
                         // Skip period.
                         skip(1);

                         if (!skipJsonDigits()) {
                             // no digit after "."
                             error(Lexer.message("json.invalid.number"), STRING, position, limit);
                         }
                     }

                     // Detect exponent.
                     if (ch0 == 'E' || ch0 == 'e') {
                         // Skip E.
                         skip(1);
                         // Detect and skip exponent sign.
                         if (ch0 == '+' || ch0 == '-') {
                             skip(1);
                         }

                         if (!skipJsonDigits()) {
                             // no digit after "E"
                             error(Lexer.message("json.invalid.number"), STRING, position, limit);
                         }
                     }

                     valueType = TokenType.FLOATING;
                 }

                 // Add number token.
                 add(valueType, startPosition);
             }

             // ECMA 15.12.1.1 The JSON Lexical Grammar - JSONEscapeCharacter
             @Override
             protected boolean isEscapeCharacter(final char ch) {
                 switch (ch) {
                     case '"':
                     case '/':
                     case '\\':
                     case 'b':
                     case 'f':
                     case 'n':
                     case 'r':
                     case 't':
                     // could be unicode escape
                     case 'u':
                         return true;
                     default:
                         return false;
                 }
             }
         };

         k = -1;

         next();

         final Node resultNode = jsonLiteral();
         expect(EOF);

         return resultNode;
     }

     /**
      * Reads the current literal and verifies that its string value contains no
      * character that must be escaped in JSON: control characters up to U+001F,
      * the double quote and the backslash.
      *
      * @return the string literal node
      */
     private LiteralNode<?> getStringLiteral() {
         final LiteralNode<?> literal = getLiteral();
         final String         str     = (String)literal.getValue();

         for (int i = 0; i < str.length(); i++) {
             final char ch = str.charAt(i);
             if (ch <= 0x001f || ch == '"' || ch == '\\') {
                 throw error(AbstractParser.message("unexpected.token", str));
             }
         }

         return literal;
     }

     /**
      * Parse a JSON literal from the token stream
      * @return the JSON literal as a Node
      */
     private Expression jsonLiteral() {
         final long literalToken = token;

         switch (type) {
         case STRING:
             return getStringLiteral();
         case ESCSTRING:
         case DECIMAL:
         case FLOATING:
             return getLiteral();
         case FALSE:
             next();
             return LiteralNode.newInstance(literalToken, finish, false);
         case TRUE:
             next();
             return LiteralNode.newInstance(literalToken, finish, true);
         case NULL:
             next();
             return LiteralNode.newInstance(literalToken, finish);
         case LBRACKET:
             return arrayLiteral();
         case LBRACE:
             return objectLiteral();
         /*
          * A.8.1 JSON Lexical Grammar
          *
          * JSONNumber :: See 15.12.1.1
          *    -opt DecimalIntegerLiteral JSONFractionopt ExponentPartopt
          */
         case SUB:
             next();

             // The token after the minus sign must carry a numeric value.
             final long realToken = token;
             final Object value = getValue();

             if (value instanceof Number) {
                 next();
                 return new UnaryNode(literalToken, LiteralNode.newInstance(realToken, finish, (Number)value));
             }

             throw error(AbstractParser.message("expected", "number", type.getNameOrType()));
         default:
             break;
         }

         throw error(AbstractParser.message("expected", "json literal", type.getNameOrType()));
     }

     /**
      * Parse an array literal from the token stream.
      *
      * Unlike JavaScript array literals, elision is not permitted in JSON: every
      * comma must separate two values, so leading, repeated and trailing commas
      * are all rejected.
      *
      * @return the array literal as a Node
      */
     private LiteralNode<Expression[]> arrayLiteral() {
         // Capture LBRACKET token.
         final long arrayToken = token;
         // LBRACKET tested in caller.
         next();

         // Prepare to accumulate elements.
         final List<Expression> elements = new ArrayList<>();

         if (type != RBRACKET) {
             while (true) {
                 // A value is mandatory here; jsonLiteral() raises an error for
                 // anything else, including a leading or repeated comma.
                 elements.add(jsonLiteral());

                 if (type == RBRACKET) {
                     break;
                 }

                 // Comma between array elements is mandatory in JSON.
                 if (type != COMMARIGHT) {
                     throw error(AbstractParser.message("expected", ", or ]", type.getNameOrType()));
                 }
                 next();

                 // check for trailing comma - not allowed in JSON
                 if (type == RBRACKET) {
                     throw error(AbstractParser.message("trailing.comma.in.json", type.getNameOrType()));
                 }
             }
         }

         // Consume RBRACKET before reading finish for the new node.
         next();

         return LiteralNode.newInstance(arrayToken, finish, elements);
     }

     /**
      * Parse an object literal from the token stream.
      *
      * Every comma must separate two property assignments, so leading, repeated
      * and trailing commas are all rejected.
      *
      * @return the object literal as a Node
      */
     private ObjectNode objectLiteral() {
         // Capture LBRACE token.
         final long objectToken = token;
         // LBRACE tested in caller.
         next();

         // Prepare to accumulate elements.
         final List<PropertyNode> elements = new ArrayList<>();

         if (type != RBRACE) {
             while (true) {
                 // A property is mandatory here; propertyAssignment() raises an
                 // error for anything else, including a leading or repeated comma.
                 elements.add(propertyAssignment());

                 if (type == RBRACE) {
                     break;
                 }

                 // Comma between property assignments is mandatory in JSON.
                 if (type != COMMARIGHT) {
                     throw error(AbstractParser.message("expected", ", or }", type.getNameOrType()));
                 }
                 next();

                 // check for trailing comma - not allowed in JSON
                 if (type == RBRACE) {
                     throw error(AbstractParser.message("trailing.comma.in.json", type.getNameOrType()));
                 }
             }
         }

         // Consume RBRACE before reading finish for the new node.
         next();

         // Construct new object literal.
         return new ObjectNode(objectToken, finish, elements);
     }

     /**
      * Parse a property assignment (string name, colon, JSON literal) from the token stream
      * @return the property assignment as a Node
      */
     private PropertyNode propertyAssignment() {
         // Capture firstToken.
         final long propertyToken = token;
         LiteralNode<?> name = null;

         // Only string tokens are valid property names in JSON.
         if (type == STRING) {
             name = getStringLiteral();
         } else if (type == ESCSTRING) {
             name = getLiteral();
         }

         if (name == null) {
             // Raise an error.
             throw error(AbstractParser.message("expected", "string", type.getNameOrType()));
         }

         expect(COLON);
         final Expression value = jsonLiteral();
         return new PropertyNode(propertyToken, value.getFinish(), name, value, null, null);
     }

 }
	/*
	* Copyright (c) 2010, 2013, Oracle and/or its affiliates. All rights reserved.
	* DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
	*
	* This code is free software; you can redistribute it and/or modify it
	* under the terms of the GNU General Public License version 2 only, as
	* published by the Free Software Foundation. Oracle designates this
	* particular file as subject to the "Classpath" exception as provided
	* by Oracle in the LICENSE file that accompanied this code.
	*
	* This code is distributed in the hope that it will be useful, but WITHOUT
	* ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
	* FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
	* version 2 for more details (a copy is included in the LICENSE file that
	* accompanied this code).
	*
	* You should have received a copy of the GNU General Public License version
	* 2 along with this work; if not, write to the Free Software Foundation,
	* Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA.
	*
	* Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA
	* or visit www.oracle.com if you need additional information or have any
	* questions.
	*/

	package jdk.nashorn.internal.parser;

	import static jdk.nashorn.internal.parser.TokenType.COLON;
	import static jdk.nashorn.internal.parser.TokenType.COMMARIGHT;
	import static jdk.nashorn.internal.parser.TokenType.EOF;
	import static jdk.nashorn.internal.parser.TokenType.ESCSTRING;
	import static jdk.nashorn.internal.parser.TokenType.RBRACE;
	import static jdk.nashorn.internal.parser.TokenType.RBRACKET;
	import static jdk.nashorn.internal.parser.TokenType.STRING;

	import java.util.ArrayList;
	import java.util.List;
	import jdk.nashorn.internal.ir.Expression;
	import jdk.nashorn.internal.ir.LiteralNode;
	import jdk.nashorn.internal.ir.Node;
	import jdk.nashorn.internal.ir.ObjectNode;
	import jdk.nashorn.internal.ir.PropertyNode;
	import jdk.nashorn.internal.ir.UnaryNode;
	import jdk.nashorn.internal.runtime.ErrorManager;
	import jdk.nashorn.internal.runtime.Source;

	/**
	* Parses JSON text and returns the corresponding IR node. This is derived from the objectLiteral production of the main parser.
	*
	* See: 15.12.1.2 The JSON Syntactic Grammar
	*/
	public class JSONParser extends AbstractParser {

	/**
	* Constructor
	* @param source the source
	* @param errors the error manager
	*/
	public JSONParser(final Source source, final ErrorManager errors) {
	super(source, errors, false, 0);
	}

	/**
	* Implementation of the Quote(value) operation as defined in the ECMA script spec
	* It wraps a String value in double quotes and escapes characters within in
	*
	* @param value string to quote
	*
	* @return quoted and escaped string
	*/
	public static String quote(final String value) {

	final StringBuilder product = new StringBuilder();

	product.append("\"");

	for (final char ch : value.toCharArray()) {
	// TODO: should use a table?
	switch (ch) {
	case '\\':
	product.append("\\\\");
	break;
	case '"':
	product.append("\\\"");
	break;
	case '\b':
	product.append("\\b");
	break;
	case '\f':
	product.append("\\f");
	break;
	case '\n':
	product.append("\\n");
	break;
	case '\r':
	product.append("\\r");
	break;
	case '\t':
	product.append("\\t");
	break;
	default:
	if (ch < ' ') {
	product.append(Lexer.unicodeEscape(ch));
	break;
	}

	product.append(ch);
	break;
	}
	}

	product.append("\"");

	return product.toString();
	}

	/**
	* Public parsed method - start lexing a new token stream for
	* a JSON script
	*
	* @return the JSON literal
	*/
	public Node parse() {
	stream = new TokenStream();

	lexer = new Lexer(source, stream) {

	@Override
	protected boolean skipComments() {
	return false;
	}

	@Override
	protected boolean isStringDelimiter(final char ch) {
	return ch == '\"';
	}

	// ECMA 15.12.1.1 The JSON Lexical Grammar - JSONWhiteSpace
	@Override
	protected boolean isWhitespace(final char ch) {
	return Lexer.isJsonWhitespace(ch);
	}

	@Override
	protected boolean isEOL(final char ch) {
	return Lexer.isJsonEOL(ch);
	}

	// ECMA 15.12.1.1 The JSON Lexical Grammar - JSONNumber
	@Override
	protected void scanNumber() {
	// Record beginning of number.
	final int startPosition = position;
	// Assume value is a decimal.
	TokenType valueType = TokenType.DECIMAL;

	// floating point can't start with a "." with no leading digit before
	if (ch0 == '.') {
	error(Lexer.message("json.invalid.number"), STRING, position, limit);
	}

	// First digit of number.
	final int digit = convertDigit(ch0, 10);

	// skip first digit
	skip(1);

	if (digit != 0) {
	// Skip over remaining digits.
	while (convertDigit(ch0, 10) != -1) {
	skip(1);
	}
	}

	if (ch0 == '.' \|\| ch0 == 'E' \|\| ch0 == 'e') {
	// Must be a double.
	if (ch0 == '.') {
	// Skip period.
	skip(1);

	boolean mantissa = false;
	// Skip mantissa.
	while (convertDigit(ch0, 10) != -1) {
	mantissa = true;
	skip(1);
	}

	if (! mantissa) {
	// no digit after "."
	error(Lexer.message("json.invalid.number"), STRING, position, limit);
	}
	}

	// Detect exponent.
	if (ch0 == 'E' \|\| ch0 == 'e') {
	// Skip E.
	skip(1);
	// Detect and skip exponent sign.
	if (ch0 == '+' \|\| ch0 == '-') {
	skip(1);
	}
	boolean exponent = false;
	// Skip exponent.
	while (convertDigit(ch0, 10) != -1) {
	exponent = true;
	skip(1);
	}

	if (! exponent) {
	// no digit after "E"
	error(Lexer.message("json.invalid.number"), STRING, position, limit);
	}
	}

	valueType = TokenType.FLOATING;
	}

	// Add number token.
	add(valueType, startPosition);
	}

	// ECMA 15.12.1.1 The JSON Lexical Grammar - JSONEscapeCharacter
	@Override
	protected boolean isEscapeCharacter(final char ch) {
	switch (ch) {
	case '"':
	case '/':
	case '\\':
	case 'b':
	case 'f':
	case 'n':
	case 'r':
	case 't':
	// could be unicode escape
	case 'u':
	return true;
	default:
	return false;
	}
	}
	};

	k = -1;

	next();

	final Node resultNode = jsonLiteral();
	expect(EOF);

	return resultNode;
	}

	@SuppressWarnings("fallthrough")
	private LiteralNode<?> getStringLiteral() {
	final LiteralNode<?> literal = getLiteral();
	final String str = (String)literal.getValue();

	for (int i = 0; i < str.length(); i++) {
	final char ch = str.charAt(i);
	switch (ch) {
	default:
	if (ch > 0x001f) {
	break;
	}
	case '"':
	case '\\':
	throw error(AbstractParser.message("unexpected.token", str));
	}
	}

	return literal;
	}

	/**
	* Parse a JSON literal from the token stream
	* @return the JSON literal as a Node
	*/
	private Expression jsonLiteral() {
	final long literalToken = token;

	switch (type) {
	case STRING:
	return getStringLiteral();
	case ESCSTRING:
	case DECIMAL:
	case FLOATING:
	return getLiteral();
	case FALSE:
	next();
	return LiteralNode.newInstance(literalToken, finish, false);
	case TRUE:
	next();
	return LiteralNode.newInstance(literalToken, finish, true);
	case NULL:
	next();
	return LiteralNode.newInstance(literalToken, finish);
	case LBRACKET:
	return arrayLiteral();
	case LBRACE:
	return objectLiteral();
	/*
	* A.8.1 JSON Lexical Grammar
	*
	* JSONNumber :: See 15.12.1.1
	* -opt DecimalIntegerLiteral JSONFractionopt ExponentPartopt
	*/
	case SUB:
	next();

	final long realToken = token;
	final Object value = getValue();

	if (value instanceof Number) {
	next();
	return new UnaryNode(literalToken, LiteralNode.newInstance(realToken, finish, (Number)value));
	}

	throw error(AbstractParser.message("expected", "number", type.getNameOrType()));
	default:
	break;
	}

	throw error(AbstractParser.message("expected", "json literal", type.getNameOrType()));
	}

	/**
	* Parse an array literal from the token stream
	* @return the array literal as a Node
	*/
	private LiteralNode<Expression[]> arrayLiteral() {
	// Unlike JavaScript array literals, elison is not permitted in JSON.

	// Capture LBRACKET token.
	final long arrayToken = token;
	// LBRACKET tested in caller.
	next();

	LiteralNode<Expression[]> result = null;
	// Prepare to accummulating elements.
	final List<Expression> elements = new ArrayList<>();

	loop:
	while (true) {
	switch (type) {
	case RBRACKET:
	next();
	result = LiteralNode.newInstance(arrayToken, finish, elements);
	break loop;

	case COMMARIGHT:
	next();
	// check for trailing comma - not allowed in JSON
	if (type == RBRACKET) {
	throw error(AbstractParser.message("trailing.comma.in.json", type.getNameOrType()));
	}
	break;

	default:
	// Add expression element.
	elements.add(jsonLiteral());
	// Comma between array elements is mandatory in JSON.
	if (type != COMMARIGHT && type != RBRACKET) {
	throw error(AbstractParser.message("expected", ", or ]", type.getNameOrType()));
	}
	break;
	}
	}

	return result;
	}

	/**
	* Parse an object literal from the token stream
	* @return the object literal as a Node
	*/
	private ObjectNode objectLiteral() {
	// Capture LBRACE token.
	final long objectToken = token;
	// LBRACE tested in caller.
	next();

	// Prepare to accumulate elements.
	final List<PropertyNode> elements = new ArrayList<>();

	// Create a block for the object literal.
	loop:
	while (true) {
	switch (type) {
	case RBRACE:
	next();
	break loop;

	case COMMARIGHT:
	next();
	// check for trailing comma - not allowed in JSON
	if (type == RBRACE) {
	throw error(AbstractParser.message("trailing.comma.in.json", type.getNameOrType()));
	}
	break;

	default:
	// Get and add the next property.
	final PropertyNode property = propertyAssignment();
	elements.add(property);

	// Comma between property assigments is mandatory in JSON.
	if (type != RBRACE && type != COMMARIGHT) {
	throw error(AbstractParser.message("expected", ", or }", type.getNameOrType()));
	}
	break;
	}
	}

	// Construct new object literal.
	return new ObjectNode(objectToken, finish, elements);
	}

	/**
	* Parse a property assignment from the token stream
	* @return the property assignment as a Node
	*/
	private PropertyNode propertyAssignment() {
	// Capture firstToken.
	final long propertyToken = token;
	LiteralNode<?> name = null;

	if (type == STRING) {
	name = getStringLiteral();
	} else if (type == ESCSTRING) {
	name = getLiteral();
	}

	if (name != null) {
	expect(COLON);
	final Expression value = jsonLiteral();
	return new PropertyNode(propertyToken, value.getFinish(), name, value, null, null);
	}

	// Raise an error.
	throw error(AbstractParser.message("expected", "string", type.getNameOrType()));
	}

	}