All files / dsv/base/parse/lib/states quoted_escape.js

45.23% Statements 57/126
100% Branches 1/1
0% Functions 0/1
45.23% Lines 57/126

Press n or j to go to the next uncovered block, b, p or k for the previous block.

1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 1271x 1x 1x 1x 1x 1x 1x 1x 1x 1x 1x 1x 1x 1x 1x 1x 1x 1x 1x 1x 1x 1x 1x 1x 1x 1x 1x 1x 1x 1x 1x 1x 1x 1x 1x 1x 1x 1x 1x 1x 1x 1x 1x 1x 1x 1x 1x 1x 1x 1x 1x 1x                                                                                                                                           1x 1x 1x 1x 1x  
/**
* @license Apache-2.0
*
* Copyright (c) 2022 The Stdlib Authors.
*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
*    http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
 
/* eslint-disable no-underscore-dangle */
 
'use strict';
 
// MODULES //
 
var logger = require( 'debug' );
var state2enum = require( './state2enum.js' );
 
 
// VARIABLES //
 
// Logger for the `state:quoted_escape` debug namespace:
var debug = logger( 'state:quoted_escape' );

// States which this processor may transition the parser to...
var QUOTED_FIELD = state2enum.quoted_field;
var ERROR = state2enum.error;
 
// MAIN //
 
/**
* Creates the character handler used while the parser is inside a quoted field and has just encountered an escape sequence.
*
* ## Notes
*
* -   Within a quoted field, an escape sequence (only) escapes the quote sequence.
* -   When the escape sequence is immediately followed by a quote sequence, the handler rewrites the parser buffer, pushes the current character, and returns the parser to the quoted field state.
* -   In strict mode, when the escape sequence is not immediately followed by a quote sequence, the handler sets an `INVALID_QUOTED_ESCAPE` error and moves the parser to the error state.
* -   In non-strict mode, when the escape sequence is not immediately followed by a quote sequence, the handler raises an `INVALID_QUOTED_ESCAPE` warning, pushes the current character, and returns the parser to the quoted field state.
*
* @private
* @param {Parser} parser - parser instance
* @returns {Function} processing function
*/
function processor( parser ) {
	// Cache parser settings once, as they are read for every processed character:
	var quoteLastIndex = parser._quoteLastIndex;
	var quote = parser._quote;
	var escapeLastIndex = parser._escapeLastIndex;
	var escapeLength = parser._escapeLength;
	var strict = parser._strict;

	return next;

	/**
	* Handles a single character following an escape sequence.
	*
	* @private
	* @param {string} ch - character
	* @returns {void}
	*/
	function next( ch ) {
		var cursor = parser._cursor;
		var escapeIndex = parser._eidx; // position of the last escape character
		var offset = cursor - escapeIndex;

		debug( 'Char: %s', ch );

		// Once the offset from the escape sequence reaches the last index of a quote sequence, we have seen enough characters to decide how to interpret the escape sequence...
		if ( offset >= quoteLastIndex ) {
			if (
				offset === quoteLastIndex &&
				ch === quote[ quoteLastIndex ] &&
				parser._scan( quote, quoteLastIndex )
			) {
				// The escape sequence is immediately followed by a quote sequence (NOTE: presumably the copy/rewind pair drops the escape sequence from the buffer while keeping the quote characters; confirm against the parser implementation):
				debug( 'Quote.' );
				parser._copyWithin( escapeIndex-escapeLastIndex, escapeIndex+1, quoteLastIndex )._rewind( escapeLength )._push( ch )._changeState( QUOTED_FIELD );
			} else if ( strict ) {
				// In strict mode, a quote sequence must immediately follow an escape sequence. As it is unclear how the preceding values should be interpreted (e.g., a stray escape sequence? a missing quote sequence?), we flag an error:
				debug( 'Error.' );
				parser._setErrorState( 'INVALID_QUOTED_ESCAPE' )._changeState( ERROR );
			} else {
				// In non-strict mode, the escape sequence is treated as a normal character sequence and we resume quoted field processing:
				debug( 'Escape sequence is not followed by a quote sequence.' );
				parser._raiseWarning( 'INVALID_QUOTED_ESCAPE' )._push( ch )._changeState( QUOTED_FIELD );
			}
			return;
		}
		// Too few characters have been processed to decide, so buffer the character and remain in the current state:
		parser._push( ch );
	}
}
 
 
// EXPORTS //
 
// Expose the processor factory (accepts a parser instance and returns the per-character handler) as the module's sole export:
module.exports = processor;