Refactoring of the string path syntax parser (#115)

* recursive toPath * 🔨 smaller functions * 🔨 simpler parseQuotedBracketNotation Ain't RegExp cool? * 🔨 parseBareBracketNotation using regexp * 👌 🔨 use functions more aligned with intent * 💡 🎨 jsdoc and split long lines * 🔨 moar regexes? * 🔨 only regexes! 😈 * 🔨 better readability (?) using a helper match function * ✨ path syntax: leading dot now ignored * 🔨 renamed vars to avoid shadowing * 🔨 path syntax parser: match function spreads results into downstream functions * 🚨 fix lint * 💡 fix jsdoc * 👌 🔨 explicit regexp parser creation * 👌 🔨 parser combinators * 🔨 adapting to new code organization * ⏪ reverting merge mistakes * 💡 fix jsdoc
zenika-open-source · Nov 29, 2017 · c41b27c · c41b27c
1 parent 132d1ff
commit c41b27c
Show file tree

Hide file tree

Showing 5 changed files with 159 additions and 168 deletions.
diff --git a/packages/immutadot/src/core/parser.utils.js b/packages/immutadot/src/core/parser.utils.js
@@ -0,0 +1,74 @@
+/**
+ * @typedef {function(string): T | null} Parser<T>
+ * @memberof core
+ * @private
+ * @since 1.0.0
+ */
+
+const maybeMap = (maybe, fn) => maybe === null ? maybe : fn(maybe) // null passes through; any other value is given to fn
+
+/**
+ * Creates a parser from a regular expression: the input string is matched against it and the match array
+ * minus its first entry (the capture groups, for a non-global regexp) is returned, or <code>null</code> if nothing matches.
+ * @function
+ * @memberof core
+ * @param {RegExp} regexp the regular expression
+ * @return {core.Parser<string[]>} the resulting parser
+ * @private
+ * @since 1.0.0
+ */
+export const regexp = regexp => str => maybeMap(str.match(regexp), match => match.slice(1))
+
+/**
+ * Returns a new parser that will return <code>null</code> if a predicate about
+ * the result of another parser does not hold. If the predicate holds then
+ * the new parser returns the result of the other parser unchanged.
+ * @function
+ * @memberof core
+ * @param {core.Parser<T>} parser parser to filter
+ * @param {function(T): boolean} predicate predicate to use, only called when the parser result is not <code>null</code>
+ * @return {core.Parser<T>} resulting parser
+ * @private
+ * @since 1.0.0
+ */
+export const filter = (parser, predicate) => str => maybeMap(parser(str), parsed => predicate(parsed) ? parsed : null)
+
+/**
+ * Returns a new parser which will post-process the non-null result of another parser (<code>null</code> is returned as is).
+ * @function
+ * @memberof core
+ * @param {core.Parser<T>} parser parser for which to process the result
+ * @param {function(T): R} mapper function to transform the result of the parser, not called on <code>null</code>
+ * @return {core.Parser<R>} resulting parser
+ * @private
+ * @since 1.0.0
+ */
+export const map = (parser, mapper) => str => maybeMap(parser(str), mapper)
+
+/**
+ * Returns a new parser that attempts parsing with a first parser then falls
+ * back to a second parser, called with the same string, if the first returns <code>null</code>.
+ * @function
+ * @memberof core
+ * @param {core.Parser<A>} parser the first parser
+ * @param {core.Parser<B>} other the second parser
+ * @return {core.Parser<A | B>} resulting parser
+ * @private
+ * @since 1.0.0
+ */
+export const fallback = (parser, other) => str => {
+  const parsed = parser(str)
+  if (parsed !== null) return parsed // first parser succeeded, the second one is never called
+  return other(str)
+}
+
+/**
+ * Chains a list of parsers together using <code>fallback</code>: the first non-null result wins.
+ * @function
+ * @memberof core
+ * @param {Array<core.Parser<*>>} parsers a non-empty list of parsers to try in order (reduce is called without an initial value)
+ * @return {core.Parser<*>} resulting parser
+ * @private
+ * @since 1.0.0
+ */
+export const race = parsers => parsers.reduce((chainedParser, parser) => fallback(chainedParser, parser))
diff --git a/packages/immutadot/src/core/path.utils.js b/packages/immutadot/src/core/path.utils.js
@@ -10,6 +10,8 @@ const getSliceBound = (value, defaultValue, length) => {
 
 /**
  * Get the actual bounds of a slice.
+ * @function
+ * @memberof core
  * @param {Array<number>} bounds The bounds of the slice
  * @param {number} length The length of the actual array
  * @returns {Array<number>} The actual bounds of the slice

diff --git a/packages/immutadot/src/core/toPath.js b/packages/immutadot/src/core/toPath.js
@@ -1,3 +1,10 @@
+import {
+  filter,
+  map,
+  race,
+  regexp,
+} from './parser.utils'
+
 import {
   isSymbol,
   toString,
@@ -24,44 +31,18 @@ const toKey = arg => {
   return toString(arg)
 }
 
-const quotes = ['"', '\'']
-
 /**
- * Tests whether <code>index</code>th char of <code>str</code> is a quote.<br />
- * Quotes are <code>"</code> and <code>'</code>.
+ * Strip backslashes preceding occurrences of <code>quote</code> from <code>str</code><br />
+ * Possible quotes are <code>"</code> and <code>'</code>.
  * @function
  * @param {string} str The string
- * @param {number} index Index of the char to test
- * @return {{ quoted: boolean, quote: string }} A boolean <code>quoted</code>, true if <code>str.charAt(index)</code> is a quote and the <code>quote</code>.
+ * @param {string} quote The quote to unescape
+ * @return {string} The unescaped string
  * @memberof core
  * @private
  * @since 1.0.0
  */
-const isQuoteChar = (str, index) => {
-  const char = str.charAt(index)
-  const quote = quotes.find(c => c === char)
-  return {
-    quoted: Boolean(quote),
-    quote,
-  }
-}
-
-const escapedQuotesRegexps = {}
-for (const quote of quotes)
-  escapedQuotesRegexps[quote] = new RegExp(`\\\\${quote}`, 'g')
-
-  /**
-   * Strip slashes preceding occurences of <code>quote</code> from <code>str</code><br />
-   * Possible quotes are <code>"</code> and <code>'</code>.
-   * @function
-   * @param {string} str The string
-   * @param {string} quote The quote to unescape
-   * @return {string} The unescaped string
-   * @memberof core
-   * @private
-   * @since 1.0.0
-   */
-const unescapeQuotes = (str, quote) => str.replace(escapedQuotesRegexps[quote], quote)
+const unescapeQuotes = (str, quote) => str.replace(new RegExp(`\\\\${quote}`, 'g'), quote) // every backslash-quote pair becomes the bare quote
 
 /**
  * Converts <code>str</code> to a slice index.
@@ -77,13 +58,25 @@ const toSliceIndex = str => str === '' ? undefined : Number(str)
 /**
  * Tests whether <code>arg</code> is a valid slice index, that is <code>undefined</code> or a valid int.
  * @function
+ * @memberof core
  * @param {*} arg The value to test
  * @return {boolean} True if <code>arg</code> is a valid slice index, false otherwise.
  * @private
  * @since 1.0.0
  */
 const isSliceIndex = arg => arg === undefined || Number.isSafeInteger(arg)
 
+/**
+ * Tests whether <code>arg</code> is a valid slice index once converted to a number (a falsy <code>arg</code> counts as <code>undefined</code>).
+ * @function
+ * @memberof core
+ * @param {*} arg The value to test
+ * @return {boolean} True if <code>arg</code> is a valid slice index once converted to a number, false otherwise.
+ * @private
+ * @since 1.0.0
+ */
+const isSliceIndexString = arg => isSliceIndex(arg ? Number(arg) : undefined)
+
 /**
  * Wraps <code>fn</code> allowing to call it with an array instead of a string.<br />
  * The returned function behaviour is :<br />
@@ -102,6 +95,50 @@ const allowingArrays = fn => arg => {
   return fn(toString(arg))
 }
 
+const emptyStringParser = str => str.length === 0 ? [] : null // empty input yields an empty path; anything else is left to other parsers
+
+const quotedBracketNotationParser = map( // bracket, quote, key, same quote, then optional ] and optional dot; the rest is parsed recursively
+  regexp(/^\[(['"])(.*?[^\\])\1\]?\.?(.*)$/),
+  ([quote, property, rest]) => [unescapeQuotes(property, quote), ...stringToPath(rest)],
+)
+
+const incompleteQuotedBracketNotationParser = map( // input starting with [ and a quote: the remainder becomes one key, or nothing if empty
+  regexp(/^\[["'](.*)$/),
+  ([rest]) => rest ? [rest] : [],
+)
+
+const bareBracketNotationParser = map( // [key] then optional dot; key becomes a number when isIndex accepts Number(key), else stays a string
+  regexp(/^\[([^\]]*)\]\.?(.*)$/),
+  ([property, rest]) => {
+    return isIndex(Number(property))
+      ? [Number(property), ...stringToPath(rest)]
+      : [property, ...stringToPath(rest)]
+  },
+)
+
+const incompleteBareBracketNotationParser = map( // input starting with [ (no closing bracket required): the remainder becomes one key, or nothing if empty
+  regexp(/^\[(.*)$/),
+  ([rest]) => rest ? [rest] : [],
+)
+
+const sliceNotationParser = map( // [start:end] then optional dot; each bound may be empty and must satisfy isSliceIndexString
+  filter(
+    regexp(/^\[([^:\]]*):([^:\]]*)\]\.?(.*)$/),
+    ([sliceStart, sliceEnd]) => isSliceIndexString(sliceStart) && isSliceIndexString(sliceEnd),
+  ),
+  ([sliceStart, sliceEnd, rest]) => [[toSliceIndex(sliceStart), toSliceIndex(sliceEnd)], ...stringToPath(rest)],
+)
+
+const pathSegmentEndedByDotParser = map( // text without dot or bracket up to a dot; the dot is dropped and the rest is parsed recursively
+  regexp(/^([^.[]*?)\.(.*)$/),
+  ([beforeDot, afterDot]) => [beforeDot, ...stringToPath(afterDot)],
+)
+
+const pathSegmentEndedByBracketParser = map( // text without dot or bracket up to an opening bracket, which is kept for the recursive parse
+  regexp(/^([^.[]*?)(\[.*)$/),
+  ([beforeBracket, atBracket]) => [beforeBracket, ...stringToPath(atBracket)],
+)
+
 /**
  * Converts <code>str</code> to a path represented as an array of keys.
  * @function
@@ -111,141 +148,17 @@ const allowingArrays = fn => arg => {
  * @private
  * @since 1.0.0
  */
-const stringToPath = str => {
-  const path = []
-  let index = 0
-
-  while (true) { // eslint-disable-line no-constant-condition
-    // Look for new dot or opening square bracket
-    const nextPointIndex = str.indexOf('.', index)
-    const nextBracketIndex = str.indexOf('[', index)
-
-    // If neither one is found add the end of str to the path and stop
-    if (nextPointIndex === -1 && nextBracketIndex === -1) {
-      path.push(str.substring(index))
-      break
-    }
-
-    let isArrayNotation = false
-
-    // If a dot is found before an opening square bracket
-    if (nextPointIndex !== -1 && (nextBracketIndex === -1 || nextPointIndex < nextBracketIndex)) {
-      // Add the text preceding the dot to the path and move index after the dot
-      path.push(str.substring(index, nextPointIndex))
-      index = nextPointIndex + 1
-
-      // If an opening square bracket follows the dot,
-      // enable array notation and move index after the bracket
-      if (nextBracketIndex === nextPointIndex + 1) {
-        isArrayNotation = true
-        index = nextBracketIndex + 1
-      }
-
-    // If an opening square bracket is found before a dot
-    } else if (nextBracketIndex !== -1) {
-      // Enable array notation
-      isArrayNotation = true
-
-      // If any text precedes the bracket, add it to the path
-      if (nextBracketIndex !== index)
-        path.push(str.substring(index, nextBracketIndex))
-
-      // Move index after the bracket
-      index = nextBracketIndex + 1
-    }
-
-    // If array notation is enabled
-    if (isArrayNotation) {
-      // Check if next character is a string quote
-      const { quoted, quote } = isQuoteChar(str, index)
-
-      // If array index is a quoted string
-      if (quoted) {
-        // Move index after the string quote
-        index++
-
-        // Look for the next unescaped matching string quote
-        let endQuoteIndex, quotedIndex = index
-        do {
-          endQuoteIndex = str.indexOf(quote, quotedIndex)
-          quotedIndex = endQuoteIndex + 1
-        } while (endQuoteIndex !== -1 && str.charAt(endQuoteIndex - 1) === '\\')
-
-        // If no end quote found, stop if end of str is reached, or continue to next iteration
-        if (endQuoteIndex === -1) {
-          if (index !== str.length) path.push(str.substring(index))
-          break
-        }
-
-        // Add the content of quotes to the path, unescaping escaped quotes
-        path.push(unescapeQuotes(str.substring(index, endQuoteIndex), quote))
-
-        // Move index after end quote
-        index = endQuoteIndex + 1
-
-        // If next character is a closing square bracket, move index after it
-        if (str.charAt(index) === ']') index++
-
-        // Stop if end of str has been reached
-        if (index === str.length) break
-
-        // If next character is a dot, move index after it (skip it)
-        if (str.charAt(index) === '.') index++
-
-      } else { // If array index is not a quoted string
-
-        // Look for the closing square bracket
-        const closingBracketIndex = str.indexOf(']', index)
-
-        // If no closing bracket found, stop if end of str is reached, or continue to next iteration
-        if (closingBracketIndex === -1) {
-          if (index !== str.length) path.push(str.substring(index))
-          break
-        }
-
-        // Fetch the content of brackets and move index after closing bracket
-        const arrayIndexValue = str.substring(index, closingBracketIndex)
-        index = closingBracketIndex + 1
-
-        // If next character is a dot, move index after it (skip it)
-        if (str.charAt(index) === '.') index++
-
-        // Shorthand: if array index is the whole slice add it to path
-        if (arrayIndexValue === ':') {
-          path.push([undefined, undefined])
-        } else {
-
-          // Look for a slice quote
-          const sliceDelimIndex = arrayIndexValue.indexOf(':')
-
-          // If no slice quote found
-          if (sliceDelimIndex === -1) {
-            // Parse array index as a number
-            const nArrayIndexValue = Number(arrayIndexValue)
-
-            // Add array index to path, either as a valid index (positive int), or as a string
-            path.push(isIndex(nArrayIndexValue) ? nArrayIndexValue : arrayIndexValue)
-
-          } else { // If a slice quote is found
-
-            // Fetch slice start and end, and parse them as slice indexes (empty or valid int)
-            const sliceStart = arrayIndexValue.substring(0, sliceDelimIndex), sliceEnd = arrayIndexValue.substring(sliceDelimIndex + 1)
-            const nSliceStart = toSliceIndex(sliceStart), nSliceEnd = toSliceIndex(sliceEnd)
-
-            // Add array index to path, as a slice if both slice indexes are valid (undefined or int), or as a string
-            path.push(isSliceIndex(nSliceStart) && isSliceIndex(nSliceEnd) ? [nSliceStart, nSliceEnd] : arrayIndexValue)
-          }
-        }
-
-        // Stop if end of string has been reached
-        if (index === str.length) break
-      }
-    }
-
-  }
-
-  return path
-}
+const stringToPath = race([ // parsers are tried in this order; the first non-null result is the path
+  emptyStringParser,
+  quotedBracketNotationParser,
+  incompleteQuotedBracketNotationParser,
+  sliceNotationParser,
+  bareBracketNotationParser,
+  incompleteBareBracketNotationParser,
+  pathSegmentEndedByDotParser,
+  pathSegmentEndedByBracketParser,
+  str => [str], // catch-all: never returns null, the whole string is a single key
+])
 
 const MAX_CACHE_SIZE = 1000
 const cache = new Map()

diff --git a/packages/immutadot/src/core/toPath.spec.js b/packages/immutadot/src/core/toPath.spec.js
@@ -6,8 +6,8 @@ describe('ToPath', () => {
   it('should convert basic path', () => {
     expect(toPath('a.22.ccc')).toEqual(['a', '22', 'ccc'])
     // Empty properties should be kept
-    expect(toPath('.')).toEqual(['', ''])
-    expect(toPath('..')).toEqual(['', '', ''])
+    expect(toPath('.')).toEqual([''])
+    expect(toPath('..')).toEqual(['', ''])
     // If no separators, path should be interpreted as one property
     expect(toPath('\']"\\')).toEqual(['\']"\\'])
   })

diff --git a/packages/immutadot/src/util/lang.js b/packages/immutadot/src/util/lang.js
@@ -33,6 +33,8 @@ const isSymbol = arg => typeof arg === 'symbol'
 
 /**
  * Returns the length of <code>arg</code>.
+ * @function
+ * @memberof util
  * @param {*} arg The value of which length must be returned
  * @returns {number} The length of <code>arg</code>
  * @private