// Copyright 2009 the V8 project authors. All rights reserved.
// Redistribution and use in source and binary forms, with or without
// modification, are permitted provided that the following conditions are
// met:
//
//     * Redistributions of source code must retain the above copyright
//       notice, this list of conditions and the following disclaimer.
//     * Redistributions in binary form must reproduce the above
//       copyright notice, this list of conditions and the following
//       disclaimer in the documentation and/or other materials provided
//       with the distribution.
//     * Neither the name of Google Inc. nor the names of its
//       contributors may be used to endorse or promote products derived
//       from this software without specific prior written permission.
//
// THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
// "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
// LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
// A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
// OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
// SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
// LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
// DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
// THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
// (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
// OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.


/**
 * Parser for lines of comma-separated values.
 *
 * Fields are not quoted: every ',' in a line is a field separator, so a
 * literal comma inside a field has to be written as an escape sequence
 * (for example \x2C). Each field is unescaped after the line is split.
 */
class CsvParser {
  /**
   * Decodes the escape sequences in a single field.
   *
   * Recognized sequences:
   *   \n      -> line feed
   *   \\      -> a single backslash
   *   \xHH    -> the character with the given 2-digit hex code
   *   \uHHHH  -> the UTF-16 code unit with the given 4-digit hex code
   *
   * A backslash that does not start one of these sequences (unknown
   * identifier, truncated or non-hex digits, trailing backslash) is kept
   * verbatim, so malformed input is never turned into a NUL character and
   * never swallows the characters that follow it.
   *
   * @param {string} string Raw field text.
   * @returns {string} The field with all well-formed escapes decoded.
   */
  escapeField(string) {
    // Fast path: a field without a backslash cannot contain an escape.
    if (!string.includes('\\')) return string;

    // Matches are found left to right and never overlap, so in `\\n` the
    // escaped backslash is consumed first and the `n` stays a plain letter.
    return string.replace(
        /\\(n|\\|x[0-9a-fA-F]{2}|u[0-9a-fA-F]{4})/g,
        (_match, body) => {
          if (body === 'n') return '\n';
          if (body === '\\') return '\\';
          // body is 'x' or 'u' followed by validated hex digits.
          return String.fromCharCode(Number.parseInt(body.slice(1), 16));
        });
  }

  /**
   * Parses a line of CSV-encoded values.
   *
   * An empty line yields an empty array. Otherwise the line is split on
   * every comma (empty fields are preserved, including a trailing one) and
   * each field is passed through escapeField().
   *
   * @param {string} line Input line.
   * @returns {string[]} The unescaped fields of the line.
   */
  parseLine(line) {
    if (line.length === 0) return [];
    return line.split(',').map((field) => this.escapeField(field));
  }
}
106