UNPKG

read-excel-file

Version:

Read small to medium `*.xlsx` files in a browser or Node.js. Parse to JSON with a strict schema.

118 lines (107 loc) 7.79 kB
// Transpiled (Babel) CommonJS build of the `readXlsx` module: module prologue,
// sibling-module imports and the first group of Babel runtime helpers.
"use strict";
// Flag the exports object as coming from an ES module; this is the same `__esModule`
// marker that `_interopRequireDefault` below checks for on imported modules.
Object.defineProperty(exports, "__esModule", { value: true });
// `readXlsx` is a function declaration further down in the file, so it is hoisted
// and can already be assigned as the default export here.
exports["default"] = readXlsx;
// Sibling modules. Each one is wrapped so that the callable is always read from `["default"]`.
var _parseProperties = _interopRequireDefault(require("./parseProperties.js"));
var _parseFilePaths = _interopRequireDefault(require("./parseFilePaths.js"));
var _parseStyles = _interopRequireDefault(require("./parseStyles.js"));
var _parseSharedStrings = _interopRequireDefault(require("./parseSharedStrings.js"));
var _parseSheet = _interopRequireDefault(require("./parseSheet.js"));
var _getData = _interopRequireDefault(require("./getData.js"));
// Returns `obj` unchanged when it carries the `__esModule` flag; otherwise wraps it
// as `{ "default": obj }` so callers can uniformly use `module["default"]`.
function _interopRequireDefault(obj) { return obj && obj.__esModule ? obj : { "default": obj }; }
// `typeof` replacement. On the first call it overwrites itself with one of two implementations:
// the native `typeof` when `Symbol` and `Symbol.iterator` are native symbols, or a fallback that
// reports "symbol" for objects constructed by a (polyfilled) `Symbol`. It then re-dispatches the call.
function _typeof(o) { "@babel/helpers - typeof"; return _typeof = "function" == typeof Symbol && "symbol" == typeof Symbol.iterator ? function (o) { return typeof o; } : function (o) { return o && "function" == typeof Symbol && o.constructor === Symbol && o !== Symbol.prototype ? "symbol" : typeof o; }, _typeof(o); }
// Returns a zero-argument "next" function for iterating `o`:
//  - if `o` has a `Symbol.iterator` (or "@@iterator") method, the bound `next` of that iterator;
//  - otherwise, for arrays, values convertible by `_unsupportedIterableToArray`, or (when
//    `allowArrayLike` is truthy) objects with a numeric `length`, an index-based stepper
//    producing `{ done, value }` records;
//  - otherwise it throws a TypeError.
function _createForOfIteratorHelperLoose(o, allowArrayLike) { var it = typeof Symbol !== "undefined" && o[Symbol.iterator] || o["@@iterator"]; if (it) return (it = it.call(o)).next.bind(it); if (Array.isArray(o) || (it = _unsupportedIterableToArray(o)) || allowArrayLike && o && typeof o.length === "number") { if (it) o = it; var i = 0; return function () { if (i >= o.length) return { done: true }; return { done: false, value: o[i++] }; }; } throw new TypeError("Invalid attempt to iterate non-iterable instance.\nIn order to be iterable, non-array objects must have a [Symbol.iterator]() method."); }
// Converts selected non-array values to a real array: strings, `Map`/`Set` (via `Array.from`),
// `Arguments` objects and integer typed arrays (via `_arrayLikeToArray`, defined later in the file).
// The kind is detected from `Object.prototype.toString`, falling back to `constructor.name` for
// plain "Object" tags. Returns `undefined` for falsy input and for anything it does not recognise.
function _unsupportedIterableToArray(o, minLen) { if (!o) return; if (typeof o === "string") return _arrayLikeToArray(o, minLen); var n = Object.prototype.toString.call(o).slice(8, -1); if (n === "Object" && o.constructor) n = o.constructor.name; if (n === "Map" || n === "Set") return Array.from(o); if (n === "Arguments" || /^(?:Ui|I)nt(?:8|16|32)(?:Clamped)?Array$/.test(n)) return _arrayLikeToArray(o, minLen); }
// Copies the first `len` items of an array-like into a new array
// (all of them when `len` is omitted or exceeds `arr.length`).
function _arrayLikeToArray(arr, len) {
  if (len == null || len > arr.length) len = arr.length;
  for (var i = 0, arr2 = new Array(len); i < len; i++) arr2[i] = arr[i];
  return arr2;
}

// Lists the own enumerable string keys of `e` followed by its own symbol keys;
// when `r` is truthy, only enumerable symbols are included.
function ownKeys(e, r) {
  var t = Object.keys(e);
  if (Object.getOwnPropertySymbols) {
    var o = Object.getOwnPropertySymbols(e);
    r && (o = o.filter(function (r) {
      return Object.getOwnPropertyDescriptor(e, r).enumerable;
    })), t.push.apply(t, o);
  }
  return t;
}

// Object-spread helper: copies the properties of every argument after the first onto `e`
// and returns `e`. Arguments at odd positions are copied by value through `_defineProperty`;
// arguments at even positions are copied by property descriptor.
function _objectSpread(e) {
  for (var r = 1; r < arguments.length; r++) {
    var t = null != arguments[r] ? arguments[r] : {};
    r % 2 ? ownKeys(Object(t), !0).forEach(function (r) {
      _defineProperty(e, r, t[r]);
    }) : Object.getOwnPropertyDescriptors ? Object.defineProperties(e, Object.getOwnPropertyDescriptors(t)) : ownKeys(Object(t)).forEach(function (r) {
      Object.defineProperty(e, r, Object.getOwnPropertyDescriptor(t, r));
    });
  }
  return e;
}

// Sets `obj[key] = value`. A key that already exists (own or inherited) is redefined as a
// plain enumerable/configurable/writable data property instead of being assigned.
function _defineProperty(obj, key, value) {
  key = _toPropertyKey(key);
  if (key in obj) {
    Object.defineProperty(obj, key, {
      value: value,
      enumerable: true,
      configurable: true,
      writable: true
    });
  } else {
    obj[key] = value;
  }
  return obj;
}

// Normalises a value to a property key: symbols are kept, everything else becomes a string.
function _toPropertyKey(arg) {
  var key = _toPrimitive(arg, "string");
  return _typeof(key) === "symbol" ? key : String(key);
}

// Converts `input` to a primitive, honouring `Symbol.toPrimitive` when the object defines it.
function _toPrimitive(input, hint) {
  if (_typeof(input) !== "object" || input === null) return input;
  var prim = input[Symbol.toPrimitive];
  if (prim !== undefined) {
    var res = prim.call(input, hint || "default");
    if (_typeof(res) !== "object") return res;
    throw new TypeError("@@toPrimitive must return a primitive value.");
  }
  return (hint === "string" ? String : Number)(input);
}

// For an introduction to reading `*.xlsx` files see "The minimum viable XLSX reader":
// https://www.brendanlong.com/the-minimum-viable-xlsx-reader.html

/**
 * Reads an (unzipped) XLSX file structure and returns the data of one sheet.
 * @param {object} contents - XML files of the XLSX file (which is a zipped directory), keyed by their path inside the archive, e.g. `"xl/workbook.xml"`.
 * @param {object} xml - Forwarded unchanged to every `parse*()` helper (presumably the XML parser implementation to use; confirm against callers).
 * @param {object} [options] - Also forwarded to the sheet parser and to `getData()`.
 * @param {(number|string)?} options.sheet - 1-based sheet number or sheet name (`1` when omitted, `undefined` or `null`).
 * @param {boolean?} options.getSheets - When truthy, only the list of sheets is returned.
 * @param {boolean?} options.properties - When truthy, the spreadsheet properties are returned alongside the data.
 * @param {string?} options.dateFormat - Date format, e.g. "mm/dd/yyyy". Values having this format template set will be parsed as dates.
 * @return {*} `[{ name }, ...]` when `options.getSheets` is set; `{ data, properties }` when `options.properties` is set (`properties` being the parsed workbook properties, e.g. the list of sheets); otherwise just `data`, as produced by `getData()`.
 * @throws {Error} When a required XML file is missing from `contents`, or when the requested sheet doesn't exist.
 */
function readXlsx(contents, xml) {
  var options = arguments.length > 2 && arguments[2] !== undefined ? arguments[2] : {};

  // Default to the first sheet. `options` is spread first so that an own-but-empty
  // `sheet` property (`{ sheet: undefined }`) can't override the default, and the
  // check is limited to `undefined`/`null` so that invalid values such as `0`
  // still produce a "sheet not found" error instead of silently reading sheet #1.
  if (options.sheet === undefined || options.sheet === null) {
    options = _objectSpread(_objectSpread({}, options), {}, {
      sheet: 1
    });
  }

  var getXmlFileContent = function getXmlFileContent(filePath) {
    if (!contents[filePath]) {
      throw new Error("\"".concat(filePath, "\" file not found inside the *.xlsx file zip archive"));
    }
    return contents[filePath];
  };

  // Some Excel editors don't want to use standard naming scheme for sheet files.
  // https://github.com/tidyverse/readxl/issues/104
  var filePaths = (0, _parseFilePaths["default"])(getXmlFileContent('xl/_rels/workbook.xml.rels'), xml);

  // Default file path for "shared strings": "xl/sharedStrings.xml".
  var values = filePaths.sharedStrings ? (0, _parseSharedStrings["default"])(getXmlFileContent(filePaths.sharedStrings), xml) : [];

  // Default file path for "styles": "xl/styles.xml".
  var styles = filePaths.styles ? (0, _parseStyles["default"])(getXmlFileContent(filePaths.styles), xml) : {};

  var properties = (0, _parseProperties["default"])(getXmlFileContent('xl/workbook.xml'), xml);

  // A feature for getting the list of sheets in an Excel file.
  // https://github.com/catamphetamine/read-excel-file/issues/14
  if (options.getSheets) {
    return properties.sheets.map(function (_ref) {
      var name = _ref.name;
      return {
        name: name
      };
    });
  }

  // Find the sheet by its name or by its 1-based number.
  var sheetId = getSheetId(options.sheet, properties.sheets);

  // If the sheet wasn't found then throw an error.
  // Example of a sheet file path: "xl/worksheets/sheet1.xml".
  if (!sheetId || !filePaths.sheets[sheetId]) {
    throw createSheetNotFoundError(options.sheet, properties.sheets);
  }

  // Parse sheet data.
  var sheet = (0, _parseSheet["default"])(getXmlFileContent(filePaths.sheets[sheetId]), xml, values, styles, properties, options);

  options = _objectSpread({
    // Create a `rowMap` for the original dataset, if not passed,
    // because "empty" rows will be dropped from the input data.
    rowMap: []
  }, options);

  // Get spreadsheet data.
  var data = (0, _getData["default"])(sheet, options);

  // Can return properties, if required.
  if (options.properties) {
    return {
      data: data,
      properties: properties
    };
  }

  // Return spreadsheet data.
  return data;
}

/**
 * Resolves a sheet reference to the sheet's relation id.
 * @param {(number|string)} sheet - 1-based sheet number, or sheet name.
 * @param {object[]} [sheets] - Sheet descriptors, each having `name` and `relationId`.
 * @return {string|undefined} The `relationId` of the matching sheet, or `undefined` when there is no match.
 */
function getSheetId(sheet, sheets) {
  // Without a list of sheets nothing can match. Returning `undefined` (rather than
  // crashing on property access) lets the caller raise its "sheet not found" error,
  // which already knows how to deal with a missing list.
  if (!sheets) {
    return undefined;
  }
  if (typeof sheet === 'number') {
    var byNumber = sheets[sheet - 1];
    return byNumber && byNumber.relationId;
  }
  for (var i = 0; i < sheets.length; i++) {
    if (sheets[i].name === sheet) {
      return sheets[i].relationId;
    }
  }
  return undefined;
}

/**
 * Creates (but doesn't throw) the error reported when the requested sheet doesn't exist.
 * @param {(number|string)} sheet - The requested sheet: a number is printed as `#N`, anything else in double quotes.
 * @param {object[]} [sheets] - Known sheets; when present, their names and numbers are appended to the message.
 * @return {Error}
 */
function createSheetNotFoundError(sheet, sheets) {
  var sheetsList = sheets && sheets.map(function (item, i) {
    return "\"".concat(item.name, "\" (#").concat(i + 1, ")");
  }).join(', ');
  return new Error("Sheet ".concat(typeof sheet === 'number' ? '#' + sheet : '"' + sheet + '"', " not found in the *.xlsx file.").concat(sheets ? ' Available sheets: ' + sheetsList + '.' : ''));
}
//# sourceMappingURL=readXlsx.js.map