UNPKG

kepler.gl

Version:

kepler.gl is a webgl based application to visualize large scale location data in the browser

489 lines (411 loc) 42.7 kB
'use strict'; Object.defineProperty(exports, "__esModule", { value: true }); var _typeof2 = require('babel-runtime/helpers/typeof'); var _typeof3 = _interopRequireDefault(_typeof2); var _extends2 = require('babel-runtime/helpers/extends'); var _extends3 = _interopRequireDefault(_extends2); var _toArray2 = require('babel-runtime/helpers/toArray'); var _toArray3 = _interopRequireDefault(_toArray2); exports.processCsvData = processCsvData; exports.getSampleForTypeAnalyze = getSampleForTypeAnalyze; exports.parseCsvDataByFieldType = parseCsvDataByFieldType; exports.getFieldsFromData = getFieldsFromData; exports.renameDuplicateFields = renameDuplicateFields; exports.analyzerTypeToFieldType = analyzerTypeToFieldType; exports.processRowObject = processRowObject; exports.processGeojson = processGeojson; exports.formatCsv = formatCsv; exports.validateInputData = validateInputData; var _d3Dsv = require('d3-dsv'); var _d3Array = require('d3-array'); var _window = require('global/window'); var _assert = require('assert'); var _assert2 = _interopRequireDefault(_assert); var _typeAnalyzer = require('type-analyzer'); var _geojsonNormalize = require('@mapbox/geojson-normalize'); var _geojsonNormalize2 = _interopRequireDefault(_geojsonNormalize); var _defaultSettings = require('../constants/default-settings'); var _dataUtils = require('../utils/data-utils'); function _interopRequireDefault(obj) { return obj && obj.__esModule ? obj : { default: obj }; } // if any of these value occurs in csv, parse it to null; // Copyright (c) 2018 Uber Technologies, Inc. // // Permission is hereby granted, free of charge, to any person obtaining a copy // of this software and associated documentation files (the "Software"), to deal // in the Software without restriction, including without limitation the rights // to use, copy, modify, merge, publish, distribute, sublicense, and/or sell // copies of the Software, and to permit persons to whom the Software is // furnished to do so, subject to the following conditions: // // The above copyright notice and this permission notice shall be included in // all copies or substantial portions of the Software. // // THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR // IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, // FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE // AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER // LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, // OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN // THE SOFTWARE. var CSV_NULLS = ['', 'null', 'NULL', 'Null', 'NaN']; function processCsvData(rawData) { // here we assume the csv file that people uploaded will have first row // as name of the column var _csvParseRows = (0, _d3Dsv.csvParseRows)(rawData), _csvParseRows2 = (0, _toArray3.default)(_csvParseRows), headerRow = _csvParseRows2[0], rows = _csvParseRows2.slice(1); if (!rows.length || !headerRow) { // looks like an empty file // resolve null, and catch them later in one place return null; } cleanUpFalsyCsvValue(rows); // No need to run type detection on every data point // here we get a list of none null values to run analyze on var sample = getSampleForTypeAnalyze({ fields: headerRow, allData: rows }); var fields = getFieldsFromData(sample, headerRow); fields.forEach(parseCsvDataByFieldType.bind(null, rows)); return { fields: fields, rows: rows }; } /** * get fields from csv data * * @param {array} fields - an array of fields name * @param {array} allData * @param {array} sampleCount * @returns {array} formatted fields */ function getSampleForTypeAnalyze(_ref) { var fields = _ref.fields, allData = _ref.allData, _ref$sampleCount = _ref.sampleCount, sampleCount = _ref$sampleCount === undefined ? 50 : _ref$sampleCount; var total = Math.min(sampleCount, allData.length); // const fieldOrder = fields.map(f => f.name); var sample = (0, _d3Array.range)(0, total, 1).map(function (d) { return {}; }); // collect sample data for each field fields.forEach(function (field, fieldIdx) { // data counter var i = 0; // sample counter var j = 0; while (j < total) { if (i >= allData.length) { // if depleted data pool sample[j][field] = null; j++; } else if ((0, _dataUtils.notNullorUndefined)(allData[i][fieldIdx])) { sample[j][field] = allData[i][fieldIdx]; j++; i++; } else { i++; } } }); return sample; } function cleanUpFalsyCsvValue(rows) { for (var i = 0; i < rows.length; i++) { for (var j = 0; j < rows[i].length; j++) { // analyzer will set any fields to 'string' if there are empty values // which will be parsed as '' by d3.csv // here we parse empty data as null // TODO: create warning when deltect `CSV_NULLS` in the data if (!rows[i][j] || CSV_NULLS.includes(rows[i][j])) { rows[i][j] = null; } } } } /** * Process uploaded csv file to parse value by field type * * @param {array} rows * @param {object} field * @param {number} i * @returns {void} */ function parseCsvDataByFieldType(rows, field, i) { var unixFormat = ['x', 'X']; rows.forEach(function (row) { if (row[i] !== null) { switch (field.type) { case _defaultSettings.ALL_FIELD_TYPES.real: row[i] = parseFloat(row[i]); break; // TODO: timestamp can be either '1495827326' or '2016-03-10 11:20' // if it's '1495827326' we pass it to int case _defaultSettings.ALL_FIELD_TYPES.timestamp: row[i] = unixFormat.includes(field.format) ? Number(row[i]) : row[i]; break; case _defaultSettings.ALL_FIELD_TYPES.integer: row[i] = parseInt(row[i], 10); break; case _defaultSettings.ALL_FIELD_TYPES.boolean: // 0 and 1 only field can also be boolean row[i] = row[i] === 'true' || row[i] === 'True' || row[i] === '1'; break; default: break; } } }); } /** * get fields from csv data * * @param {array} data * @param {array} fieldOrder * @returns {array} formatted fields */ function getFieldsFromData(data, fieldOrder) { // add a check for epoch timestamp var metadata = _typeAnalyzer.Analyzer.computeColMeta(data, [{ regex: /.*geojson|all_points/g, dataType: 'GEOMETRY' }]); var _renameDuplicateField = renameDuplicateFields(fieldOrder), fieldByIndex = _renameDuplicateField.fieldByIndex; return fieldOrder.reduce(function (orderedArray, field, index) { var name = fieldByIndex[index]; var fieldMeta = metadata.find(function (m) { return m.key === field; }); var _ref2 = fieldMeta || {}, type = _ref2.type, format = _ref2.format; orderedArray[index] = { name: name, format: format, // need this for mapbuilder conversion: filter type detection // category, tableFieldIndex: index + 1, type: analyzerTypeToFieldType(type) }; return orderedArray; }, []); } /** * pass in an array of field names, rename duplicated one * and return a map from old field index to new name * * @param {array} fieldOrder * @returns {Object} new field name by index */ function renameDuplicateFields(fieldOrder) { return fieldOrder.reduce(function (accu, field, i) { var allNames = accu.allNames; var fieldName = field; // add a counter to duplicated names if (allNames.includes(field)) { var counter = 0; while (allNames.includes(field + '-' + counter)) { counter++; } fieldName = field + '-' + counter; } accu.fieldByIndex[i] = fieldName; accu.allNames.push(fieldName); return accu; }, { allNames: [], fieldByIndex: {} }); } /** * Map Analyzer types to local field types * * @param {string} aType * @returns {string} corresponding type in ALL_FIELD_TYPES */ /* eslint-disable complexity */ function analyzerTypeToFieldType(aType) { var DATE = _typeAnalyzer.DATA_TYPES.DATE, TIME = _typeAnalyzer.DATA_TYPES.TIME, DATETIME = _typeAnalyzer.DATA_TYPES.DATETIME, NUMBER = _typeAnalyzer.DATA_TYPES.NUMBER, INT = _typeAnalyzer.DATA_TYPES.INT, FLOAT = _typeAnalyzer.DATA_TYPES.FLOAT, BOOLEAN = _typeAnalyzer.DATA_TYPES.BOOLEAN, STRING = _typeAnalyzer.DATA_TYPES.STRING, CITY = _typeAnalyzer.DATA_TYPES.CITY, GEOMETRY = _typeAnalyzer.DATA_TYPES.GEOMETRY, GEOMETRY_FROM_STRING = _typeAnalyzer.DATA_TYPES.GEOMETRY_FROM_STRING, ZIPCODE = _typeAnalyzer.DATA_TYPES.ZIPCODE, PAIR_GEOMETRY_FROM_STRING = _typeAnalyzer.DATA_TYPES.PAIR_GEOMETRY_FROM_STRING; // TODO: un recognized types // CURRENCY PERCENT NONE switch (aType) { case DATE: return _defaultSettings.ALL_FIELD_TYPES.date; case TIME: case DATETIME: return _defaultSettings.ALL_FIELD_TYPES.timestamp; case NUMBER: case FLOAT: return _defaultSettings.ALL_FIELD_TYPES.real; case INT: return _defaultSettings.ALL_FIELD_TYPES.integer; case BOOLEAN: return _defaultSettings.ALL_FIELD_TYPES.boolean; case GEOMETRY: case GEOMETRY_FROM_STRING: case PAIR_GEOMETRY_FROM_STRING: return _defaultSettings.ALL_FIELD_TYPES.geojson; case STRING: case CITY: case ZIPCODE: return _defaultSettings.ALL_FIELD_TYPES.string; default: _window.console.warn('Unsupported analyzer type: ' + aType); return _defaultSettings.ALL_FIELD_TYPES.string; } } /* eslint-enable complexity */ /* * Process rawData where each row is an object */ function processRowObject(rawData) { if (!rawData.length) { return null; } var keys = Object.keys(rawData[0]); var rows = rawData.map(function (d) { return keys.map(function (key) { return d[key]; }); }); var fields = getFieldsFromData(rawData, keys); return { fields: fields, rows: rows }; } function processGeojson(rawData) { var normalizedGeojson = (0, _geojsonNormalize2.default)(rawData); if (!normalizedGeojson || !Array.isArray(normalizedGeojson.features)) { // fail to normalize geojson return null; } // getting all feature fields var allData = normalizedGeojson.features.reduce(function (accu, f, i) { if (f.geometry) { accu.push((0, _extends3.default)({ // add feature to _geojson field _geojson: f }, f.properties || {})); } return accu; }, []); // get all the field var fields = allData.reduce(function (prev, curr) { Object.keys(curr).forEach(function (key) { if (!prev.includes(key)) { prev.push(key); } }); return prev; }, []); // make sure each feature has exact same fields allData.forEach(function (d) { fields.forEach(function (f) { if (!(f in d)) { d[f] = null; } }); }); return processRowObject(allData); } /** * On export data to csv * @param data * @param fields */ function formatCsv(data, fields) { var columns = fields.map(function (f) { return f.name; }); var formattedData = [columns]; // parse geojson object as string data.forEach(function (row) { formattedData.push(row.map(function (d, i) { return d && _defaultSettings.GEOJSON_FIELDS.geojson.includes(fields[i].name) ? JSON.stringify(d) : d; })); }); return (0, _d3Dsv.csvFormatRows)(formattedData); } /** * @param data * @returns {{allData: Array, fields: Array}} */ function validateInputData(data) { // TODO: add test /* * expected input data format * { * fields: [], * rows: [] * } */ var proceed = true; if (!data) { (0, _assert2.default)('receiveVisData: data cannot be null'); proceed = false; } else if (!Array.isArray(data.fields)) { (0, _assert2.default)('receiveVisData: expect data.fields to be an array'); proceed = false; } else if (!Array.isArray(data.rows)) { (0, _assert2.default)('receiveVisData: expect data.rows to be an array'); proceed = false; } if (!proceed) { return null; } var fields = data.fields, rows = data.rows; // check if all fields has name, format and type var allValid = fields.every(function (f, i) { if ((typeof f === 'undefined' ? 'undefined' : (0, _typeof3.default)(f)) !== 'object') { (0, _assert2.default)('fields needs to be an array of object, but find ' + f); return false; } if (!f.name) { (0, _assert2.default)('field.name is required but missing in field ' + JSON.stringify(f)); // assign a name f.name = 'column_' + i; } if (!_defaultSettings.ALL_FIELD_TYPES[f.type]) { (0, _assert2.default)('unknown field type ' + f.type); return false; } return f.type && f.format && f.name; }); if (allValid) { return { rows: rows, fields: fields }; } // if any field has missing type, recalculate it for everyone // because we simply lost faith in humanity var sampleData = getSampleForTypeAnalyze({ fields: fields.map(function (f) { return f.name; }), allData: rows }); var fieldOrder = fields.map(function (f) { return f.name; }); var meta = getFieldsFromData(sampleData, fieldOrder); var updatedFields = fields.map(function (f, i) { return (0, _extends3.default)({}, f, { type: meta[i].type, format: meta[i].format }); }); return { fields: updatedFields, rows: rows }; } exports.default = { processGeojson: processGeojson, processCsvData: processCsvData, processRowObject: processRowObject, analyzerTypeToFieldType: analyzerTypeToFieldType, getFieldsFromData: getFieldsFromData, parseCsvDataByFieldType: parseCsvDataByFieldType }; //# sourceMappingURL=data:application/json;charset=utf-8;base64,{"version":3,"sources":["../../src/processors/data-processor.js"],"names":["processCsvData","getSampleForTypeAnalyze","parseCsvDataByFieldType","getFieldsFromData","renameDuplicateFields","analyzerTypeToFieldType","processRowObject","processGeojson","formatCsv","validateInputData","CSV_NULLS","rawData","headerRow","rows","length","cleanUpFalsyCsvValue","sample","fields","allData","forEach","bind","sampleCount","total","Math","min","map","field","fieldIdx","i","j","includes","unixFormat","row","type","ALL_FIELD_TYPES","real","parseFloat","timestamp","format","Number","integer","parseInt","boolean","data","fieldOrder","metadata","Analyzer","computeColMeta","regex","dataType","fieldByIndex","reduce","orderedArray","index","name","fieldMeta","find","m","key","tableFieldIndex","accu","allNames","fieldName","counter","push","aType","DATE","AnalyzerDATA_TYPES","TIME","DATETIME","NUMBER","INT","FLOAT","BOOLEAN","STRING","CITY","GEOMETRY","GEOMETRY_FROM_STRING","ZIPCODE","PAIR_GEOMETRY_FROM_STRING","date","geojson","string","globalConsole","warn","keys","Object","d","normalizedGeojson","Array","isArray","features","f","geometry","_geojson","properties","prev","curr","columns","formattedData","GEOJSON_FIELDS","JSON","stringify","proceed","allValid","every","sampleData","meta","updatedFields"],"mappings":";;;;;;;;;;;;;;;;;;QAgCgBA,c,GAAAA,c;QAiCAC,uB,GAAAA,uB;QAmDAC,uB,GAAAA,uB;QAuCAC,iB,GAAAA,iB;QAkCAC,qB,GAAAA,qB;QA+BAC,uB,GAAAA,uB;QAkDAC,gB,GAAAA,gB;QAeAC,c,GAAAA,c;QA+CAC,S,GAAAA,S;QAqBAC,iB,GAAAA,iB;;AA7UhB;;AACA;;AACA;;AACA;;;;AACA;;AACA;;;;AACA;;AACA;;;;AAEA;AA7BA;AACA;AACA;AACA;AACA;AACA;AACA;AACA;AACA;AACA;AACA;AACA;AACA;AACA;AACA;AACA;AACA;AACA;AACA;;AAYA,IAAMC,YAAY,CAAC,EAAD,EAAK,MAAL,EAAa,MAAb,EAAqB,MAArB,EAA6B,KAA7B,CAAlB;;AAEO,SAASV,cAAT,CAAwBW,OAAxB,EAAiC;;AAEtC;AACA;AAHsC,sBAKT,yBAAaA,OAAb,CALS;AAAA;AAAA,MAK/BC,SAL+B;AAAA,MAKjBC,IALiB;;AAOtC,MAAI,CAACA,KAAKC,MAAN,IAAgB,CAACF,SAArB,EAAgC;AAC9B;AACA;AACA,WAAO,IAAP;AACD;;AAEDG,uBAAqBF,IAArB;AACA;AACA;AACA,MAAMG,SAASf,wBAAwB,EAACgB,QAAQL,SAAT,EAAoBM,SAASL,IAA7B,EAAxB,CAAf;;AAEA,MAAMI,SAASd,kBAAkBa,MAAlB,EAA0BJ,SAA1B,CAAf;;AAEAK,SAAOE,OAAP,CAAejB,wBAAwBkB,IAAxB,CAA6B,IAA7B,EAAmCP,IAAnC,CAAf;;AAEA,SAAO,EAACI,cAAD,EAASJ,UAAT,EAAP;AACD;;AAED;;;;;;;;AAQO,SAASZ,uBAAT,OAAsE;AAAA,MAApCgB,MAAoC,QAApCA,MAAoC;AAAA,MAA5BC,OAA4B,QAA5BA,OAA4B;AAAA,8BAAnBG,WAAmB;AAAA,MAAnBA,WAAmB,oCAAL,EAAK;;AAC3E,MAAMC,QAAQC,KAAKC,GAAL,CAASH,WAAT,EAAsBH,QAAQJ,MAA9B,CAAd;AACA;AACA,MAAME,SAAS,oBAAM,CAAN,EAASM,KAAT,EAAgB,CAAhB,EAAmBG,GAAnB,CAAuB;AAAA,WAAM,EAAN;AAAA,GAAvB,CAAf;;AAEA;AACAR,SAAOE,OAAP,CAAe,UAACO,KAAD,EAAQC,QAAR,EAAqB;AAClC;AACA,QAAIC,IAAI,CAAR;AACA;AACA,QAAIC,IAAI,CAAR;;AAEA,WAAOA,IAAIP,KAAX,EAAkB;AAChB,UAAIM,KAAKV,QAAQJ,MAAjB,EAAyB;AACvB;AACAE,eAAOa,CAAP,EAAUH,KAAV,IAAmB,IAAnB;AACAG;AACD,OAJD,MAIO,IAAI,mCAAmBX,QAAQU,CAAR,EAAWD,QAAX,CAAnB,CAAJ,EAA8C;AACnDX,eAAOa,CAAP,EAAUH,KAAV,IAAmBR,QAAQU,CAAR,EAAWD,QAAX,CAAnB;AACAE;AACAD;AACD,OAJM,MAIA;AACLA;AACD;AACF;AACF,GAnBD;;AAqBA,SAAOZ,MAAP;AACD;;AAED,SAASD,oBAAT,CAA8BF,IAA9B,EAAoC;AAClC,OAAK,IAAIe,IAAI,CAAb,EAAgBA,IAAIf,KAAKC,MAAzB,EAAiCc,GAAjC,EAAsC;AACpC,SAAK,IAAIC,IAAI,CAAb,EAAgBA,IAAIhB,KAAKe,CAAL,EAAQd,MAA5B,EAAoCe,GAApC,EAAyC;AACvC;AACA;AACA;AACA;AACA,UAAI,CAAChB,KAAKe,CAAL,EAAQC,CAAR,CAAD,IAAenB,UAAUoB,QAAV,CAAmBjB,KAAKe,CAAL,EAAQC,CAAR,CAAnB,CAAnB,EAAmD;AACjDhB,aAAKe,CAAL,EAAQC,CAAR,IAAa,IAAb;AACD;AACF;AACF;AACF;AACD;;;;;;;;AAQO,SAAS3B,uBAAT,CAAiCW,IAAjC,EAAuCa,KAAvC,EAA8CE,CAA9C,EAAiD;AACtD,MAAMG,aAAa,CAAC,GAAD,EAAM,GAAN,CAAnB;;AAEAlB,OAAKM,OAAL,CAAa,eAAO;AAClB,QAAIa,IAAIJ,CAAJ,MAAW,IAAf,EAAqB;AACnB,cAAQF,MAAMO,IAAd;AACE,aAAKC,iCAAgBC,IAArB;AACEH,cAAIJ,CAAJ,IAASQ,WAAWJ,IAAIJ,CAAJ,CAAX,CAAT;AACA;;AAEF;AACA;AACA,aAAKM,iCAAgBG,SAArB;AACEL,cAAIJ,CAAJ,IAASG,WAAWD,QAAX,CAAoBJ,MAAMY,MAA1B,IAAoCC,OAAOP,IAAIJ,CAAJ,CAAP,CAApC,GAAqDI,IAAIJ,CAAJ,CAA9D;AACA;;AAEF,aAAKM,iCAAgBM,OAArB;AACER,cAAIJ,CAAJ,IAASa,SAAST,IAAIJ,CAAJ,CAAT,EAAiB,EAAjB,CAAT;AACA;;AAEF,aAAKM,iCAAgBQ,OAArB;AACE;AACAV,cAAIJ,CAAJ,IAASI,IAAIJ,CAAJ,MAAW,MAAX,IAAqBI,IAAIJ,CAAJ,MAAW,MAAhC,IAA0CI,IAAIJ,CAAJ,MAAW,GAA9D;AACA;;AAEF;AACE;AArBJ;AAuBD;AACF,GA1BD;AA2BD;;AAED;;;;;;;AAOO,SAASzB,iBAAT,CAA2BwC,IAA3B,EAAiCC,UAAjC,EAA6C;AAClD;AACA,MAAMC,WAAWC,uBAASC,cAAT,CAAwBJ,IAAxB,EAA8B,CAC7C,EAACK,OAAO,uBAAR,EAAiCC,UAAU,UAA3C,EAD6C,CAA9B,CAAjB;;AAFkD,8BAM3B7C,sBAAsBwC,UAAtB,CAN2B;AAAA,MAM3CM,YAN2C,yBAM3CA,YAN2C;;AAQlD,SAAON,WAAWO,MAAX,CAAkB,UAACC,YAAD,EAAe1B,KAAf,EAAsB2B,KAAtB,EAAgC;AACvD,QAAMC,OAAOJ,aAAaG,KAAb,CAAb;AACA,QAAME,YAAYV,SAASW,IAAT,CAAc;AAAA,aAAKC,EAAEC,GAAF,KAAUhC,KAAf;AAAA,KAAd,CAAlB;;AAFuD,gBAGhC6B,aAAa,EAHmB;AAAA,QAGhDtB,IAHgD,SAGhDA,IAHgD;AAAA,QAG1CK,MAH0C,SAG1CA,MAH0C;;AAKvDc,iBAAaC,KAAb,IAAsB;AACpBC,gBADoB;AAEpBhB,oBAFoB;;AAIpB;AACA;AACAqB,uBAAiBN,QAAQ,CANL;AAOpBpB,YAAM5B,wBAAwB4B,IAAxB;AAPc,KAAtB;;AAUA,WAAOmB,YAAP;AACD,GAhBM,EAgBJ,EAhBI,CAAP;AAiBD;;AAED;;;;;;;AAOO,SAAShD,qBAAT,CAA+BwC,UAA/B,EAA2C;AAChD,SAAOA,WAAWO,MAAX,CACL,UAACS,IAAD,EAAOlC,KAAP,EAAcE,CAAd,EAAoB;AAAA,QACXiC,QADW,GACCD,IADD,CACXC,QADW;;AAElB,QAAIC,YAAYpC,KAAhB;;AAEA;AACA,QAAImC,SAAS/B,QAAT,CAAkBJ,KAAlB,CAAJ,EAA8B;AAC5B,UAAIqC,UAAU,CAAd;AACA,aAAOF,SAAS/B,QAAT,CAAqBJ,KAArB,SAA8BqC,OAA9B,CAAP,EAAiD;AAC/CA;AACD;AACDD,kBAAepC,KAAf,SAAwBqC,OAAxB;AACD;;AAEDH,SAAKV,YAAL,CAAkBtB,CAAlB,IAAuBkC,SAAvB;AACAF,SAAKC,QAAL,CAAcG,IAAd,CAAmBF,SAAnB;;AAEA,WAAOF,IAAP;AACD,GAlBI,EAmBL,EAACC,UAAU,EAAX,EAAeX,cAAc,EAA7B,EAnBK,CAAP;AAqBD;;AAED;;;;;;AAMA;AACO,SAAS7C,uBAAT,CAAiC4D,KAAjC,EAAwC;AAAA,MAE3CC,IAF2C,GAezCC,wBAfyC,CAE3CD,IAF2C;AAAA,MAG3CE,IAH2C,GAezCD,wBAfyC,CAG3CC,IAH2C;AAAA,MAI3CC,QAJ2C,GAezCF,wBAfyC,CAI3CE,QAJ2C;AAAA,MAK3CC,MAL2C,GAezCH,wBAfyC,CAK3CG,MAL2C;AAAA,MAM3CC,GAN2C,GAezCJ,wBAfyC,CAM3CI,GAN2C;AAAA,MAO3CC,KAP2C,GAezCL,wBAfyC,CAO3CK,KAP2C;AAAA,MAQ3CC,OAR2C,GAezCN,wBAfyC,CAQ3CM,OAR2C;AAAA,MAS3CC,MAT2C,GAezCP,wBAfyC,CAS3CO,MAT2C;AAAA,MAU3CC,IAV2C,GAezCR,wBAfyC,CAU3CQ,IAV2C;AAAA,MAW3CC,QAX2C,GAezCT,wBAfyC,CAW3CS,QAX2C;AAAA,MAY3CC,oBAZ2C,GAezCV,wBAfyC,CAY3CU,oBAZ2C;AAAA,MAa3CC,OAb2C,GAezCX,wBAfyC,CAa3CW,OAb2C;AAAA,MAc3CC,yBAd2C,GAezCZ,wBAfyC,CAc3CY,yBAd2C;;AAiB7C;AACA;;AACA,UAAQd,KAAR;AACE,SAAKC,IAAL;AACE,aAAOhC,iCAAgB8C,IAAvB;AACF,SAAKZ,IAAL;AACA,SAAKC,QAAL;AACE,aAAOnC,iCAAgBG,SAAvB;AACF,SAAKiC,MAAL;AACA,SAAKE,KAAL;AACE,aAAOtC,iCAAgBC,IAAvB;AACF,SAAKoC,GAAL;AACE,aAAOrC,iCAAgBM,OAAvB;AACF,SAAKiC,OAAL;AACE,aAAOvC,iCAAgBQ,OAAvB;AACF,SAAKkC,QAAL;AACA,SAAKC,oBAAL;AACA,SAAKE,yBAAL;AACE,aAAO7C,iCAAgB+C,OAAvB;AACF,SAAKP,MAAL;AACA,SAAKC,IAAL;AACA,SAAKG,OAAL;AACE,aAAO5C,iCAAgBgD,MAAvB;AACF;AACEC,sBAAcC,IAAd,iCAAiDnB,KAAjD;AACA,aAAO/B,iCAAgBgD,MAAvB;AAvBJ;AAyBD;AACD;;AAEA;;;AAGO,SAAS5E,gBAAT,CAA0BK,OAA1B,EAAmC;AACxC,MAAI,CAACA,QAAQG,MAAb,EAAqB;AACnB,WAAO,IAAP;AACD;;AAED,MAAMuE,OAAOC,OAAOD,IAAP,CAAY1E,QAAQ,CAAR,CAAZ,CAAb;AACA,MAAME,OAAOF,QAAQc,GAAR,CAAY;AAAA,WAAK4D,KAAK5D,GAAL,CAAS;AAAA,aAAO8D,EAAE7B,GAAF,CAAP;AAAA,KAAT,CAAL;AAAA,GAAZ,CAAb;AACA,MAAMzC,SAASd,kBAAkBQ,OAAlB,EAA2B0E,IAA3B,CAAf;;AAEA,SAAO;AACLpE,kBADK;AAELJ;AAFK,GAAP;AAID;;AAEM,SAASN,cAAT,CAAwBI,OAAxB,EAAiC;AACtC,MAAM6E,oBAAoB,gCAAU7E,OAAV,CAA1B;;AAEA,MAAI,CAAC6E,iBAAD,IAAsB,CAACC,MAAMC,OAAN,CAAcF,kBAAkBG,QAAhC,CAA3B,EAAsE;AACpE;AACA,WAAO,IAAP;AACD;;AAED;AACA,MAAMzE,UAAUsE,kBAAkBG,QAAlB,CAA2BxC,MAA3B,CAAkC,UAACS,IAAD,EAAOgC,CAAP,EAAUhE,CAAV,EAAgB;AAChE,QAAIgE,EAAEC,QAAN,EAAgB;AACdjC,WAAKI,IAAL;AACE;AACA8B,kBAAUF;AAFZ,SAGMA,EAAEG,UAAF,IAAgB,EAHtB;AAKD;AACD,WAAOnC,IAAP;AACD,GATe,EASb,EATa,CAAhB;;AAWA;AACA,MAAM3C,SAASC,QAAQiC,MAAR,CAAe,UAAC6C,IAAD,EAAOC,IAAP,EAAgB;AAC5CX,WAAOD,IAAP,CAAYY,IAAZ,EAAkB9E,OAAlB,CAA0B,eAAO;AAC/B,UAAI,CAAC6E,KAAKlE,QAAL,CAAc4B,GAAd,CAAL,EAAyB;AACvBsC,aAAKhC,IAAL,CAAUN,GAAV;AACD;AACF,KAJD;AAKA,WAAOsC,IAAP;AACD,GAPc,EAOZ,EAPY,CAAf;;AASA;AACA9E,UAAQC,OAAR,CAAgB,aAAK;AACnBF,WAAOE,OAAP,CAAe,aAAK;AAClB,UAAI,EAAEyE,KAAKL,CAAP,CAAJ,EAAe;AACbA,UAAEK,CAAF,IAAO,IAAP;AACD;AACF,KAJD;AAKD,GAND;;AAQA,SAAOtF,iBAAiBY,OAAjB,CAAP;AACD;;AAED;;;;;AAKO,SAASV,SAAT,CAAmBmC,IAAnB,EAAyB1B,MAAzB,EAAiC;AACtC,MAAMiF,UAAUjF,OAAOQ,GAAP,CAAW;AAAA,WAAKmE,EAAEtC,IAAP;AAAA,GAAX,CAAhB;AACA,MAAM6C,gBAAgB,CAACD,OAAD,CAAtB;;AAEA;AACAvD,OAAKxB,OAAL,CAAa,eAAO;AAClBgF,kBAAcnC,IAAd,CACEhC,IAAIP,GAAJ,CACE,UAAC8D,CAAD,EAAI3D,CAAJ;AAAA,aAAU2D,KAAKa,gCAAenB,OAAf,CAAuBnD,QAAvB,CAAgCb,OAAOW,CAAP,EAAU0B,IAA1C,CAAL,GACR+C,KAAKC,SAAL,CAAef,CAAf,CADQ,GACYA,CADtB;AAAA,KADF,CADF;AAMD,GAPD;;AASA,SAAO,0BAAcY,aAAd,CAAP;AACD;;AAED;;;;AAIO,SAAS1F,iBAAT,CAA2BkC,IAA3B,EAAiC;AACtC;AACA;;;;;;;AAOA,MAAI4D,UAAU,IAAd;AACA,MAAI,CAAC5D,IAAL,EAAW;AACT,0BAAO,qCAAP;AACA4D,cAAU,KAAV;AACD,GAHD,MAGO,IAAI,CAACd,MAAMC,OAAN,CAAc/C,KAAK1B,MAAnB,CAAL,EAAiC;AACtC,0BAAO,mDAAP;AACAsF,cAAU,KAAV;AACD,GAHM,MAGA,IAAI,CAACd,MAAMC,OAAN,CAAc/C,KAAK9B,IAAnB,CAAL,EAA+B;AACpC,0BAAO,iDAAP;AACA0F,cAAU,KAAV;AACD;;AAED,MAAI,CAACA,OAAL,EAAc;AACZ,WAAO,IAAP;AACD;;AAvBqC,MAyB/BtF,MAzB+B,GAyBf0B,IAzBe,CAyB/B1B,MAzB+B;AAAA,MAyBvBJ,IAzBuB,GAyBf8B,IAzBe,CAyBvB9B,IAzBuB;;AA2BtC;;AACA,MAAM2F,WAAWvF,OAAOwF,KAAP,CAAa,UAACb,CAAD,EAAIhE,CAAJ,EAAU;AACtC,QAAI,QAAOgE,CAAP,uDAAOA,CAAP,OAAa,QAAjB,EAA2B;AACzB,iFAA0DA,CAA1D;AACA,aAAO,KAAP;AACD;;AAED,QAAI,CAACA,EAAEtC,IAAP,EAAa;AACX,6EACiD+C,KAAKC,SAAL,CAAeV,CAAf,CADjD;AAGA;AACAA,QAAEtC,IAAF,eAAmB1B,CAAnB;AACD;;AAED,QAAI,CAACM,iCAAgB0D,EAAE3D,IAAlB,CAAL,EAA8B;AAC5B,oDAA6B2D,EAAE3D,IAA/B;AACA,aAAO,KAAP;AACD;;AAED,WAAO2D,EAAE3D,IAAF,IAAU2D,EAAEtD,MAAZ,IAAsBsD,EAAEtC,IAA/B;AACD,GApBgB,CAAjB;;AAsBA,MAAIkD,QAAJ,EAAc;AACZ,WAAO,EAAC3F,UAAD,EAAOI,cAAP,EAAP;AACD;;AAED;AACA;AACA,MAAMyF,aAAazG,wBAAwB,EAACgB,QAAQA,OAAOQ,GAAP,CAAW;AAAA,aAAKmE,EAAEtC,IAAP;AAAA,KAAX,CAAT,EAAkCpC,SAASL,IAA3C,EAAxB,CAAnB;AACA,MAAM+B,aAAa3B,OAAOQ,GAAP,CAAW;AAAA,WAAKmE,EAAEtC,IAAP;AAAA,GAAX,CAAnB;AACA,MAAMqD,OAAOxG,kBAAkBuG,UAAlB,EAA8B9D,UAA9B,CAAb;AACA,MAAMgE,gBAAgB3F,OAAOQ,GAAP,CAAW,UAACmE,CAAD,EAAIhE,CAAJ;AAAA,sCAC5BgE,CAD4B;AAE/B3D,YAAM0E,KAAK/E,CAAL,EAAQK,IAFiB;AAG/BK,cAAQqE,KAAK/E,CAAL,EAAQU;AAHe;AAAA,GAAX,CAAtB;;AAMA,SAAO,EAACrB,QAAQ2F,aAAT,EAAwB/F,UAAxB,EAAP;AACD;;kBAEc;AACbN,gCADa;AAEbP,gCAFa;AAGbM,oCAHa;AAIbD,kDAJa;AAKbF,sCALa;AAMbD;AANa,C","file":"data-processor.js","sourcesContent":["// Copyright (c) 2018 Uber Technologies, Inc.\n//\n// Permission is hereby granted, free of charge, to any person obtaining a copy\n// of this software and associated documentation files (the \"Software\"), to deal\n// in the Software without restriction, including without limitation the rights\n// to use, copy, modify, merge, publish, distribute, sublicense, and/or sell\n// copies of the Software, and to permit persons to whom the Software is\n// furnished to do so, subject to the following conditions:\n//\n// The above copyright notice and this permission notice shall be included in\n// all copies or substantial portions of the Software.\n//\n// THE SOFTWARE IS PROVIDED \"AS IS\", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR\n// IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,\n// FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE\n// AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER\n// LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,\n// OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN\n// THE SOFTWARE.\n\nimport {csvParseRows, csvFormatRows} from 'd3-dsv';\nimport {range} from 'd3-array';\nimport {console as globalConsole} from 'global/window';\nimport assert from 'assert';\nimport {Analyzer, DATA_TYPES as AnalyzerDATA_TYPES} from 'type-analyzer';\nimport normalize from '@mapbox/geojson-normalize';\nimport {ALL_FIELD_TYPES, GEOJSON_FIELDS} from 'constants/default-settings';\nimport {notNullorUndefined} from 'utils/data-utils';\n\n// if any of these value occurs in csv, parse it to null;\nconst CSV_NULLS = ['', 'null', 'NULL', 'Null', 'NaN'];\n\nexport function processCsvData(rawData) {\n\n  // here we assume the csv file that people uploaded will have first row\n  // as name of the column\n  //TODO: add a alert at upload csv to remind define first row\n  const [headerRow, ...rows] = csvParseRows(rawData);\n\n  if (!rows.length || !headerRow) {\n    // looks like an empty file\n    // resolve null, and catch them later in one place\n    return null;\n  }\n\n  cleanUpFalsyCsvValue(rows);\n  // No need to run type detection on every data point\n  // here we get a list of none null values to run analyze on\n  const sample = getSampleForTypeAnalyze({fields: headerRow, allData: rows});\n\n  const fields = getFieldsFromData(sample, headerRow);\n\n  fields.forEach(parseCsvDataByFieldType.bind(null, rows));\n\n  return {fields, rows};\n}\n\n/**\n * get fields from csv data\n *\n * @param {array} fields - an array of fields name\n * @param {array} allData\n * @param {array} sampleCount\n * @returns {array} formatted fields\n */\nexport function getSampleForTypeAnalyze({fields, allData, sampleCount = 50}) {\n  const total = Math.min(sampleCount, allData.length);\n  // const fieldOrder = fields.map(f => f.name);\n  const sample = range(0, total, 1).map(d => ({}));\n\n  // collect sample data for each field\n  fields.forEach((field, fieldIdx) => {\n    // data counter\n    let i = 0;\n    // sample counter\n    let j = 0;\n\n    while (j < total) {\n      if (i >= allData.length) {\n        // if depleted data pool\n        sample[j][field] = null;\n        j++;\n      } else if (notNullorUndefined(allData[i][fieldIdx])) {\n        sample[j][field] = allData[i][fieldIdx];\n        j++;\n        i++;\n      } else {\n        i++;\n      }\n    }\n  });\n\n  return sample;\n}\n\nfunction cleanUpFalsyCsvValue(rows) {\n  for (let i = 0; i < rows.length; i++) {\n    for (let j = 0; j < rows[i].length; j++) {\n      // analyzer will set any fields to 'string' if there are empty values\n      // which will be parsed as '' by d3.csv\n      // here we parse empty data as null\n      // TODO: create warning when deltect `CSV_NULLS` in the data\n      if (!rows[i][j] || CSV_NULLS.includes(rows[i][j])) {\n        rows[i][j] = null;\n      }\n    }\n  }\n}\n/**\n * Process uploaded csv file to parse value by field type\n *\n * @param {array} rows\n * @param {object} field\n * @param {number} i\n * @returns {void}\n */\nexport function parseCsvDataByFieldType(rows, field, i) {\n  const unixFormat = ['x', 'X'];\n\n  rows.forEach(row => {\n    if (row[i] !== null) {\n      switch (field.type) {\n        case ALL_FIELD_TYPES.real:\n          row[i] = parseFloat(row[i]);\n          break;\n\n        // TODO: timestamp can be either '1495827326' or '2016-03-10 11:20'\n        // if it's '1495827326' we pass it to int\n        case ALL_FIELD_TYPES.timestamp:\n          row[i] = unixFormat.includes(field.format) ? Number(row[i]) : row[i];\n          break;\n\n        case ALL_FIELD_TYPES.integer:\n          row[i] = parseInt(row[i], 10);\n          break;\n\n        case ALL_FIELD_TYPES.boolean:\n          // 0 and 1 only field can also be boolean\n          row[i] = row[i] === 'true' || row[i] === 'True' || row[i] === '1';\n          break;\n\n        default:\n          break;\n      }\n    }\n  });\n}\n\n/**\n * get fields from csv data\n *\n * @param {array} data\n * @param {array} fieldOrder\n * @returns {array} formatted fields\n */\nexport function getFieldsFromData(data, fieldOrder) {\n  // add a check for epoch timestamp\n  const metadata = Analyzer.computeColMeta(data, [\n    {regex: /.*geojson|all_points/g, dataType: 'GEOMETRY'}\n  ]);\n\n  const {fieldByIndex} = renameDuplicateFields(fieldOrder);\n\n  return fieldOrder.reduce((orderedArray, field, index) => {\n    const name = fieldByIndex[index];\n    const fieldMeta = metadata.find(m => m.key === field);\n    const {type, format} = fieldMeta || {};\n\n    orderedArray[index] = {\n      name,\n      format,\n\n      // need this for mapbuilder conversion: filter type detection\n      // category,\n      tableFieldIndex: index + 1,\n      type: analyzerTypeToFieldType(type)\n    };\n\n    return orderedArray;\n  }, []);\n}\n\n/**\n * pass in an array of field names, rename duplicated one\n * and return a map from old field index to new name\n *\n * @param {array} fieldOrder\n * @returns {Object} new field name by index\n */\nexport function renameDuplicateFields(fieldOrder) {\n  return fieldOrder.reduce(\n    (accu, field, i) => {\n      const {allNames} = accu;\n      let fieldName = field;\n\n      // add a counter to duplicated names\n      if (allNames.includes(field)) {\n        let counter = 0;\n        while (allNames.includes(`${field}-${counter}`)) {\n          counter++;\n        }\n        fieldName = `${field}-${counter}`;\n      }\n\n      accu.fieldByIndex[i] = fieldName;\n      accu.allNames.push(fieldName);\n\n      return accu;\n    },\n    {allNames: [], fieldByIndex: {}}\n  );\n}\n\n/**\n * Map Analyzer types to local field types\n *\n * @param {string} aType\n * @returns {string} corresponding type in ALL_FIELD_TYPES\n */\n/* eslint-disable complexity */\nexport function analyzerTypeToFieldType(aType) {\n  const {\n    DATE,\n    TIME,\n    DATETIME,\n    NUMBER,\n    INT,\n    FLOAT,\n    BOOLEAN,\n    STRING,\n    CITY,\n    GEOMETRY,\n    GEOMETRY_FROM_STRING,\n    ZIPCODE,\n    PAIR_GEOMETRY_FROM_STRING\n  } = AnalyzerDATA_TYPES;\n\n  // TODO: un recognized types\n  // CURRENCY PERCENT NONE\n  switch (aType) {\n    case DATE:\n      return ALL_FIELD_TYPES.date;\n    case TIME:\n    case DATETIME:\n      return ALL_FIELD_TYPES.timestamp;\n    case NUMBER:\n    case FLOAT:\n      return ALL_FIELD_TYPES.real;\n    case INT:\n      return ALL_FIELD_TYPES.integer;\n    case BOOLEAN:\n      return ALL_FIELD_TYPES.boolean;\n    case GEOMETRY:\n    case GEOMETRY_FROM_STRING:\n    case PAIR_GEOMETRY_FROM_STRING:\n      return ALL_FIELD_TYPES.geojson;\n    case STRING:\n    case CITY:\n    case ZIPCODE:\n      return ALL_FIELD_TYPES.string;\n    default:\n      globalConsole.warn(`Unsupported analyzer type: ${aType}`);\n      return ALL_FIELD_TYPES.string;\n  }\n}\n/* eslint-enable complexity */\n\n/*\n * Process rawData where each row is an object\n */\nexport function processRowObject(rawData) {\n  if (!rawData.length) {\n    return null;\n  }\n\n  const keys = Object.keys(rawData[0]);\n  const rows = rawData.map(d => keys.map(key => d[key]));\n  const fields = getFieldsFromData(rawData, keys);\n\n  return {\n    fields,\n    rows\n  };\n}\n\nexport function processGeojson(rawData) {\n  const normalizedGeojson = normalize(rawData);\n\n  if (!normalizedGeojson || !Array.isArray(normalizedGeojson.features)) {\n    // fail to normalize geojson\n    return null;\n  }\n\n  // getting all feature fields\n  const allData = normalizedGeojson.features.reduce((accu, f, i) => {\n    if (f.geometry) {\n      accu.push({\n        // add feature to _geojson field\n        _geojson: f,\n        ...(f.properties || {})\n      });\n    }\n    return accu;\n  }, []);\n\n  // get all the field\n  const fields = allData.reduce((prev, curr) => {\n    Object.keys(curr).forEach(key => {\n      if (!prev.includes(key)) {\n        prev.push(key);\n      }\n    });\n    return prev;\n  }, []);\n\n  // make sure each feature has exact same fields\n  allData.forEach(d => {\n    fields.forEach(f => {\n      if (!(f in d)) {\n        d[f] = null;\n      }\n    });\n  });\n\n  return processRowObject(allData);\n}\n\n/**\n * On export data to csv\n * @param data\n * @param fields\n */\nexport function formatCsv(data, fields) {\n  const columns = fields.map(f => f.name);\n  const formattedData = [columns];\n\n  // parse geojson object as string\n  data.forEach(row => {\n    formattedData.push(\n      row.map(\n        (d, i) => d && GEOJSON_FIELDS.geojson.includes(fields[i].name) ?\n          JSON.stringify(d) : d\n      )\n    )\n  });\n\n  return csvFormatRows(formattedData);\n}\n\n/**\n * @param data\n * @returns {{allData: Array, fields: Array}}\n */\nexport function validateInputData(data) {\n  // TODO: add test\n  /*\n   * expected input data format\n   * {\n   *   fields: [],\n   *   rows: []\n   * }\n   */\n  let proceed = true;\n  if (!data) {\n    assert('receiveVisData: data cannot be null');\n    proceed = false;\n  } else if (!Array.isArray(data.fields)) {\n    assert('receiveVisData: expect data.fields to be an array');\n    proceed = false;\n  } else if (!Array.isArray(data.rows)) {\n    assert('receiveVisData: expect data.rows to be an array');\n    proceed = false;\n  }\n\n  if (!proceed) {\n    return null;\n  }\n\n  const {fields, rows} = data;\n\n  // check if all fields has name, format and type\n  const allValid = fields.every((f, i) => {\n    if (typeof f !== 'object') {\n      assert(`fields needs to be an array of object, but find ${f}`);\n      return false;\n    }\n\n    if (!f.name) {\n      assert(\n        `field.name is required but missing in field ${JSON.stringify(f)}`\n      );\n      // assign a name\n      f.name = `column_${i}`;\n    }\n\n    if (!ALL_FIELD_TYPES[f.type]) {\n      assert(`unknown field type ${f.type}`);\n      return false;\n    }\n\n    return f.type && f.format && f.name;\n  });\n\n  if (allValid) {\n    return {rows, fields};\n  }\n\n  // if any field has missing type, recalculate it for everyone\n  // because we simply lost faith in humanity\n  const sampleData = getSampleForTypeAnalyze({fields: fields.map(f => f.name), allData: rows});\n  const fieldOrder = fields.map(f => f.name);\n  const meta = getFieldsFromData(sampleData, fieldOrder);\n  const updatedFields = fields.map((f, i) => ({\n    ...f,\n    type: meta[i].type,\n    format: meta[i].format\n  }));\n\n  return {fields: updatedFields, rows};\n}\n\nexport default {\n  processGeojson,\n  processCsvData,\n  processRowObject,\n  analyzerTypeToFieldType,\n  getFieldsFromData,\n  parseCsvDataByFieldType\n};\n"]}