kepler.gl
Version:
kepler.gl is a webgl based application to visualize large scale location data in the browser
489 lines (411 loc) • 42.7 kB
JavaScript
Object.defineProperty(exports, "__esModule", {
value: true
});
var _typeof2 = require('babel-runtime/helpers/typeof');
var _typeof3 = _interopRequireDefault(_typeof2);
var _extends2 = require('babel-runtime/helpers/extends');
var _extends3 = _interopRequireDefault(_extends2);
var _toArray2 = require('babel-runtime/helpers/toArray');
var _toArray3 = _interopRequireDefault(_toArray2);
exports.processCsvData = processCsvData;
exports.getSampleForTypeAnalyze = getSampleForTypeAnalyze;
exports.parseCsvDataByFieldType = parseCsvDataByFieldType;
exports.getFieldsFromData = getFieldsFromData;
exports.renameDuplicateFields = renameDuplicateFields;
exports.analyzerTypeToFieldType = analyzerTypeToFieldType;
exports.processRowObject = processRowObject;
exports.processGeojson = processGeojson;
exports.formatCsv = formatCsv;
exports.validateInputData = validateInputData;
var _d3Dsv = require('d3-dsv');
var _d3Array = require('d3-array');
var _window = require('global/window');
var _assert = require('assert');
var _assert2 = _interopRequireDefault(_assert);
var _typeAnalyzer = require('type-analyzer');
var _geojsonNormalize = require('@mapbox/geojson-normalize');
var _geojsonNormalize2 = _interopRequireDefault(_geojsonNormalize);
var _defaultSettings = require('../constants/default-settings');
var _dataUtils = require('../utils/data-utils');
function _interopRequireDefault(obj) { return obj && obj.__esModule ? obj : { default: obj }; }
// if any of these value occurs in csv, parse it to null;
// Copyright (c) 2018 Uber Technologies, Inc.
//
// Permission is hereby granted, free of charge, to any person obtaining a copy
// of this software and associated documentation files (the "Software"), to deal
// in the Software without restriction, including without limitation the rights
// to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
// copies of the Software, and to permit persons to whom the Software is
// furnished to do so, subject to the following conditions:
//
// The above copyright notice and this permission notice shall be included in
// all copies or substantial portions of the Software.
//
// THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
// IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
// FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
// AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
// LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
// OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
// THE SOFTWARE.
var CSV_NULLS = ['', 'null', 'NULL', 'Null', 'NaN'];
function processCsvData(rawData) {
// here we assume the csv file that people uploaded will have first row
// as name of the column
var _csvParseRows = (0, _d3Dsv.csvParseRows)(rawData),
_csvParseRows2 = (0, _toArray3.default)(_csvParseRows),
headerRow = _csvParseRows2[0],
rows = _csvParseRows2.slice(1);
if (!rows.length || !headerRow) {
// looks like an empty file
// resolve null, and catch them later in one place
return null;
}
cleanUpFalsyCsvValue(rows);
// No need to run type detection on every data point
// here we get a list of none null values to run analyze on
var sample = getSampleForTypeAnalyze({ fields: headerRow, allData: rows });
var fields = getFieldsFromData(sample, headerRow);
fields.forEach(parseCsvDataByFieldType.bind(null, rows));
return { fields: fields, rows: rows };
}
/**
* get fields from csv data
*
* @param {array} fields - an array of fields name
* @param {array} allData
* @param {array} sampleCount
* @returns {array} formatted fields
*/
function getSampleForTypeAnalyze(_ref) {
var fields = _ref.fields,
allData = _ref.allData,
_ref$sampleCount = _ref.sampleCount,
sampleCount = _ref$sampleCount === undefined ? 50 : _ref$sampleCount;
var total = Math.min(sampleCount, allData.length);
// const fieldOrder = fields.map(f => f.name);
var sample = (0, _d3Array.range)(0, total, 1).map(function (d) {
return {};
});
// collect sample data for each field
fields.forEach(function (field, fieldIdx) {
// data counter
var i = 0;
// sample counter
var j = 0;
while (j < total) {
if (i >= allData.length) {
// if depleted data pool
sample[j][field] = null;
j++;
} else if ((0, _dataUtils.notNullorUndefined)(allData[i][fieldIdx])) {
sample[j][field] = allData[i][fieldIdx];
j++;
i++;
} else {
i++;
}
}
});
return sample;
}
function cleanUpFalsyCsvValue(rows) {
for (var i = 0; i < rows.length; i++) {
for (var j = 0; j < rows[i].length; j++) {
// analyzer will set any fields to 'string' if there are empty values
// which will be parsed as '' by d3.csv
// here we parse empty data as null
// TODO: create warning when deltect `CSV_NULLS` in the data
if (!rows[i][j] || CSV_NULLS.includes(rows[i][j])) {
rows[i][j] = null;
}
}
}
}
/**
* Process uploaded csv file to parse value by field type
*
* @param {array} rows
* @param {object} field
* @param {number} i
* @returns {void}
*/
function parseCsvDataByFieldType(rows, field, i) {
var unixFormat = ['x', 'X'];
rows.forEach(function (row) {
if (row[i] !== null) {
switch (field.type) {
case _defaultSettings.ALL_FIELD_TYPES.real:
row[i] = parseFloat(row[i]);
break;
// TODO: timestamp can be either '1495827326' or '2016-03-10 11:20'
// if it's '1495827326' we pass it to int
case _defaultSettings.ALL_FIELD_TYPES.timestamp:
row[i] = unixFormat.includes(field.format) ? Number(row[i]) : row[i];
break;
case _defaultSettings.ALL_FIELD_TYPES.integer:
row[i] = parseInt(row[i], 10);
break;
case _defaultSettings.ALL_FIELD_TYPES.boolean:
// 0 and 1 only field can also be boolean
row[i] = row[i] === 'true' || row[i] === 'True' || row[i] === '1';
break;
default:
break;
}
}
});
}
/**
* get fields from csv data
*
* @param {array} data
* @param {array} fieldOrder
* @returns {array} formatted fields
*/
function getFieldsFromData(data, fieldOrder) {
// add a check for epoch timestamp
var metadata = _typeAnalyzer.Analyzer.computeColMeta(data, [{ regex: /.*geojson|all_points/g, dataType: 'GEOMETRY' }]);
var _renameDuplicateField = renameDuplicateFields(fieldOrder),
fieldByIndex = _renameDuplicateField.fieldByIndex;
return fieldOrder.reduce(function (orderedArray, field, index) {
var name = fieldByIndex[index];
var fieldMeta = metadata.find(function (m) {
return m.key === field;
});
var _ref2 = fieldMeta || {},
type = _ref2.type,
format = _ref2.format;
orderedArray[index] = {
name: name,
format: format,
// need this for mapbuilder conversion: filter type detection
// category,
tableFieldIndex: index + 1,
type: analyzerTypeToFieldType(type)
};
return orderedArray;
}, []);
}
/**
* pass in an array of field names, rename duplicated one
* and return a map from old field index to new name
*
* @param {array} fieldOrder
* @returns {Object} new field name by index
*/
function renameDuplicateFields(fieldOrder) {
return fieldOrder.reduce(function (accu, field, i) {
var allNames = accu.allNames;
var fieldName = field;
// add a counter to duplicated names
if (allNames.includes(field)) {
var counter = 0;
while (allNames.includes(field + '-' + counter)) {
counter++;
}
fieldName = field + '-' + counter;
}
accu.fieldByIndex[i] = fieldName;
accu.allNames.push(fieldName);
return accu;
}, { allNames: [], fieldByIndex: {} });
}
/**
* Map Analyzer types to local field types
*
* @param {string} aType
* @returns {string} corresponding type in ALL_FIELD_TYPES
*/
/* eslint-disable complexity */
function analyzerTypeToFieldType(aType) {
var DATE = _typeAnalyzer.DATA_TYPES.DATE,
TIME = _typeAnalyzer.DATA_TYPES.TIME,
DATETIME = _typeAnalyzer.DATA_TYPES.DATETIME,
NUMBER = _typeAnalyzer.DATA_TYPES.NUMBER,
INT = _typeAnalyzer.DATA_TYPES.INT,
FLOAT = _typeAnalyzer.DATA_TYPES.FLOAT,
BOOLEAN = _typeAnalyzer.DATA_TYPES.BOOLEAN,
STRING = _typeAnalyzer.DATA_TYPES.STRING,
CITY = _typeAnalyzer.DATA_TYPES.CITY,
GEOMETRY = _typeAnalyzer.DATA_TYPES.GEOMETRY,
GEOMETRY_FROM_STRING = _typeAnalyzer.DATA_TYPES.GEOMETRY_FROM_STRING,
ZIPCODE = _typeAnalyzer.DATA_TYPES.ZIPCODE,
PAIR_GEOMETRY_FROM_STRING = _typeAnalyzer.DATA_TYPES.PAIR_GEOMETRY_FROM_STRING;
// TODO: un recognized types
// CURRENCY PERCENT NONE
switch (aType) {
case DATE:
return _defaultSettings.ALL_FIELD_TYPES.date;
case TIME:
case DATETIME:
return _defaultSettings.ALL_FIELD_TYPES.timestamp;
case NUMBER:
case FLOAT:
return _defaultSettings.ALL_FIELD_TYPES.real;
case INT:
return _defaultSettings.ALL_FIELD_TYPES.integer;
case BOOLEAN:
return _defaultSettings.ALL_FIELD_TYPES.boolean;
case GEOMETRY:
case GEOMETRY_FROM_STRING:
case PAIR_GEOMETRY_FROM_STRING:
return _defaultSettings.ALL_FIELD_TYPES.geojson;
case STRING:
case CITY:
case ZIPCODE:
return _defaultSettings.ALL_FIELD_TYPES.string;
default:
_window.console.warn('Unsupported analyzer type: ' + aType);
return _defaultSettings.ALL_FIELD_TYPES.string;
}
}
/* eslint-enable complexity */
/*
* Process rawData where each row is an object
*/
function processRowObject(rawData) {
if (!rawData.length) {
return null;
}
var keys = Object.keys(rawData[0]);
var rows = rawData.map(function (d) {
return keys.map(function (key) {
return d[key];
});
});
var fields = getFieldsFromData(rawData, keys);
return {
fields: fields,
rows: rows
};
}
function processGeojson(rawData) {
var normalizedGeojson = (0, _geojsonNormalize2.default)(rawData);
if (!normalizedGeojson || !Array.isArray(normalizedGeojson.features)) {
// fail to normalize geojson
return null;
}
// getting all feature fields
var allData = normalizedGeojson.features.reduce(function (accu, f, i) {
if (f.geometry) {
accu.push((0, _extends3.default)({
// add feature to _geojson field
_geojson: f
}, f.properties || {}));
}
return accu;
}, []);
// get all the field
var fields = allData.reduce(function (prev, curr) {
Object.keys(curr).forEach(function (key) {
if (!prev.includes(key)) {
prev.push(key);
}
});
return prev;
}, []);
// make sure each feature has exact same fields
allData.forEach(function (d) {
fields.forEach(function (f) {
if (!(f in d)) {
d[f] = null;
}
});
});
return processRowObject(allData);
}
/**
* On export data to csv
* @param data
* @param fields
*/
function formatCsv(data, fields) {
var columns = fields.map(function (f) {
return f.name;
});
var formattedData = [columns];
// parse geojson object as string
data.forEach(function (row) {
formattedData.push(row.map(function (d, i) {
return d && _defaultSettings.GEOJSON_FIELDS.geojson.includes(fields[i].name) ? JSON.stringify(d) : d;
}));
});
return (0, _d3Dsv.csvFormatRows)(formattedData);
}
/**
* @param data
* @returns {{allData: Array, fields: Array}}
*/
function validateInputData(data) {
// TODO: add test
/*
* expected input data format
* {
* fields: [],
* rows: []
* }
*/
var proceed = true;
if (!data) {
(0, _assert2.default)('receiveVisData: data cannot be null');
proceed = false;
} else if (!Array.isArray(data.fields)) {
(0, _assert2.default)('receiveVisData: expect data.fields to be an array');
proceed = false;
} else if (!Array.isArray(data.rows)) {
(0, _assert2.default)('receiveVisData: expect data.rows to be an array');
proceed = false;
}
if (!proceed) {
return null;
}
var fields = data.fields,
rows = data.rows;
// check if all fields has name, format and type
var allValid = fields.every(function (f, i) {
if ((typeof f === 'undefined' ? 'undefined' : (0, _typeof3.default)(f)) !== 'object') {
(0, _assert2.default)('fields needs to be an array of object, but find ' + f);
return false;
}
if (!f.name) {
(0, _assert2.default)('field.name is required but missing in field ' + JSON.stringify(f));
// assign a name
f.name = 'column_' + i;
}
if (!_defaultSettings.ALL_FIELD_TYPES[f.type]) {
(0, _assert2.default)('unknown field type ' + f.type);
return false;
}
return f.type && f.format && f.name;
});
if (allValid) {
return { rows: rows, fields: fields };
}
// if any field has missing type, recalculate it for everyone
// because we simply lost faith in humanity
var sampleData = getSampleForTypeAnalyze({ fields: fields.map(function (f) {
return f.name;
}), allData: rows });
var fieldOrder = fields.map(function (f) {
return f.name;
});
var meta = getFieldsFromData(sampleData, fieldOrder);
var updatedFields = fields.map(function (f, i) {
return (0, _extends3.default)({}, f, {
type: meta[i].type,
format: meta[i].format
});
});
return { fields: updatedFields, rows: rows };
}
exports.default = {
processGeojson: processGeojson,
processCsvData: processCsvData,
processRowObject: processRowObject,
analyzerTypeToFieldType: analyzerTypeToFieldType,
getFieldsFromData: getFieldsFromData,
parseCsvDataByFieldType: parseCsvDataByFieldType
};
//# sourceMappingURL=data:application/json;charset=utf-8;base64,{"version":3,"sources":["../../src/processors/data-processor.js"],"names":["processCsvData","getSampleForTypeAnalyze","parseCsvDataByFieldType","getFieldsFromData","renameDuplicateFields","analyzerTypeToFieldType","processRowObject","processGeojson","formatCsv","validateInputData","CSV_NULLS","rawData","headerRow","rows","length","cleanUpFalsyCsvValue","sample","fields","allData","forEach","bind","sampleCount","total","Math","min","map","field","fieldIdx","i","j","includes","unixFormat","row","type","ALL_FIELD_TYPES","real","parseFloat","timestamp","format","Number","integer","parseInt","boolean","data","fieldOrder","metadata","Analyzer","computeColMeta","regex","dataType","fieldByIndex","reduce","orderedArray","index","name","fieldMeta","find","m","key","tableFieldIndex","accu","allNames","fieldName","counter","push","aType","DATE","AnalyzerDATA_TYPES","TIME","DATETIME","NUMBER","INT","FLOAT","BOOLEAN","STRING","CITY","GEOMETRY","GEOMETRY_FROM_STRING","ZIPCODE","PAIR_GEOMETRY_FROM_STRING","date","geojson","string","globalConsole","warn","keys","Object","d","normalizedGeojson","Array","isArray","features","f","geometry","_geojson","properties","prev","curr","columns","formattedData","GEOJSON_FIELDS","JSON","stringify","proceed","allValid","every","sampleData","meta","updatedFields"],"mappings":";;;;;;;;;;;;;;;;;;QAgCgBA,c,GAAAA,c;QAiCAC,uB,GAAAA,uB;QAmDAC,uB,GAAAA,uB;QAuCAC,iB,GAAAA,iB;QAkCAC,qB,GAAAA,qB;QA+BAC,uB,GAAAA,uB;QAkDAC,gB,GAAAA,gB;QAeAC,c,GAAAA,c;QA+CAC,S,GAAAA,S;QAqBAC,iB,GAAAA,iB;;AA7UhB;;AACA;;AACA;;AACA;;;;AACA;;AACA;;;;AACA;;AACA;;;;AAEA;AA7BA;AACA;AACA;AACA;AACA;AACA;AACA;AACA;AACA;AACA;AACA;AACA;AACA;AACA;AACA;AACA;AACA;AACA;AACA;;AAYA,IAAMC,YAAY,CAAC,EAAD,EAAK,MAAL,EAAa,MAAb,EAAqB,MAArB,EAA6B,KAA7B,CAAlB;;AAEO,SAASV,cAAT,CAAwBW,OAAxB,EAAiC;;AAEtC;AACA;AAHsC,sBAKT,yBAAaA,OAAb,CALS;AAAA;AAAA,MAK/BC,SAL+B;AAAA,MAKjBC,IALiB;;AAOtC,MAAI,CAACA,KAAKC,MAAN,IAAgB,CAACF,SAArB,EAAgC;AAC9B;AACA;AACA,WAAO,IAAP;AACD;;AAEDG,uBAAqBF,IAArB;AACA;AACA;AACA,MAAMG,SAASf,wBAAwB,EAACgB,QAAQL,SAAT,EAAoBM,SAASL,IAA7B,EAAxB,CAAf;;AAEA,MAAMI,SAASd,kBAAkBa,MAAlB,EAA0BJ,SAA1B,CAAf;;AAEAK,SAAOE,OAAP,CAAejB,wBAAwBkB,IAAxB,CAA6B,IAA7B,EAAmCP,IAAnC,CAAf;;AAEA,SAAO,EAACI,cAAD,EAASJ,UAAT,EAAP;AACD;;AAED;;;;;;;;AAQO,SAASZ,uBAAT,OAAsE;AAAA,MAApCgB,MAAoC,QAApCA,MAAoC;AAAA,MAA5BC,OAA4B,QAA5BA,OAA4B;AAAA,8BAAnBG,WAAmB;AAAA,MAAnBA,WAAmB,oCAAL,EAAK;;AAC3E,MAAMC,QAAQC,KAAKC,GAAL,CAASH,WAAT,EAAsBH,QAAQJ,MAA9B,CAAd;AACA;AACA,MAAME,SAAS,oBAAM,CAAN,EAASM,KAAT,EAAgB,CAAhB,EAAmBG,GAAnB,CAAuB;AAAA,WAAM,EAAN;AAAA,GAAvB,CAAf;;AAEA;AACAR,SAAOE,OAAP,CAAe,UAACO,KAAD,EAAQC,QAAR,EAAqB;AAClC;AACA,QAAIC,IAAI,CAAR;AACA;AACA,QAAIC,IAAI,CAAR;;AAEA,WAAOA,IAAIP,KAAX,EAAkB;AAChB,UAAIM,KAAKV,QAAQJ,MAAjB,EAAyB;AACvB;AACAE,eAAOa,CAAP,EAAUH,KAAV,IAAmB,IAAnB;AACAG;AACD,OAJD,MAIO,IAAI,mCAAmBX,QAAQU,CAAR,EAAWD,QAAX,CAAnB,CAAJ,EAA8C;AACnDX,eAAOa,CAAP,EAAUH,KAAV,IAAmBR,QAAQU,CAAR,EAAWD,QAAX,CAAnB;AACAE;AACAD;AACD,OAJM,MAIA;AACLA;AACD;AACF;AACF,GAnBD;;AAqBA,SAAOZ,MAAP;AACD;;AAED,SAASD,oBAAT,CAA8BF,IAA9B,EAAoC;AAClC,OAAK,IAAIe,IAAI,CAAb,EAAgBA,IAAIf,KAAKC,MAAzB,EAAiCc,GAAjC,EAAsC;AACpC,SAAK,IAAIC,IAAI,CAAb,EAAgBA,IAAIhB,KAAKe,CAAL,EAAQd,MAA5B,EAAoCe,GAApC,EAAyC;AACvC;AACA;AACA;AACA;AACA,UAAI,CAAChB,KAAKe,CAAL,EAAQC,CAAR,CAAD,IAAenB,UAAUoB,QAAV,CAAmBjB,KAAKe,CAAL,EAAQC,CAAR,CAAnB,CAAnB,EAAmD;AACjDhB,aAAKe,CAAL,EAAQC,CAAR,IAAa,IAAb;AACD;AACF;AACF;AACF;AACD;;;;;;;;AAQO,SAAS3B,uBAAT,CAAiCW,IAAjC,EAAuCa,KAAvC,EAA8CE,CAA9C,EAAiD;AACtD,MAAMG,aAAa,CAAC,GAAD,EAAM,GAAN,CAAnB;;AAEAlB,OAAKM,OAAL,CAAa,eAAO;AAClB,QAAIa,IAAIJ,CAAJ,MAAW,IAAf,EAAqB;AACnB,cAAQF,MAAMO,IAAd;AACE,aAAKC,iCAAgBC,IAArB;AACEH,cAAIJ,CAAJ,IAASQ,WAAWJ,IAAIJ,CAAJ,CAAX,CAAT;AACA;;AAEF;AACA;AACA,aAAKM,iCAAgBG,SAArB;AACEL,cAAIJ,CAAJ,IAASG,WAAWD,QAAX,CAAoBJ,MAAMY,MAA1B,IAAoCC,OAAOP,IAAIJ,CAAJ,CAAP,CAApC,GAAqDI,IAAIJ,CAAJ,CAA9D;AACA;;AAEF,aAAKM,iCAAgBM,OAArB;AACER,cAAIJ,CAAJ,IAASa,SAAST,IAAIJ,CAAJ,CAAT,EAAiB,EAAjB,CAAT;AACA;;AAEF,aAAKM,iCAAgBQ,OAArB;AACE;AACAV,cAAIJ,CAAJ,IAASI,IAAIJ,CAAJ,MAAW,MAAX,IAAqBI,IAAIJ,CAAJ,MAAW,MAAhC,IAA0CI,IAAIJ,CAAJ,MAAW,GAA9D;AACA;;AAEF;AACE;AArBJ;AAuBD;AACF,GA1BD;AA2BD;;AAED;;;;;;;AAOO,SAASzB,iBAAT,CAA2BwC,IAA3B,EAAiCC,UAAjC,EAA6C;AAClD;AACA,MAAMC,WAAWC,uBAASC,cAAT,CAAwBJ,IAAxB,EAA8B,CAC7C,EAACK,OAAO,uBAAR,EAAiCC,UAAU,UAA3C,EAD6C,CAA9B,CAAjB;;AAFkD,8BAM3B7C,sBAAsBwC,UAAtB,CAN2B;AAAA,MAM3CM,YAN2C,yBAM3CA,YAN2C;;AAQlD,SAAON,WAAWO,MAAX,CAAkB,UAACC,YAAD,EAAe1B,KAAf,EAAsB2B,KAAtB,EAAgC;AACvD,QAAMC,OAAOJ,aAAaG,KAAb,CAAb;AACA,QAAME,YAAYV,SAASW,IAAT,CAAc;AAAA,aAAKC,EAAEC,GAAF,KAAUhC,KAAf;AAAA,KAAd,CAAlB;;AAFuD,gBAGhC6B,aAAa,EAHmB;AAAA,QAGhDtB,IAHgD,SAGhDA,IAHgD;AAAA,QAG1CK,MAH0C,SAG1CA,MAH0C;;AAKvDc,iBAAaC,KAAb,IAAsB;AACpBC,gBADoB;AAEpBhB,oBAFoB;;AAIpB;AACA;AACAqB,uBAAiBN,QAAQ,CANL;AAOpBpB,YAAM5B,wBAAwB4B,IAAxB;AAPc,KAAtB;;AAUA,WAAOmB,YAAP;AACD,GAhBM,EAgBJ,EAhBI,CAAP;AAiBD;;AAED;;;;;;;AAOO,SAAShD,qBAAT,CAA+BwC,UAA/B,EAA2C;AAChD,SAAOA,WAAWO,MAAX,CACL,UAACS,IAAD,EAAOlC,KAAP,EAAcE,CAAd,EAAoB;AAAA,QACXiC,QADW,GACCD,IADD,CACXC,QADW;;AAElB,QAAIC,YAAYpC,KAAhB;;AAEA;AACA,QAAImC,SAAS/B,QAAT,CAAkBJ,KAAlB,CAAJ,EAA8B;AAC5B,UAAIqC,UAAU,CAAd;AACA,aAAOF,SAAS/B,QAAT,CAAqBJ,KAArB,SAA8BqC,OAA9B,CAAP,EAAiD;AAC/CA;AACD;AACDD,kBAAepC,KAAf,SAAwBqC,OAAxB;AACD;;AAEDH,SAAKV,YAAL,CAAkBtB,CAAlB,IAAuBkC,SAAvB;AACAF,SAAKC,QAAL,CAAcG,IAAd,CAAmBF,SAAnB;;AAEA,WAAOF,IAAP;AACD,GAlBI,EAmBL,EAACC,UAAU,EAAX,EAAeX,cAAc,EAA7B,EAnBK,CAAP;AAqBD;;AAED;;;;;;AAMA;AACO,SAAS7C,uBAAT,CAAiC4D,KAAjC,EAAwC;AAAA,MAE3CC,IAF2C,GAezCC,wBAfyC,CAE3CD,IAF2C;AAAA,MAG3CE,IAH2C,GAezCD,wBAfyC,CAG3CC,IAH2C;AAAA,MAI3CC,QAJ2C,GAezCF,wBAfyC,CAI3CE,QAJ2C;AAAA,MAK3CC,MAL2C,GAezCH,wBAfyC,CAK3CG,MAL2C;AAAA,MAM3CC,GAN2C,GAezCJ,wBAfyC,CAM3CI,GAN2C;AAAA,MAO3CC,KAP2C,GAezCL,wBAfyC,CAO3CK,KAP2C;AAAA,MAQ3CC,OAR2C,GAezCN,wBAfyC,CAQ3CM,OAR2C;AAAA,MAS3CC,MAT2C,GAezCP,wBAfyC,CAS3CO,MAT2C;AAAA,MAU3CC,IAV2C,GAezCR,wBAfyC,CAU3CQ,IAV2C;AAAA,MAW3CC,QAX2C,GAezCT,wBAfyC,CAW3CS,QAX2C;AAAA,MAY3CC,oBAZ2C,GAezCV,wBAfyC,CAY3CU,oBAZ2C;AAAA,MAa3CC,OAb2C,GAezCX,wBAfyC,CAa3CW,OAb2C;AAAA,MAc3CC,yBAd2C,GAezCZ,wBAfyC,CAc3CY,yBAd2C;;AAiB7C;AACA;;AACA,UAAQd,KAAR;AACE,SAAKC,IAAL;AACE,aAAOhC,iCAAgB8C,IAAvB;AACF,SAAKZ,IAAL;AACA,SAAKC,QAAL;AACE,aAAOnC,iCAAgBG,SAAvB;AACF,SAAKiC,MAAL;AACA,SAAKE,KAAL;AACE,aAAOtC,iCAAgBC,IAAvB;AACF,SAAKoC,GAAL;AACE,aAAOrC,iCAAgBM,OAAvB;AACF,SAAKiC,OAAL;AACE,aAAOvC,iCAAgBQ,OAAvB;AACF,SAAKkC,QAAL;AACA,SAAKC,oBAAL;AACA,SAAKE,yBAAL;AACE,aAAO7C,iCAAgB+C,OAAvB;AACF,SAAKP,MAAL;AACA,SAAKC,IAAL;AACA,SAAKG,OAAL;AACE,aAAO5C,iCAAgBgD,MAAvB;AACF;AACEC,sBAAcC,IAAd,iCAAiDnB,KAAjD;AACA,aAAO/B,iCAAgBgD,MAAvB;AAvBJ;AAyBD;AACD;;AAEA;;;AAGO,SAAS5E,gBAAT,CAA0BK,OAA1B,EAAmC;AACxC,MAAI,CAACA,QAAQG,MAAb,EAAqB;AACnB,WAAO,IAAP;AACD;;AAED,MAAMuE,OAAOC,OAAOD,IAAP,CAAY1E,QAAQ,CAAR,CAAZ,CAAb;AACA,MAAME,OAAOF,QAAQc,GAAR,CAAY;AAAA,WAAK4D,KAAK5D,GAAL,CAAS;AAAA,aAAO8D,EAAE7B,GAAF,CAAP;AAAA,KAAT,CAAL;AAAA,GAAZ,CAAb;AACA,MAAMzC,SAASd,kBAAkBQ,OAAlB,EAA2B0E,IAA3B,CAAf;;AAEA,SAAO;AACLpE,kBADK;AAELJ;AAFK,GAAP;AAID;;AAEM,SAASN,cAAT,CAAwBI,OAAxB,EAAiC;AACtC,MAAM6E,oBAAoB,gCAAU7E,OAAV,CAA1B;;AAEA,MAAI,CAAC6E,iBAAD,IAAsB,CAACC,MAAMC,OAAN,CAAcF,kBAAkBG,QAAhC,CAA3B,EAAsE;AACpE;AACA,WAAO,IAAP;AACD;;AAED;AACA,MAAMzE,UAAUsE,kBAAkBG,QAAlB,CAA2BxC,MAA3B,CAAkC,UAACS,IAAD,EAAOgC,CAAP,EAAUhE,CAAV,EAAgB;AAChE,QAAIgE,EAAEC,QAAN,EAAgB;AACdjC,WAAKI,IAAL;AACE;AACA8B,kBAAUF;AAFZ,SAGMA,EAAEG,UAAF,IAAgB,EAHtB;AAKD;AACD,WAAOnC,IAAP;AACD,GATe,EASb,EATa,CAAhB;;AAWA;AACA,MAAM3C,SAASC,QAAQiC,MAAR,CAAe,UAAC6C,IAAD,EAAOC,IAAP,EAAgB;AAC5CX,WAAOD,IAAP,CAAYY,IAAZ,EAAkB9E,OAAlB,CAA0B,eAAO;AAC/B,UAAI,CAAC6E,KAAKlE,QAAL,CAAc4B,GAAd,CAAL,EAAyB;AACvBsC,aAAKhC,IAAL,CAAUN,GAAV;AACD;AACF,KAJD;AAKA,WAAOsC,IAAP;AACD,GAPc,EAOZ,EAPY,CAAf;;AASA;AACA9E,UAAQC,OAAR,CAAgB,aAAK;AACnBF,WAAOE,OAAP,CAAe,aAAK;AAClB,UAAI,EAAEyE,KAAKL,CAAP,CAAJ,EAAe;AACbA,UAAEK,CAAF,IAAO,IAAP;AACD;AACF,KAJD;AAKD,GAND;;AAQA,SAAOtF,iBAAiBY,OAAjB,CAAP;AACD;;AAED;;;;;AAKO,SAASV,SAAT,CAAmBmC,IAAnB,EAAyB1B,MAAzB,EAAiC;AACtC,MAAMiF,UAAUjF,OAAOQ,GAAP,CAAW;AAAA,WAAKmE,EAAEtC,IAAP;AAAA,GAAX,CAAhB;AACA,MAAM6C,gBAAgB,CAACD,OAAD,CAAtB;;AAEA;AACAvD,OAAKxB,OAAL,CAAa,eAAO;AAClBgF,kBAAcnC,IAAd,CACEhC,IAAIP,GAAJ,CACE,UAAC8D,CAAD,EAAI3D,CAAJ;AAAA,aAAU2D,KAAKa,gCAAenB,OAAf,CAAuBnD,QAAvB,CAAgCb,OAAOW,CAAP,EAAU0B,IAA1C,CAAL,GACR+C,KAAKC,SAAL,CAAef,CAAf,CADQ,GACYA,CADtB;AAAA,KADF,CADF;AAMD,GAPD;;AASA,SAAO,0BAAcY,aAAd,CAAP;AACD;;AAED;;;;AAIO,SAAS1F,iBAAT,CAA2BkC,IAA3B,EAAiC;AACtC;AACA;;;;;;;AAOA,MAAI4D,UAAU,IAAd;AACA,MAAI,CAAC5D,IAAL,EAAW;AACT,0BAAO,qCAAP;AACA4D,cAAU,KAAV;AACD,GAHD,MAGO,IAAI,CAACd,MAAMC,OAAN,CAAc/C,KAAK1B,MAAnB,CAAL,EAAiC;AACtC,0BAAO,mDAAP;AACAsF,cAAU,KAAV;AACD,GAHM,MAGA,IAAI,CAACd,MAAMC,OAAN,CAAc/C,KAAK9B,IAAnB,CAAL,EAA+B;AACpC,0BAAO,iDAAP;AACA0F,cAAU,KAAV;AACD;;AAED,MAAI,CAACA,OAAL,EAAc;AACZ,WAAO,IAAP;AACD;;AAvBqC,MAyB/BtF,MAzB+B,GAyBf0B,IAzBe,CAyB/B1B,MAzB+B;AAAA,MAyBvBJ,IAzBuB,GAyBf8B,IAzBe,CAyBvB9B,IAzBuB;;AA2BtC;;AACA,MAAM2F,WAAWvF,OAAOwF,KAAP,CAAa,UAACb,CAAD,EAAIhE,CAAJ,EAAU;AACtC,QAAI,QAAOgE,CAAP,uDAAOA,CAAP,OAAa,QAAjB,EAA2B;AACzB,iFAA0DA,CAA1D;AACA,aAAO,KAAP;AACD;;AAED,QAAI,CAACA,EAAEtC,IAAP,EAAa;AACX,6EACiD+C,KAAKC,SAAL,CAAeV,CAAf,CADjD;AAGA;AACAA,QAAEtC,IAAF,eAAmB1B,CAAnB;AACD;;AAED,QAAI,CAACM,iCAAgB0D,EAAE3D,IAAlB,CAAL,EAA8B;AAC5B,oDAA6B2D,EAAE3D,IAA/B;AACA,aAAO,KAAP;AACD;;AAED,WAAO2D,EAAE3D,IAAF,IAAU2D,EAAEtD,MAAZ,IAAsBsD,EAAEtC,IAA/B;AACD,GApBgB,CAAjB;;AAsBA,MAAIkD,QAAJ,EAAc;AACZ,WAAO,EAAC3F,UAAD,EAAOI,cAAP,EAAP;AACD;;AAED;AACA;AACA,MAAMyF,aAAazG,wBAAwB,EAACgB,QAAQA,OAAOQ,GAAP,CAAW;AAAA,aAAKmE,EAAEtC,IAAP;AAAA,KAAX,CAAT,EAAkCpC,SAASL,IAA3C,EAAxB,CAAnB;AACA,MAAM+B,aAAa3B,OAAOQ,GAAP,CAAW;AAAA,WAAKmE,EAAEtC,IAAP;AAAA,GAAX,CAAnB;AACA,MAAMqD,OAAOxG,kBAAkBuG,UAAlB,EAA8B9D,UAA9B,CAAb;AACA,MAAMgE,gBAAgB3F,OAAOQ,GAAP,CAAW,UAACmE,CAAD,EAAIhE,CAAJ;AAAA,sCAC5BgE,CAD4B;AAE/B3D,YAAM0E,KAAK/E,CAAL,EAAQK,IAFiB;AAG/BK,cAAQqE,KAAK/E,CAAL,EAAQU;AAHe;AAAA,GAAX,CAAtB;;AAMA,SAAO,EAACrB,QAAQ2F,aAAT,EAAwB/F,UAAxB,EAAP;AACD;;kBAEc;AACbN,gCADa;AAEbP,gCAFa;AAGbM,oCAHa;AAIbD,kDAJa;AAKbF,sCALa;AAMbD;AANa,C","file":"data-processor.js","sourcesContent":["// Copyright (c) 2018 Uber Technologies, Inc.\n//\n// Permission is hereby granted, free of charge, to any person obtaining a copy\n// of this software and associated documentation files (the \"Software\"), to deal\n// in the Software without restriction, including without limitation the rights\n// to use, copy, modify, merge, publish, distribute, sublicense, and/or sell\n// copies of the Software, and to permit persons to whom the Software is\n// furnished to do so, subject to the following conditions:\n//\n// The above copyright notice and this permission notice shall be included in\n// all copies or substantial portions of the Software.\n//\n// THE SOFTWARE IS PROVIDED \"AS IS\", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR\n// IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,\n// FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE\n// AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER\n// LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,\n// OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN\n// THE SOFTWARE.\n\nimport {csvParseRows, csvFormatRows} from 'd3-dsv';\nimport {range} from 'd3-array';\nimport {console as globalConsole} from 'global/window';\nimport assert from 'assert';\nimport {Analyzer, DATA_TYPES as AnalyzerDATA_TYPES} from 'type-analyzer';\nimport normalize from '@mapbox/geojson-normalize';\nimport {ALL_FIELD_TYPES, GEOJSON_FIELDS} from 'constants/default-settings';\nimport {notNullorUndefined} from 'utils/data-utils';\n\n// if any of these value occurs in csv, parse it to null;\nconst CSV_NULLS = ['', 'null', 'NULL', 'Null', 'NaN'];\n\nexport function processCsvData(rawData) {\n\n  // here we assume the csv file that people uploaded will have first row\n  // as name of the column\n  //TODO: add a alert at upload csv to remind define first row\n  const [headerRow, ...rows] = csvParseRows(rawData);\n\n  if (!rows.length || !headerRow) {\n    // looks like an empty file\n    // resolve null, and catch them later in one place\n    return null;\n  }\n\n  cleanUpFalsyCsvValue(rows);\n  // No need to run type detection on every data point\n  // here we get a list of none null values to run analyze on\n  const sample = getSampleForTypeAnalyze({fields: headerRow, allData: rows});\n\n  const fields = getFieldsFromData(sample, headerRow);\n\n  fields.forEach(parseCsvDataByFieldType.bind(null, rows));\n\n  return {fields, rows};\n}\n\n/**\n * get fields from csv data\n *\n * @param {array} fields - an array of fields name\n * @param {array} allData\n * @param {array} sampleCount\n * @returns {array} formatted fields\n */\nexport function getSampleForTypeAnalyze({fields, allData, sampleCount = 50}) {\n  const total = Math.min(sampleCount, allData.length);\n  // const fieldOrder = fields.map(f => f.name);\n  const sample = range(0, total, 1).map(d => ({}));\n\n  // collect sample data for each field\n  fields.forEach((field, fieldIdx) => {\n    // data counter\n    let i = 0;\n    // sample counter\n    let j = 0;\n\n    while (j < total) {\n      if (i >= allData.length) {\n        // if depleted data pool\n        sample[j][field] = null;\n        j++;\n      } else if (notNullorUndefined(allData[i][fieldIdx])) {\n        sample[j][field] = allData[i][fieldIdx];\n        j++;\n        i++;\n      } else {\n        i++;\n      }\n    }\n  });\n\n  return sample;\n}\n\nfunction cleanUpFalsyCsvValue(rows) {\n  for (let i = 0; i < rows.length; i++) {\n    for (let j = 0; j < rows[i].length; j++) {\n      // analyzer will set any fields to 'string' if there are empty values\n      // which will be parsed as '' by d3.csv\n      // here we parse empty data as null\n      // TODO: create warning when deltect `CSV_NULLS` in the data\n      if (!rows[i][j] || CSV_NULLS.includes(rows[i][j])) {\n        rows[i][j] = null;\n      }\n    }\n  }\n}\n/**\n * Process uploaded csv file to parse value by field type\n *\n * @param {array} rows\n * @param {object} field\n * @param {number} i\n * @returns {void}\n */\nexport function parseCsvDataByFieldType(rows, field, i) {\n  const unixFormat = ['x', 'X'];\n\n  rows.forEach(row => {\n    if (row[i] !== null) {\n      switch (field.type) {\n        case ALL_FIELD_TYPES.real:\n          row[i] = parseFloat(row[i]);\n          break;\n\n        // TODO: timestamp can be either '1495827326' or '2016-03-10 11:20'\n        // if it's '1495827326' we pass it to int\n        case ALL_FIELD_TYPES.timestamp:\n          row[i] = unixFormat.includes(field.format) ? Number(row[i]) : row[i];\n          break;\n\n        case ALL_FIELD_TYPES.integer:\n          row[i] = parseInt(row[i], 10);\n          break;\n\n        case ALL_FIELD_TYPES.boolean:\n          // 0 and 1 only field can also be boolean\n          row[i] = row[i] === 'true' || row[i] === 'True' || row[i] === '1';\n          break;\n\n        default:\n          break;\n      }\n    }\n  });\n}\n\n/**\n * get fields from csv data\n *\n * @param {array} data\n * @param {array} fieldOrder\n * @returns {array} formatted fields\n */\nexport function getFieldsFromData(data, fieldOrder) {\n  // add a check for epoch timestamp\n  const metadata = Analyzer.computeColMeta(data, [\n    {regex: /.*geojson|all_points/g, dataType: 'GEOMETRY'}\n  ]);\n\n  const {fieldByIndex} = renameDuplicateFields(fieldOrder);\n\n  return fieldOrder.reduce((orderedArray, field, index) => {\n    const name = fieldByIndex[index];\n    const fieldMeta = metadata.find(m => m.key === field);\n    const {type, format} = fieldMeta || {};\n\n    orderedArray[index] = {\n      name,\n      format,\n\n      // need this for mapbuilder conversion: filter type detection\n      // category,\n      tableFieldIndex: index + 1,\n      type: analyzerTypeToFieldType(type)\n    };\n\n    return orderedArray;\n  }, []);\n}\n\n/**\n * pass in an array of field names, rename duplicated one\n * and return a map from old field index to new name\n *\n * @param {array} fieldOrder\n * @returns {Object} new field name by index\n */\nexport function renameDuplicateFields(fieldOrder) {\n  return fieldOrder.reduce(\n    (accu, field, i) => {\n      const {allNames} = accu;\n      let fieldName = field;\n\n      // add a counter to duplicated names\n      if (allNames.includes(field)) {\n        let counter = 0;\n        while (allNames.includes(`${field}-${counter}`)) {\n          counter++;\n        }\n        fieldName = `${field}-${counter}`;\n      }\n\n      accu.fieldByIndex[i] = fieldName;\n      accu.allNames.push(fieldName);\n\n      return accu;\n    },\n    {allNames: [], fieldByIndex: {}}\n  );\n}\n\n/**\n * Map Analyzer types to local field types\n *\n * @param {string} aType\n * @returns {string} corresponding type in ALL_FIELD_TYPES\n */\n/* eslint-disable complexity */\nexport function analyzerTypeToFieldType(aType) {\n  const {\n    DATE,\n    TIME,\n    DATETIME,\n    NUMBER,\n    INT,\n    FLOAT,\n    BOOLEAN,\n    STRING,\n    CITY,\n    GEOMETRY,\n    GEOMETRY_FROM_STRING,\n    ZIPCODE,\n    PAIR_GEOMETRY_FROM_STRING\n  } = AnalyzerDATA_TYPES;\n\n  // TODO: un recognized types\n  // CURRENCY PERCENT NONE\n  switch (aType) {\n    case DATE:\n      return ALL_FIELD_TYPES.date;\n    case TIME:\n    case DATETIME:\n      return ALL_FIELD_TYPES.timestamp;\n    case NUMBER:\n    case FLOAT:\n      return ALL_FIELD_TYPES.real;\n    case INT:\n      return ALL_FIELD_TYPES.integer;\n    case BOOLEAN:\n      return ALL_FIELD_TYPES.boolean;\n    case GEOMETRY:\n    case GEOMETRY_FROM_STRING:\n    case PAIR_GEOMETRY_FROM_STRING:\n      return ALL_FIELD_TYPES.geojson;\n    case STRING:\n    case CITY:\n    case ZIPCODE:\n      return ALL_FIELD_TYPES.string;\n    default:\n      globalConsole.warn(`Unsupported analyzer type: ${aType}`);\n      return ALL_FIELD_TYPES.string;\n  }\n}\n/* eslint-enable complexity */\n\n/*\n * Process rawData where each row is an object\n */\nexport function processRowObject(rawData) {\n  if (!rawData.length) {\n    return null;\n  }\n\n  const keys = Object.keys(rawData[0]);\n  const rows = rawData.map(d => keys.map(key => d[key]));\n  const fields = getFieldsFromData(rawData, keys);\n\n  return {\n    fields,\n    rows\n  };\n}\n\nexport function processGeojson(rawData) {\n  const normalizedGeojson = normalize(rawData);\n\n  if (!normalizedGeojson || !Array.isArray(normalizedGeojson.features)) {\n    // fail to normalize geojson\n    return null;\n  }\n\n  // getting all feature fields\n  const allData = normalizedGeojson.features.reduce((accu, f, i) => {\n    if (f.geometry) {\n      accu.push({\n        // add feature to _geojson field\n        _geojson: f,\n        ...(f.properties || {})\n      });\n    }\n    return accu;\n  }, []);\n\n  // get all the field\n  const fields = allData.reduce((prev, curr) => {\n    Object.keys(curr).forEach(key => {\n      if (!prev.includes(key)) {\n        prev.push(key);\n      }\n    });\n    return prev;\n  }, []);\n\n  // make sure each feature has exact same fields\n  allData.forEach(d => {\n    fields.forEach(f => {\n      if (!(f in d)) {\n        d[f] = null;\n      }\n    });\n  });\n\n  return processRowObject(allData);\n}\n\n/**\n * On export data to csv\n * @param data\n * @param fields\n */\nexport function formatCsv(data, fields) {\n  const columns = fields.map(f => f.name);\n  const formattedData = [columns];\n\n  // parse geojson object as string\n  data.forEach(row => {\n    formattedData.push(\n      row.map(\n        (d, i) => d && GEOJSON_FIELDS.geojson.includes(fields[i].name) ?\n          JSON.stringify(d) : d\n      )\n    )\n  });\n\n  return csvFormatRows(formattedData);\n}\n\n/**\n * @param data\n * @returns {{allData: Array, fields: Array}}\n */\nexport function validateInputData(data) {\n  // TODO: add test\n  /*\n   * expected input data format\n   * {\n   *   fields: [],\n   *   rows: []\n   * }\n   */\n  let proceed = true;\n  if (!data) {\n    assert('receiveVisData: data cannot be null');\n    proceed = false;\n  } else if (!Array.isArray(data.fields)) {\n    assert('receiveVisData: expect data.fields to be an array');\n    proceed = false;\n  } else if (!Array.isArray(data.rows)) {\n    assert('receiveVisData: expect data.rows to be an array');\n    proceed = false;\n  }\n\n  if (!proceed) {\n    return null;\n  }\n\n  const {fields, rows} = data;\n\n  // check if all fields has name, format and type\n  const allValid = fields.every((f, i) => {\n    if (typeof f !== 'object') {\n      assert(`fields needs to be an array of object, but find ${f}`);\n      return false;\n    }\n\n    if (!f.name) {\n      assert(\n        `field.name is required but missing in field ${JSON.stringify(f)}`\n      );\n      // assign a name\n      f.name = `column_${i}`;\n    }\n\n    if (!ALL_FIELD_TYPES[f.type]) {\n      assert(`unknown field type ${f.type}`);\n      return false;\n    }\n\n    return f.type && f.format && f.name;\n  });\n\n  if (allValid) {\n    return {rows, fields};\n  }\n\n  // if any field has missing type, recalculate it for everyone\n  // because we simply lost faith in humanity\n  const sampleData = getSampleForTypeAnalyze({fields: fields.map(f => f.name), allData: rows});\n  const fieldOrder = fields.map(f => f.name);\n  const meta = getFieldsFromData(sampleData, fieldOrder);\n  const updatedFields = fields.map((f, i) => ({\n    ...f,\n    type: meta[i].type,\n    format: meta[i].format\n  }));\n\n  return {fields: updatedFields, rows};\n}\n\nexport default {\n  processGeojson,\n  processCsvData,\n  processRowObject,\n  analyzerTypeToFieldType,\n  getFieldsFromData,\n  parseCsvDataByFieldType\n};\n"]}
;