UNPKG

@dpkit/table

Version:

Data Package implementation in TypeScript.

244 lines 32.7 kB
import { DataFrame, Series } from "nodejs-polars"; import { DataType } from "nodejs-polars"; import { describe, expect, it } from "vitest"; import { inferSchema } from "./infer.js"; describe("inferSchema", () => { it("should infer from native types", async () => { const table = DataFrame({ integer: Series("integer", [1, 2], DataType.Int32), number: [1.1, 2.2], }).lazy(); const schema = { fields: [ { name: "integer", type: "integer" }, { name: "number", type: "number" }, ], }; expect(await inferSchema(table)).toEqual(schema); }); it("should infer numeric", async () => { const table = DataFrame({ name1: ["1", "2", "3"], name2: ["1,1", "2,2", "3,3"], name3: ["1.1", "2.2", "3.3"], name4: ["1,000.1", "2,000.2", "3,000.3"], }).lazy(); const schema = { fields: [ { name: "name1", type: "integer" }, { name: "name2", type: "integer", groupChar: "," }, { name: "name3", type: "number" }, { name: "name4", type: "number", groupChar: "," }, ], }; expect(await inferSchema(table)).toEqual(schema); }); it("should infer numeric (commaDecimal)", async () => { const table = DataFrame({ name1: ["1.1", "2.2", "3.3"], name2: ["1.1,0", "2.2,0", "3.3,0"], }).lazy(); const schema = { fields: [ { name: "name1", type: "integer", groupChar: "." }, { name: "name2", type: "number", decimalChar: ",", groupChar: "." }, ], }; expect(await inferSchema(table, { commaDecimal: true })).toEqual(schema); }); it("should infer booleans", async () => { const table = DataFrame({ name1: ["true", "True", "TRUE"], name2: ["false", "False", "FALSE"], }).lazy(); const schema = { fields: [ { name: "name1", type: "boolean" }, { name: "name2", type: "boolean" }, ], }; expect(await inferSchema(table)).toEqual(schema); }); it("should infer objects", async () => { const table = DataFrame({ name1: ['{"a": 1}'], name2: ["{}"], }).lazy(); const schema = { fields: [ { name: "name1", type: "object" }, { name: "name2", type: "object" }, ], }; expect(await inferSchema(table)).toEqual(schema); }); it("should infer arrays", async () => { const table = DataFrame({ name1: ["[1,2,3]"], name2: ["[]"], }).lazy(); const schema = { fields: [ { name: "name1", type: "array" }, { name: "name2", type: "array" }, ], }; expect(await inferSchema(table)).toEqual(schema); }); it("should infer dates with ISO format", async () => { const table = DataFrame({ name1: ["2023-01-15", "2023-02-20", "2023-03-25"], }).lazy(); const schema = { fields: [{ name: "name1", type: "date" }], }; expect(await inferSchema(table)).toEqual(schema); }); it("should infer dates with slash format", async () => { const table = DataFrame({ yearFirst: ["2023/01/15", "2023/02/20", "2023/03/25"], dayMonth: ["15/01/2023", "20/02/2023", "25/03/2023"], monthDay: ["01/15/2023", "02/20/2023", "03/25/2023"], }).lazy(); const schemaDefault = { fields: [ { name: "yearFirst", type: "date", format: "%Y/%m/%d" }, { name: "dayMonth", type: "date", format: "%d/%m/%Y" }, { name: "monthDay", type: "date", format: "%d/%m/%Y" }, ], }; const schemaMonthFirst = { fields: [ { name: "yearFirst", type: "date", format: "%Y/%m/%d" }, { name: "dayMonth", type: "date", format: "%m/%d/%Y" }, { name: "monthDay", type: "date", format: "%m/%d/%Y" }, ], }; expect(await inferSchema(table)).toEqual(schemaDefault); expect(await inferSchema(table, { monthFirst: true })).toEqual(schemaMonthFirst); }); it("should infer dates with hyphen format", async () => { const table = DataFrame({ dayMonth: ["15-01-2023", "20-02-2023", "25-03-2023"], }).lazy(); const schemaDefault = { fields: [{ name: "dayMonth", type: "date", format: "%d-%m-%Y" }], }; const schemaMonthFirst = { fields: [{ name: "dayMonth", type: "date", format: "%m-%d-%Y" }], }; expect(await inferSchema(table)).toEqual(schemaDefault); expect(await inferSchema(table, { monthFirst: true })).toEqual(schemaMonthFirst); }); it("should infer times with standard format", async () => { const table = DataFrame({ fullTime: ["14:30:45", "08:15:30", "23:59:59"], shortTime: ["14:30", "08:15", "23:59"], }).lazy(); const schema = { fields: [ { name: "fullTime", type: "time" }, { name: "shortTime", type: "time", format: "%H:%M" }, ], }; expect(await inferSchema(table)).toEqual(schema); }); it("should infer times with 12-hour format", async () => { const table = DataFrame({ fullTime: ["2:30:45 PM", "8:15:30 AM", "11:59:59 PM"], shortTime: ["2:30 PM", "8:15 AM", "11:59 PM"], }).lazy(); const schema = { fields: [ { name: "fullTime", type: "time", format: "%I:%M:%S %p" }, { name: "shortTime", type: "time", format: "%I:%M %p" }, ], }; expect(await inferSchema(table)).toEqual(schema); }); it("should infer times with timezone offset", async () => { const table = DataFrame({ name: ["14:30:45+01:00", "08:15:30-05:00", "23:59:59+00:00"], }).lazy(); const schema = { fields: [{ name: "name", type: "time" }], }; expect(await inferSchema(table)).toEqual(schema); }); it("should infer datetimes with ISO format", async () => { const table = DataFrame({ standard: [ "2023-01-15T14:30:45", "2023-02-20T08:15:30", "2023-03-25T23:59:59", ], utc: [ "2023-01-15T14:30:45Z", "2023-02-20T08:15:30Z", "2023-03-25T23:59:59Z", ], withTz: [ "2023-01-15T14:30:45+01:00", "2023-02-20T08:15:30-05:00", "2023-03-25T23:59:59+00:00", ], withSpace: [ "2023-01-15 14:30:45", "2023-02-20 08:15:30", "2023-03-25 23:59:59", ], }).lazy(); const schema = { fields: [ { name: "standard", type: "datetime" }, { name: "utc", type: "datetime" }, { name: "withTz", type: "datetime" }, { name: "withSpace", type: "datetime", format: "%Y-%m-%d %H:%M:%S" }, ], }; expect(await inferSchema(table)).toEqual(schema); }); it("should infer datetimes with custom formats", async () => { const table = DataFrame({ shortDayMonth: [ "15/01/2023 14:30", "20/02/2023 08:15", "25/03/2023 23:59", ], fullDayMonth: [ "15/01/2023 14:30:45", "20/02/2023 08:15:30", "25/03/2023 23:59:59", ], shortMonthDay: [ "01/15/2023 14:30", "02/20/2023 08:15", "03/25/2023 23:59", ], fullMonthDay: [ "01/15/2023 14:30:45", "02/20/2023 08:15:30", "03/25/2023 23:59:59", ], }).lazy(); const schemaDefault = { fields: [ { name: "shortDayMonth", type: "datetime", format: "%d/%m/%Y %H:%M" }, { name: "fullDayMonth", type: "datetime", format: "%d/%m/%Y %H:%M:%S" }, { name: "shortMonthDay", type: "datetime", format: "%d/%m/%Y %H:%M" }, { name: "fullMonthDay", type: "datetime", format: "%d/%m/%Y %H:%M:%S" }, ], }; const schemaMonthFirst = { fields: [ { name: "shortDayMonth", type: "datetime", format: "%m/%d/%Y %H:%M" }, { name: "fullDayMonth", type: "datetime", format: "%m/%d/%Y %H:%M:%S" }, { name: "shortMonthDay", type: "datetime", format: "%m/%d/%Y %H:%M" }, { name: "fullMonthDay", type: "datetime", format: "%m/%d/%Y %H:%M:%S" }, ], }; expect(await inferSchema(table)).toEqual(schemaDefault); expect(await inferSchema(table, { monthFirst: true })).toEqual(schemaMonthFirst); }); }); //# sourceMappingURL=data:application/json;base64,{"version":3,"file":"infer.spec.js","sourceRoot":"","sources":["../../schema/infer.spec.ts"],"names":[],"mappings":"AAAA,OAAO,EAAE,SAAS,EAAE,MAAM,EAAE,MAAM,eAAe,CAAA;AACjD,OAAO,EAAE,QAAQ,EAAE,MAAM,eAAe,CAAA;AACxC,OAAO,EAAE,QAAQ,EAAE,MAAM,EAAE,EAAE,EAAE,MAAM,QAAQ,CAAA;AAC7C,OAAO,EAAE,WAAW,EAAE,MAAM,YAAY,CAAA;AAExC,QAAQ,CAAC,aAAa,EAAE,GAAG,EAAE;IAC3B,EAAE,CAAC,gCAAgC,EAAE,KAAK,IAAI,EAAE;QAC9C,MAAM,KAAK,GAAG,SAAS,CAAC;YACtB,OAAO,EAAE,MAAM,CAAC,SAAS,EAAE,CAAC,CAAC,EAAE,CAAC,CAAC,EAAE,QAAQ,CAAC,KAAK,CAAC;YAClD,MAAM,EAAE,CAAC,GAAG,EAAE,GAAG,CAAC;SACnB,CAAC,CAAC,IAAI,EAAE,CAAA;QAET,MAAM,MAAM,GAAG;YACb,MAAM,EAAE;gBACN,EAAE,IAAI,EAAE,SAAS,EAAE,IAAI,EAAE,SAAS,EAAE;gBACpC,EAAE,IAAI,EAAE,QAAQ,EAAE,IAAI,EAAE,QAAQ,EAAE;aACnC;SACF,CAAA;QAED,MAAM,CAAC,MAAM,WAAW,CAAC,KAAK,CAAC,CAAC,CAAC,OAAO,CAAC,MAAM,CAAC,CAAA;IAClD,CAAC,CAAC,CAAA;IAEF,EAAE,CAAC,sBAAsB,EAAE,KAAK,IAAI,EAAE;QACpC,MAAM,KAAK,GAAG,SAAS,CAAC;YACtB,KAAK,EAAE,CAAC,GAAG,EAAE,GAAG,EAAE,GAAG,CAAC;YACtB,KAAK,EAAE,CAAC,KAAK,EAAE,KAAK,EAAE,KAAK,CAAC;YAC5B,KAAK,EAAE,CAAC,KAAK,EAAE,KAAK,EAAE,KAAK,CAAC;YAC5B,KAAK,EAAE,CAAC,SAAS,EAAE,SAAS,EAAE,SAAS,CAAC;SACzC,CAAC,CAAC,IAAI,EAAE,CAAA;QAET,MAAM,MAAM,GAAG;YACb,MAAM,EAAE;gBACN,EAAE,IAAI,EAAE,OAAO,EAAE,IAAI,EAAE,SAAS,EAAE;gBAClC,EAAE,IAAI,EAAE,OAAO,EAAE,IAAI,EAAE,SAAS,EAAE,SAAS,EAAE,GAAG,EAAE;gBAClD,EAAE,IAAI,EAAE,OAAO,EAAE,IAAI,EAAE,QAAQ,EAAE;gBACjC,EAAE,IAAI,EAAE,OAAO,EAAE,IAAI,EAAE,QAAQ,EAAE,SAAS,EAAE,GAAG,EAAE;aAClD;SACF,CAAA;QAED,MAAM,CAAC,MAAM,WAAW,CAAC,KAAK,CAAC,CAAC,CAAC,OAAO,CAAC,MAAM,CAAC,CAAA;IAClD,CAAC,CAAC,CAAA;IAEF,EAAE,CAAC,qCAAqC,EAAE,KAAK,IAAI,EAAE;QACnD,MAAM,KAAK,GAAG,SAAS,CAAC;YACtB,KAAK,EAAE,CAAC,KAAK,EAAE,KAAK,EAAE,KAAK,CAAC;YAC5B,KAAK,EAAE,CAAC,OAAO,EAAE,OAAO,EAAE,OAAO,CAAC;SACnC,CAAC,CAAC,IAAI,EAAE,CAAA;QAET,MAAM,MAAM,GAAG;YACb,MAAM,EAAE;gBACN,EAAE,IAAI,EAAE,OAAO,EAAE,IAAI,EAAE,SAAS,EAAE,SAAS,EAAE,GAAG,EAAE;gBAClD,EAAE,IAAI,EAAE,OAAO,EAAE,IAAI,EAAE,QAAQ,EAAE,WAAW,EAAE,GAAG,EAAE,SAAS,EAAE,GAAG,EAAE;aACpE;SACF,CAAA;QAED,MAAM,CAAC,MAAM,WAAW,CAAC,KAAK,EAAE,EAAE,YAAY,EAAE,IAAI,EAAE,CAAC,CAAC,CAAC,OAAO,CAAC,MAAM,CAAC,CAAA;IAC1E,CAAC,CAAC,CAAA;IAEF,EAAE,CAAC,uBAAuB,EAAE,KAAK,IAAI,EAAE;QACrC,MAAM,KAAK,GAAG,SAAS,CAAC;YACtB,KAAK,EAAE,CAAC,MAAM,EAAE,MAAM,EAAE,MAAM,CAAC;YAC/B,KAAK,EAAE,CAAC,OAAO,EAAE,OAAO,EAAE,OAAO,CAAC;SACnC,CAAC,CAAC,IAAI,EAAE,CAAA;QAET,MAAM,MAAM,GAAG;YACb,MAAM,EAAE;gBACN,EAAE,IAAI,EAAE,OAAO,EAAE,IAAI,EAAE,SAAS,EAAE;gBAClC,EAAE,IAAI,EAAE,OAAO,EAAE,IAAI,EAAE,SAAS,EAAE;aACnC;SACF,CAAA;QAED,MAAM,CAAC,MAAM,WAAW,CAAC,KAAK,CAAC,CAAC,CAAC,OAAO,CAAC,MAAM,CAAC,CAAA;IAClD,CAAC,CAAC,CAAA;IAEF,EAAE,CAAC,sBAAsB,EAAE,KAAK,IAAI,EAAE;QACpC,MAAM,KAAK,GAAG,SAAS,CAAC;YACtB,KAAK,EAAE,CAAC,UAAU,CAAC;YACnB,KAAK,EAAE,CAAC,IAAI,CAAC;SACd,CAAC,CAAC,IAAI,EAAE,CAAA;QAET,MAAM,MAAM,GAAG;YACb,MAAM,EAAE;gBACN,EAAE,IAAI,EAAE,OAAO,EAAE,IAAI,EAAE,QAAQ,EAAE;gBACjC,EAAE,IAAI,EAAE,OAAO,EAAE,IAAI,EAAE,QAAQ,EAAE;aAClC;SACF,CAAA;QAED,MAAM,CAAC,MAAM,WAAW,CAAC,KAAK,CAAC,CAAC,CAAC,OAAO,CAAC,MAAM,CAAC,CAAA;IAClD,CAAC,CAAC,CAAA;IAEF,EAAE,CAAC,qBAAqB,EAAE,KAAK,IAAI,EAAE;QACnC,MAAM,KAAK,GAAG,SAAS,CAAC;YACtB,KAAK,EAAE,CAAC,SAAS,CAAC;YAClB,KAAK,EAAE,CAAC,IAAI,CAAC;SACd,CAAC,CAAC,IAAI,EAAE,CAAA;QAET,MAAM,MAAM,GAAG;YACb,MAAM,EAAE;gBACN,EAAE,IAAI,EAAE,OAAO,EAAE,IAAI,EAAE,OAAO,EAAE;gBAChC,EAAE,IAAI,EAAE,OAAO,EAAE,IAAI,EAAE,OAAO,EAAE;aACjC;SACF,CAAA;QAED,MAAM,CAAC,MAAM,WAAW,CAAC,KAAK,CAAC,CAAC,CAAC,OAAO,CAAC,MAAM,CAAC,CAAA;IAClD,CAAC,CAAC,CAAA;IAEF,EAAE,CAAC,oCAAoC,EAAE,KAAK,IAAI,EAAE;QAClD,MAAM,KAAK,GAAG,SAAS,CAAC;YACtB,KAAK,EAAE,CAAC,YAAY,EAAE,YAAY,EAAE,YAAY,CAAC;SAClD,CAAC,CAAC,IAAI,EAAE,CAAA;QAET,MAAM,MAAM,GAAG;YACb,MAAM,EAAE,CAAC,EAAE,IAAI,EAAE,OAAO,EAAE,IAAI,EAAE,MAAM,EAAE,CAAC;SAC1C,CAAA;QAED,MAAM,CAAC,MAAM,WAAW,CAAC,KAAK,CAAC,CAAC,CAAC,OAAO,CAAC,MAAM,CAAC,CAAA;IAClD,CAAC,CAAC,CAAA;IAEF,EAAE,CAAC,sCAAsC,EAAE,KAAK,IAAI,EAAE;QACpD,MAAM,KAAK,GAAG,SAAS,CAAC;YACtB,SAAS,EAAE,CAAC,YAAY,EAAE,YAAY,EAAE,YAAY,CAAC;YACrD,QAAQ,EAAE,CAAC,YAAY,EAAE,YAAY,EAAE,YAAY,CAAC;YACpD,QAAQ,EAAE,CAAC,YAAY,EAAE,YAAY,EAAE,YAAY,CAAC;SACrD,CAAC,CAAC,IAAI,EAAE,CAAA;QAET,MAAM,aAAa,GAAG;YACpB,MAAM,EAAE;gBACN,EAAE,IAAI,EAAE,WAAW,EAAE,IAAI,EAAE,MAAM,EAAE,MAAM,EAAE,UAAU,EAAE;gBACvD,EAAE,IAAI,EAAE,UAAU,EAAE,IAAI,EAAE,MAAM,EAAE,MAAM,EAAE,UAAU,EAAE;gBACtD,EAAE,IAAI,EAAE,UAAU,EAAE,IAAI,EAAE,MAAM,EAAE,MAAM,EAAE,UAAU,EAAE;aACvD;SACF,CAAA;QAED,MAAM,gBAAgB,GAAG;YACvB,MAAM,EAAE;gBACN,EAAE,IAAI,EAAE,WAAW,EAAE,IAAI,EAAE,MAAM,EAAE,MAAM,EAAE,UAAU,EAAE;gBACvD,EAAE,IAAI,EAAE,UAAU,EAAE,IAAI,EAAE,MAAM,EAAE,MAAM,EAAE,UAAU,EAAE;gBACtD,EAAE,IAAI,EAAE,UAAU,EAAE,IAAI,EAAE,MAAM,EAAE,MAAM,EAAE,UAAU,EAAE;aACvD;SACF,CAAA;QAED,MAAM,CAAC,MAAM,WAAW,CAAC,KAAK,CAAC,CAAC,CAAC,OAAO,CAAC,aAAa,CAAC,CAAA;QACvD,MAAM,CAAC,MAAM,WAAW,CAAC,KAAK,EAAE,EAAE,UAAU,EAAE,IAAI,EAAE,CAAC,CAAC,CAAC,OAAO,CAC5D,gBAAgB,CACjB,CAAA;IACH,CAAC,CAAC,CAAA;IAEF,EAAE,CAAC,uCAAuC,EAAE,KAAK,IAAI,EAAE;QACrD,MAAM,KAAK,GAAG,SAAS,CAAC;YACtB,QAAQ,EAAE,CAAC,YAAY,EAAE,YAAY,EAAE,YAAY,CAAC;SACrD,CAAC,CAAC,IAAI,EAAE,CAAA;QAET,MAAM,aAAa,GAAG;YACpB,MAAM,EAAE,CAAC,EAAE,IAAI,EAAE,UAAU,EAAE,IAAI,EAAE,MAAM,EAAE,MAAM,EAAE,UAAU,EAAE,CAAC;SACjE,CAAA;QAED,MAAM,gBAAgB,GAAG;YACvB,MAAM,EAAE,CAAC,EAAE,IAAI,EAAE,UAAU,EAAE,IAAI,EAAE,MAAM,EAAE,MAAM,EAAE,UAAU,EAAE,CAAC;SACjE,CAAA;QAED,MAAM,CAAC,MAAM,WAAW,CAAC,KAAK,CAAC,CAAC,CAAC,OAAO,CAAC,aAAa,CAAC,CAAA;QACvD,MAAM,CAAC,MAAM,WAAW,CAAC,KAAK,EAAE,EAAE,UAAU,EAAE,IAAI,EAAE,CAAC,CAAC,CAAC,OAAO,CAC5D,gBAAgB,CACjB,CAAA;IACH,CAAC,CAAC,CAAA;IAEF,EAAE,CAAC,yCAAyC,EAAE,KAAK,IAAI,EAAE;QACvD,MAAM,KAAK,GAAG,SAAS,CAAC;YACtB,QAAQ,EAAE,CAAC,UAAU,EAAE,UAAU,EAAE,UAAU,CAAC;YAC9C,SAAS,EAAE,CAAC,OAAO,EAAE,OAAO,EAAE,OAAO,CAAC;SACvC,CAAC,CAAC,IAAI,EAAE,CAAA;QAET,MAAM,MAAM,GAAG;YACb,MAAM,EAAE;gBACN,EAAE,IAAI,EAAE,UAAU,EAAE,IAAI,EAAE,MAAM,EAAE;gBAClC,EAAE,IAAI,EAAE,WAAW,EAAE,IAAI,EAAE,MAAM,EAAE,MAAM,EAAE,OAAO,EAAE;aACrD;SACF,CAAA;QAED,MAAM,CAAC,MAAM,WAAW,CAAC,KAAK,CAAC,CAAC,CAAC,OAAO,CAAC,MAAM,CAAC,CAAA;IAClD,CAAC,CAAC,CAAA;IAEF,EAAE,CAAC,wCAAwC,EAAE,KAAK,IAAI,EAAE;QACtD,MAAM,KAAK,GAAG,SAAS,CAAC;YACtB,QAAQ,EAAE,CAAC,YAAY,EAAE,YAAY,EAAE,aAAa,CAAC;YACrD,SAAS,EAAE,CAAC,SAAS,EAAE,SAAS,EAAE,UAAU,CAAC;SAC9C,CAAC,CAAC,IAAI,EAAE,CAAA;QAET,MAAM,MAAM,GAAG;YACb,MAAM,EAAE;gBACN,EAAE,IAAI,EAAE,UAAU,EAAE,IAAI,EAAE,MAAM,EAAE,MAAM,EAAE,aAAa,EAAE;gBACzD,EAAE,IAAI,EAAE,WAAW,EAAE,IAAI,EAAE,MAAM,EAAE,MAAM,EAAE,UAAU,EAAE;aACxD;SACF,CAAA;QAED,MAAM,CAAC,MAAM,WAAW,CAAC,KAAK,CAAC,CAAC,CAAC,OAAO,CAAC,MAAM,CAAC,CAAA;IAClD,CAAC,CAAC,CAAA;IAEF,EAAE,CAAC,yCAAyC,EAAE,KAAK,IAAI,EAAE;QACvD,MAAM,KAAK,GAAG,SAAS,CAAC;YACtB,IAAI,EAAE,CAAC,gBAAgB,EAAE,gBAAgB,EAAE,gBAAgB,CAAC;SAC7D,CAAC,CAAC,IAAI,EAAE,CAAA;QAET,MAAM,MAAM,GAAG;YACb,MAAM,EAAE,CAAC,EAAE,IAAI,EAAE,MAAM,EAAE,IAAI,EAAE,MAAM,EAAE,CAAC;SACzC,CAAA;QAED,MAAM,CAAC,MAAM,WAAW,CAAC,KAAK,CAAC,CAAC,CAAC,OAAO,CAAC,MAAM,CAAC,CAAA;IAClD,CAAC,CAAC,CAAA;IAEF,EAAE,CAAC,wCAAwC,EAAE,KAAK,IAAI,EAAE;QACtD,MAAM,KAAK,GAAG,SAAS,CAAC;YACtB,QAAQ,EAAE;gBACR,qBAAqB;gBACrB,qBAAqB;gBACrB,qBAAqB;aACtB;YACD,GAAG,EAAE;gBACH,sBAAsB;gBACtB,sBAAsB;gBACtB,sBAAsB;aACvB;YACD,MAAM,EAAE;gBACN,2BAA2B;gBAC3B,2BAA2B;gBAC3B,2BAA2B;aAC5B;YACD,SAAS,EAAE;gBACT,qBAAqB;gBACrB,qBAAqB;gBACrB,qBAAqB;aACtB;SACF,CAAC,CAAC,IAAI,EAAE,CAAA;QAET,MAAM,MAAM,GAAG;YACb,MAAM,EAAE;gBACN,EAAE,IAAI,EAAE,UAAU,EAAE,IAAI,EAAE,UAAU,EAAE;gBACtC,EAAE,IAAI,EAAE,KAAK,EAAE,IAAI,EAAE,UAAU,EAAE;gBACjC,EAAE,IAAI,EAAE,QAAQ,EAAE,IAAI,EAAE,UAAU,EAAE;gBACpC,EAAE,IAAI,EAAE,WAAW,EAAE,IAAI,EAAE,UAAU,EAAE,MAAM,EAAE,mBAAmB,EAAE;aACrE;SACF,CAAA;QAED,MAAM,CAAC,MAAM,WAAW,CAAC,KAAK,CAAC,CAAC,CAAC,OAAO,CAAC,MAAM,CAAC,CAAA;IAClD,CAAC,CAAC,CAAA;IAEF,EAAE,CAAC,4CAA4C,EAAE,KAAK,IAAI,EAAE;QAC1D,MAAM,KAAK,GAAG,SAAS,CAAC;YACtB,aAAa,EAAE;gBACb,kBAAkB;gBAClB,kBAAkB;gBAClB,kBAAkB;aACnB;YACD,YAAY,EAAE;gBACZ,qBAAqB;gBACrB,qBAAqB;gBACrB,qBAAqB;aACtB;YACD,aAAa,EAAE;gBACb,kBAAkB;gBAClB,kBAAkB;gBAClB,kBAAkB;aACnB;YACD,YAAY,EAAE;gBACZ,qBAAqB;gBACrB,qBAAqB;gBACrB,qBAAqB;aACtB;SACF,CAAC,CAAC,IAAI,EAAE,CAAA;QAET,MAAM,aAAa,GAAG;YACpB,MAAM,EAAE;gBACN,EAAE,IAAI,EAAE,eAAe,EAAE,IAAI,EAAE,UAAU,EAAE,MAAM,EAAE,gBAAgB,EAAE;gBACrE,EAAE,IAAI,EAAE,cAAc,EAAE,IAAI,EAAE,UAAU,EAAE,MAAM,EAAE,mBAAmB,EAAE;gBACvE,EAAE,IAAI,EAAE,eAAe,EAAE,IAAI,EAAE,UAAU,EAAE,MAAM,EAAE,gBAAgB,EAAE;gBACrE,EAAE,IAAI,EAAE,cAAc,EAAE,IAAI,EAAE,UAAU,EAAE,MAAM,EAAE,mBAAmB,EAAE;aACxE;SACF,CAAA;QAED,MAAM,gBAAgB,GAAG;YACvB,MAAM,EAAE;gBACN,EAAE,IAAI,EAAE,eAAe,EAAE,IAAI,EAAE,UAAU,EAAE,MAAM,EAAE,gBAAgB,EAAE;gBACrE,EAAE,IAAI,EAAE,cAAc,EAAE,IAAI,EAAE,UAAU,EAAE,MAAM,EAAE,mBAAmB,EAAE;gBACvE,EAAE,IAAI,EAAE,eAAe,EAAE,IAAI,EAAE,UAAU,EAAE,MAAM,EAAE,gBAAgB,EAAE;gBACrE,EAAE,IAAI,EAAE,cAAc,EAAE,IAAI,EAAE,UAAU,EAAE,MAAM,EAAE,mBAAmB,EAAE;aACxE;SACF,CAAA;QAED,MAAM,CAAC,MAAM,WAAW,CAAC,KAAK,CAAC,CAAC,CAAC,OAAO,CAAC,aAAa,CAAC,CAAA;QACvD,MAAM,CAAC,MAAM,WAAW,CAAC,KAAK,EAAE,EAAE,UAAU,EAAE,IAAI,EAAE,CAAC,CAAC,CAAC,OAAO,CAC5D,gBAAgB,CACjB,CAAA;IACH,CAAC,CAAC,CAAA;AACJ,CAAC,CAAC,CAAA","sourcesContent":["import { DataFrame, Series } from \"nodejs-polars\"\nimport { DataType } from \"nodejs-polars\"\nimport { describe, expect, it } from \"vitest\"\nimport { inferSchema } from \"./infer.ts\"\n\ndescribe(\"inferSchema\", () => {\n  it(\"should infer from native types\", async () => {\n    const table = DataFrame({\n      integer: Series(\"integer\", [1, 2], DataType.Int32),\n      number: [1.1, 2.2],\n    }).lazy()\n\n    const schema = {\n      fields: [\n        { name: \"integer\", type: \"integer\" },\n        { name: \"number\", type: \"number\" },\n      ],\n    }\n\n    expect(await inferSchema(table)).toEqual(schema)\n  })\n\n  it(\"should infer numeric\", async () => {\n    const table = DataFrame({\n      name1: [\"1\", \"2\", \"3\"],\n      name2: [\"1,1\", \"2,2\", \"3,3\"],\n      name3: [\"1.1\", \"2.2\", \"3.3\"],\n      name4: [\"1,000.1\", \"2,000.2\", \"3,000.3\"],\n    }).lazy()\n\n    const schema = {\n      fields: [\n        { name: \"name1\", type: \"integer\" },\n        { name: \"name2\", type: \"integer\", groupChar: \",\" },\n        { name: \"name3\", type: \"number\" },\n        { name: \"name4\", type: \"number\", groupChar: \",\" },\n      ],\n    }\n\n    expect(await inferSchema(table)).toEqual(schema)\n  })\n\n  it(\"should infer numeric (commaDecimal)\", async () => {\n    const table = DataFrame({\n      name1: [\"1.1\", \"2.2\", \"3.3\"],\n      name2: [\"1.1,0\", \"2.2,0\", \"3.3,0\"],\n    }).lazy()\n\n    const schema = {\n      fields: [\n        { name: \"name1\", type: \"integer\", groupChar: \".\" },\n        { name: \"name2\", type: \"number\", decimalChar: \",\", groupChar: \".\" },\n      ],\n    }\n\n    expect(await inferSchema(table, { commaDecimal: true })).toEqual(schema)\n  })\n\n  it(\"should infer booleans\", async () => {\n    const table = DataFrame({\n      name1: [\"true\", \"True\", \"TRUE\"],\n      name2: [\"false\", \"False\", \"FALSE\"],\n    }).lazy()\n\n    const schema = {\n      fields: [\n        { name: \"name1\", type: \"boolean\" },\n        { name: \"name2\", type: \"boolean\" },\n      ],\n    }\n\n    expect(await inferSchema(table)).toEqual(schema)\n  })\n\n  it(\"should infer objects\", async () => {\n    const table = DataFrame({\n      name1: ['{\"a\": 1}'],\n      name2: [\"{}\"],\n    }).lazy()\n\n    const schema = {\n      fields: [\n        { name: \"name1\", type: \"object\" },\n        { name: \"name2\", type: \"object\" },\n      ],\n    }\n\n    expect(await inferSchema(table)).toEqual(schema)\n  })\n\n  it(\"should infer arrays\", async () => {\n    const table = DataFrame({\n      name1: [\"[1,2,3]\"],\n      name2: [\"[]\"],\n    }).lazy()\n\n    const schema = {\n      fields: [\n        { name: \"name1\", type: \"array\" },\n        { name: \"name2\", type: \"array\" },\n      ],\n    }\n\n    expect(await inferSchema(table)).toEqual(schema)\n  })\n\n  it(\"should infer dates with ISO format\", async () => {\n    const table = DataFrame({\n      name1: [\"2023-01-15\", \"2023-02-20\", \"2023-03-25\"],\n    }).lazy()\n\n    const schema = {\n      fields: [{ name: \"name1\", type: \"date\" }],\n    }\n\n    expect(await inferSchema(table)).toEqual(schema)\n  })\n\n  it(\"should infer dates with slash format\", async () => {\n    const table = DataFrame({\n      yearFirst: [\"2023/01/15\", \"2023/02/20\", \"2023/03/25\"],\n      dayMonth: [\"15/01/2023\", \"20/02/2023\", \"25/03/2023\"],\n      monthDay: [\"01/15/2023\", \"02/20/2023\", \"03/25/2023\"],\n    }).lazy()\n\n    const schemaDefault = {\n      fields: [\n        { name: \"yearFirst\", type: \"date\", format: \"%Y/%m/%d\" },\n        { name: \"dayMonth\", type: \"date\", format: \"%d/%m/%Y\" },\n        { name: \"monthDay\", type: \"date\", format: \"%d/%m/%Y\" },\n      ],\n    }\n\n    const schemaMonthFirst = {\n      fields: [\n        { name: \"yearFirst\", type: \"date\", format: \"%Y/%m/%d\" },\n        { name: \"dayMonth\", type: \"date\", format: \"%m/%d/%Y\" },\n        { name: \"monthDay\", type: \"date\", format: \"%m/%d/%Y\" },\n      ],\n    }\n\n    expect(await inferSchema(table)).toEqual(schemaDefault)\n    expect(await inferSchema(table, { monthFirst: true })).toEqual(\n      schemaMonthFirst,\n    )\n  })\n\n  it(\"should infer dates with hyphen format\", async () => {\n    const table = DataFrame({\n      dayMonth: [\"15-01-2023\", \"20-02-2023\", \"25-03-2023\"],\n    }).lazy()\n\n    const schemaDefault = {\n      fields: [{ name: \"dayMonth\", type: \"date\", format: \"%d-%m-%Y\" }],\n    }\n\n    const schemaMonthFirst = {\n      fields: [{ name: \"dayMonth\", type: \"date\", format: \"%m-%d-%Y\" }],\n    }\n\n    expect(await inferSchema(table)).toEqual(schemaDefault)\n    expect(await inferSchema(table, { monthFirst: true })).toEqual(\n      schemaMonthFirst,\n    )\n  })\n\n  it(\"should infer times with standard format\", async () => {\n    const table = DataFrame({\n      fullTime: [\"14:30:45\", \"08:15:30\", \"23:59:59\"],\n      shortTime: [\"14:30\", \"08:15\", \"23:59\"],\n    }).lazy()\n\n    const schema = {\n      fields: [\n        { name: \"fullTime\", type: \"time\" },\n        { name: \"shortTime\", type: \"time\", format: \"%H:%M\" },\n      ],\n    }\n\n    expect(await inferSchema(table)).toEqual(schema)\n  })\n\n  it(\"should infer times with 12-hour format\", async () => {\n    const table = DataFrame({\n      fullTime: [\"2:30:45 PM\", \"8:15:30 AM\", \"11:59:59 PM\"],\n      shortTime: [\"2:30 PM\", \"8:15 AM\", \"11:59 PM\"],\n    }).lazy()\n\n    const schema = {\n      fields: [\n        { name: \"fullTime\", type: \"time\", format: \"%I:%M:%S %p\" },\n        { name: \"shortTime\", type: \"time\", format: \"%I:%M %p\" },\n      ],\n    }\n\n    expect(await inferSchema(table)).toEqual(schema)\n  })\n\n  it(\"should infer times with timezone offset\", async () => {\n    const table = DataFrame({\n      name: [\"14:30:45+01:00\", \"08:15:30-05:00\", \"23:59:59+00:00\"],\n    }).lazy()\n\n    const schema = {\n      fields: [{ name: \"name\", type: \"time\" }],\n    }\n\n    expect(await inferSchema(table)).toEqual(schema)\n  })\n\n  it(\"should infer datetimes with ISO format\", async () => {\n    const table = DataFrame({\n      standard: [\n        \"2023-01-15T14:30:45\",\n        \"2023-02-20T08:15:30\",\n        \"2023-03-25T23:59:59\",\n      ],\n      utc: [\n        \"2023-01-15T14:30:45Z\",\n        \"2023-02-20T08:15:30Z\",\n        \"2023-03-25T23:59:59Z\",\n      ],\n      withTz: [\n        \"2023-01-15T14:30:45+01:00\",\n        \"2023-02-20T08:15:30-05:00\",\n        \"2023-03-25T23:59:59+00:00\",\n      ],\n      withSpace: [\n        \"2023-01-15 14:30:45\",\n        \"2023-02-20 08:15:30\",\n        \"2023-03-25 23:59:59\",\n      ],\n    }).lazy()\n\n    const schema = {\n      fields: [\n        { name: \"standard\", type: \"datetime\" },\n        { name: \"utc\", type: \"datetime\" },\n        { name: \"withTz\", type: \"datetime\" },\n        { name: \"withSpace\", type: \"datetime\", format: \"%Y-%m-%d %H:%M:%S\" },\n      ],\n    }\n\n    expect(await inferSchema(table)).toEqual(schema)\n  })\n\n  it(\"should infer datetimes with custom formats\", async () => {\n    const table = DataFrame({\n      shortDayMonth: [\n        \"15/01/2023 14:30\",\n        \"20/02/2023 08:15\",\n        \"25/03/2023 23:59\",\n      ],\n      fullDayMonth: [\n        \"15/01/2023 14:30:45\",\n        \"20/02/2023 08:15:30\",\n        \"25/03/2023 23:59:59\",\n      ],\n      shortMonthDay: [\n        \"01/15/2023 14:30\",\n        \"02/20/2023 08:15\",\n        \"03/25/2023 23:59\",\n      ],\n      fullMonthDay: [\n        \"01/15/2023 14:30:45\",\n        \"02/20/2023 08:15:30\",\n        \"03/25/2023 23:59:59\",\n      ],\n    }).lazy()\n\n    const schemaDefault = {\n      fields: [\n        { name: \"shortDayMonth\", type: \"datetime\", format: \"%d/%m/%Y %H:%M\" },\n        { name: \"fullDayMonth\", type: \"datetime\", format: \"%d/%m/%Y %H:%M:%S\" },\n        { name: \"shortMonthDay\", type: \"datetime\", format: \"%d/%m/%Y %H:%M\" },\n        { name: \"fullMonthDay\", type: \"datetime\", format: \"%d/%m/%Y %H:%M:%S\" },\n      ],\n    }\n\n    const schemaMonthFirst = {\n      fields: [\n        { name: \"shortDayMonth\", type: \"datetime\", format: \"%m/%d/%Y %H:%M\" },\n        { name: \"fullDayMonth\", type: \"datetime\", format: \"%m/%d/%Y %H:%M:%S\" },\n        { name: \"shortMonthDay\", type: \"datetime\", format: \"%m/%d/%Y %H:%M\" },\n        { name: \"fullMonthDay\", type: \"datetime\", format: \"%m/%d/%Y %H:%M:%S\" },\n      ],\n    }\n\n    expect(await inferSchema(table)).toEqual(schemaDefault)\n    expect(await inferSchema(table, { monthFirst: true })).toEqual(\n      schemaMonthFirst,\n    )\n  })\n})\n"]}