datapilot-cli
Version:
Enterprise-grade streaming multi-format data analysis with comprehensive statistical insights and intelligent relationship detection - supports CSV, JSON, Excel, TSV, Parquet - memory-efficient, cross-platform
43 lines • 1.58 kB
TypeScript
/**
* Section 5: Data Engineering & Structural Insights Analyzer (Fixed Version)
* Simplified implementation that works with current data structures
*/
import type { Section1Result } from '../overview/types';
import type { Section2Result } from '../quality/types';
import type { Section3Result } from '../eda/types';
import type { Section5Result, Section5Config, Section5Progress } from './types';
export declare class Section5Analyzer {
private config;
private warnings;
private startTime;
constructor(config?: Partial<Section5Config>);
/**
* Main analysis method
*/
analyze(section1Result: Section1Result, section2Result: Section2Result, section3Result: Section3Result, progressCallback?: (progress: Section5Progress) => void): Section5Result;
private generateSimplifiedAnalysis;
private generateSimpleDDL;
private standardizeColumnName;
/**
* Infer appropriate database type based on column name and characteristics
*/
private inferDatabaseType;
/**
* Extract PCA insights from Section 3 results for feature engineering
*/
private extractPCAInsights;
/**
* Calculate enhanced ML readiness score incorporating PCA insights
*/
private calculateEnhancedMLReadinessScore;
/**
* Enhance feature preparation matrix with PCA insights
*/
private enhanceFeatureMatrix;
/**
* Extract actual sample values from Section 1 data preview
*/
private extractSampleValues;
private reportProgress;
}
//# sourceMappingURL=section5-analyzer-fixed.d.ts.map