Skip to content

Commit de40f95

Browse files
authored
feat(lib): Populate feature and labels in user provided order (#217)
BREAKING CHANGE: Previously column order in the CSV file was preserved, this is no longer the case, therefore changing the output.
1 parent 93c9296 commit de40f95

File tree

3 files changed

+35
-14
lines changed

3 files changed

+35
-14
lines changed

src/filterColumns.ts

+23-5
Original file line numberDiff line numberDiff line change
@@ -1,12 +1,30 @@
11
import { CsvTable } from './loadCsv.models';
22

3-
const filterColumns = (table: CsvTable, columnNames: string[]) => {
4-
const indexKeepDecisions = table[0].map(
5-
(header) => columnNames.indexOf(header as string) > -1
3+
/**
4+
* Filters and re-orders columns in a given CSV table.
5+
*
6+
* Where n is the number of non-header cells in `table`, `m` is the number of header cells in `table`, and h is the number of items in `headers`
7+
*
8+
* Time complexity: O(n + mh)
9+
*
10+
* Space complexity: O(n + m + h)
11+
*/
12+
const filterColumns = (table: CsvTable, headers: string[]) => {
13+
const indexKeepDecisions = table[0].map((columnName) =>
14+
headers.includes(columnName as string)
615
);
7-
return table.map((row) =>
8-
row.filter((_, index) => indexKeepDecisions[index])
16+
const filteredColumnNames = table[0].filter((_, i) => indexKeepDecisions[i]);
17+
const indexMap = filteredColumnNames.map((columnName) =>
18+
headers.indexOf(columnName as string)
919
);
20+
return table.map((row) => {
21+
const newRow = new Array(indexMap.length);
22+
for (let i = 0, j = 0; i < row.length; i++) {
23+
if (!indexKeepDecisions[i]) continue;
24+
newRow[indexMap[j++]] = row[i];
25+
}
26+
return newRow;
27+
});
1028
};
1129

1230
export default filterColumns;

src/loadCsv.ts

+5-2
Original file line numberDiff line numberDiff line change
@@ -45,15 +45,18 @@ const loadCsv = (
4545
throw new Error('CSV file can not be shorter than two rows');
4646
}
4747

48-
applyMappings(data, mappings, new Set(flatten));
49-
5048
const tables: { [key: string]: CsvTable } = {
5149
labels: filterColumns(data, labelColumns),
5250
features: filterColumns(data, featureColumns),
5351
testFeatures: [],
5452
testLabels: [],
5553
};
5654

55+
const flattenSet = new Set(flatten);
56+
57+
applyMappings(tables.labels, mappings, flattenSet);
58+
applyMappings(tables.features, mappings, flattenSet);
59+
5760
tables.labels.shift();
5861
const featureColumnNames = tables.features.shift() as string[];
5962

tests/filterColumns.test.ts

+7-7
Original file line numberDiff line numberDiff line change
@@ -2,20 +2,20 @@ import filterColumns from '../src/filterColumns';
22

33
const data = [
44
['lat', 'lng', 'country'],
5-
['0.234', '1.47', 'SomeCountria'],
6-
['-293.2', '103.34', 'SomeOtherCountria'],
5+
['0', '1.47', 'SomeCountria'],
6+
['1', '103.34', 'SomeOtherCountria'],
77
];
88

99
test('Filtering a single column works correctly', () => {
1010
const result = filterColumns(data, ['lng']);
1111
expect(result).toMatchObject([['lng'], ['1.47'], ['103.34']]);
1212
});
1313

14-
test('Filtering multiple columns works correctly', () => {
15-
const result = filterColumns(data, ['country', 'lng']); // Column order from the CSV should be preserved.
14+
test('Filtering multiple columns works correctly, respects order in second argument, does not break with multiple same name columns', () => {
15+
const result = filterColumns(data, ['country', 'lat']); // Column order from the CSV should be preserved.
1616
expect(result).toMatchObject([
17-
['lng', 'country'],
18-
['1.47', 'SomeCountria'],
19-
['103.34', 'SomeOtherCountria'],
17+
['country', 'lat'],
18+
['SomeCountria', '0'],
19+
['SomeOtherCountria', '1'],
2020
]);
2121
});

0 commit comments

Comments
 (0)