forked from dracor-org/einakter
-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathyml2csv.ts
79 lines (74 loc) · 2.49 KB
/
yml2csv.ts
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
import {loadAll, CORE_SCHEMA} from 'js-yaml';
import {readFileSync, writeFileSync} from 'fs';
import {Play} from './src/types';
import {
normalizeYear,
getEarliestYear,
countCharactersByGender
} from './src/utils';
// Plays parsed from ./data.yaml. Stays an empty list when reading or parsing
// fails; the failure is only logged and the script carries on.
let data: Play[] = [];
try {
  const yamlSource = readFileSync('./data.yaml', 'utf8');
  const documents = loadAll(yamlSource, null, {schema: CORE_SCHEMA});
  data = documents as Play[];
} catch (error) {
  console.log(error);
}
// Names of the CSV columns, in output order. Each name is also the key that
// is looked up on the per-play record when a row is assembled.
const cols: string[] = [
  'id',
  // the slug, but as a clickable link for convenience
  'link',
  'title',
  'subtitle',
  // only true or false, an easy way to exclude translations
  'basedOn',
  'earliestYear',
  'normalizedYear',
  'createdYear',
  'printedYear',
  // without day/month for premiere dates, only years
  'premiereYear',
  // in one cell, separated by a line break
  'formalia',
  // in one cell, separated by a line break
  'keywords',
  // as full URL to be clickable for convenience
  'wikidataID',
  // as full URL to be clickable for convenience
  'dracorID',
  'wegaId',
  // as full URL to be clickable for convenience
  'locationID',
  'numberOfScenes',
  'numberOfCharacters',
  'numberOfMaleCharacters',
  'numberOfFemaleCharacters',
  'numberOfCharactersWithUnknownGender',
];
/**
 * One CSV record (without trailing newline) per play in `data`.
 *
 * For every play a flat lookup object is built from the play's own fields
 * plus derived values (years, character counts, full URLs for identifiers).
 * The cells are then emitted in the order given by `cols`, each wrapped in
 * double quotes with embedded double quotes doubled.
 */
const lines = data.map((p: Play) => {
  const num = countCharactersByGender(p);

  // Wikidata ID of the first setting whose location carries one. `location`
  // is treated as optional by the predicate, so the final hop is
  // optional-chained as well instead of being dereferenced unguarded.
  const locationId = p.settings?.find(
    (s) => s.location?.wikidataId
  )?.location?.wikidataId;

  // Spread first so the derived fields below win over same-named play fields.
  const play: {[index: string]: any} = {
    ...p,
    normalizedYear: normalizeYear(p),
    earliestYear: getEarliestYear(p) || '',
    numberOfCharacters: num.total,
    numberOfMaleCharacters: num.male,
    numberOfFemaleCharacters: num.female,
    numberOfCharactersWithUnknownGender: num.unknown,
    basedOn: p.basedOn ? 'true' : 'false',
    link: `https://einakter.dracor.org/${p.slug}`,
    createdYear: p.created,
    printedYear: p.printed,
    // Keep only the text before the first '-' of the premiere date.
    premiereYear: p.premiered ? `${p.premiered}`.split('-')[0] : '',
    // Multi-valued fields share one cell, one entry per line.
    formalia: p.formalia?.join('\n'),
    keywords: p.keywords?.join('\n'),
    dracorID: p.ids?.dracor ? `https://dracor.org/id/${p.ids.dracor}` : '',
    wegaId: p.ids?.weber ? `http://weber-gesamtausgabe.de/${p.ids.weber}` : '',
    wikidataID: p.ids?.wikidata
      ? `http://wikidata.org/entity/${p.ids.wikidata}` : '',
    locationID: locationId
      ? `http://wikidata.org/entity/${locationId}` : '',
  };

  const line = cols.map(col => {
    const raw = play[col];
    // A numeric 0 is a real value (e.g. a play with no female characters)
    // and must be written as "0"; a plain `|| ''` would blank it and make
    // it indistinguishable from missing data. Every other falsy value
    // (undefined, null, '', false, NaN) still yields an empty cell.
    const text = raw === 0 ? '0' : `${raw || ''}`;
    return `"${text.replace(/"/g, '""')}"`;
  }).join(',');
  return line;
});
// Put the (unquoted) header row in front of the records, then write the
// newline-separated result to ./data.csv.
const headerRow = cols.join(',');
lines.splice(0, 0, headerRow);
const csvText = lines.join('\n');
writeFileSync('./data.csv', csvText);