This repository has been archived on 2024-07-22. You can view files and clone it, but cannot push or open issues or pull requests.
Zaimki/server/pesel.js

160 lines
5.4 KiB
JavaScript
Raw Permalink Blame History

This file contains ambiguous Unicode characters

This file contains Unicode characters that might be confused with other characters. If you think that this is intentional, you can safely ignore this warning. Use the Escape button to reveal them.

const Papa = require('papaparse');
const fs = require('fs');
const loadTsv = name => Papa.parse(fs.readFileSync(name).toString(), {
dynamicTyping: true,
header: true,
skipEmptyLines: true,
delimiter: '\t',
}).data;
const _each = (obj, callable) => {
const ret = [];
for (let key in obj) {
if (obj.hasOwnProperty(key)) {
ret.push(callable(obj[key], key));
}
}
return ret;
};
const peselK1 = loadTsv('./data/names/K1.tsv');
const peselK2 = loadTsv('./data/names/K2.tsv');
const peselM1 = loadTsv('./data/names/M1.tsv');
const peselM2 = loadTsv('./data/names/M2.tsv');
const pesel = {}
for (let [names, sex, ordinal] of [
[peselK1, 'K', 1],
[peselK2, 'K', 2],
[peselM1, 'M', 1],
[peselM2, 'M', 2],
]) {
for (let {name, count} of names) {
if (pesel[name] === undefined) {
pesel[name] = {K: [0, 0], M: [0, 0]};
}
pesel[name][sex][ordinal - 1] = count;
}
}
const calculateBalance = (k, m) => {
const balance = k / (k + m);
return balance > 0.5
? 1 - balance
: balance;
}
const allUnisex = {};
const popularUnisex = {};
const allFirstUnisex = {};
const popularFirstUnisex = {};
_each(pesel, (counts, name) => {
counts['balanceBoth'] = calculateBalance(counts.K[0] + counts.K[1], counts.M[0] + counts.M[1]);
counts['balanceFirst'] = calculateBalance(counts.K[0], counts.M[0]);
counts['balanceBothPop'] = counts['balanceBoth'] * (counts.K[0] + counts.K[1] + counts.M[0] + counts.M[1]);
counts['balanceFirstPop'] = counts['balanceFirst'] * (counts.K[0] + counts.M[0]);
});
let maxBalanceBoth = {balance: 0, name: ''};
let maxBalanceBothPop = {balance: 0, name: ''};
let maxBalanceFirst = {balance: 0, name: ''};
let maxBalanceFirstPop = {balance: 0, name: ''};
const popularMin = 100;
_each(pesel, (counts, name) => {
if (counts.K[0] + counts.K[1] > 0 && counts.M[0] + counts.M[1] > 0) {
allUnisex[name] = counts;
}
if (counts.K[0] + counts.K[1] >= popularMin && counts.M[0] + counts.M[1] >= popularMin) {
popularUnisex[name] = counts;
if (counts['balanceBoth'] > maxBalanceBoth.balance) {
maxBalanceBoth = {balance: counts['balanceBoth'], name: name};
}
}
if (counts['balanceBothPop'] > maxBalanceBothPop.balance) {
maxBalanceBothPop = {balance: counts['balanceBothPop'], name: name};
}
if (counts.K[0] > 0 && counts.M[0] > 0) {
allFirstUnisex[name] = counts;
}
if (counts.K[0] >= popularMin && counts.M[0] >= popularMin) {
popularFirstUnisex[name] = counts;
if (counts['balanceFirst'] > maxBalanceFirst.balance) {
maxBalanceFirst = {balance: counts['balanceFirst'], name: name};
}
}
if (counts['balanceFirstPop'] > maxBalanceFirstPop.balance) {
maxBalanceFirstPop = {balance: counts['balanceFirstPop'], name: name};
}
});
const buildTable = (names, both, sortBy) => {
names = _each(names, (counts, name) => { return {name, counts} }).sort((a, b) => {
return b.counts[sortBy] - a.counts[sortBy];
})
let table = `<div class="table-wide table-responsive"><table class="table table-sm table-striped"><tr class="sticky-top">`;
table += `<th data-sort><span class="fal fa-signature"></span> Imię</th>`;
table += `<th data-sort="number"><span class="fal fa-venus"></span> Kobiety${both ? ' <small>(pierwsze imię)' : ''}</small></th>`;
if (both) {
table += `<th data-sort="number"><span class="fal fa-venus"></span> Kobiety <small>(drugie imię)</small></th>`;
}
table += `<th data-sort="number"><span class="fal fa-mars"></span> Mężczyźni${both ? ' <small>(pierwsze imię)' : ''}</th>`;
if (both) {
table += `<th data-sort="number"><span class="fal fa-mars"></span> Mężczyźni <small>(drugie imię)</small></th>`;
}
table += `<th data-sort="number"><span class="fal fa-balance-scale"></span> Balans</th>`;
table += `<th data-sort="number" data-sort-auto="desc"><span class="fal fa-trophy"></span> Balans × popularność</th>`;
table += `</tr>`;
for (let {name, counts} of names) {
table += `<tr>`;
table += `<td>${name}</td>`;
table += `<td>${counts.K[0]}</td>`;
if (both) {
table += `<td>${counts.K[1]}</td>`;
}
table += `<td>${counts.M[0]}</td>`;
if (both) {
table += `<td>${counts.M[1]}</td>`;
}
table += `<td>${counts[both ? 'balanceBoth' : 'balanceFirst'].toFixed(3)}</td>`;
table += `<td>${counts[both ? 'balanceBothPop' : 'balanceFirstPop'].toFixed(0)}</td>`;
table += `</tr>`;
}
table += `</table ></div>`;
return table;
}
const buildList = (names) => {
return Object.keys(names).sort().join(', ');
}
console.log('Oba imiona:')
console.log(Object.keys(allUnisex).length);
console.log(buildList(allUnisex));
console.log(Object.keys(popularUnisex).length);
console.log(buildTable(popularUnisex, true, 'balanceBothPop'))
console.log('Max balans', maxBalanceBoth, maxBalanceBothPop)
// console.log(popularUnisex);
console.log('Pierwsze imiona:')
console.log(Object.keys(allFirstUnisex).length);
console.log(buildList(allFirstUnisex));
console.log(Object.keys(popularFirstUnisex).length);
console.log(buildTable(popularFirstUnisex, false, 'balanceFirstPop'))
console.log('Max balans', maxBalanceFirst, maxBalanceFirstPop)
// console.log(popularFirstUnisex);
console.log(allUnisex['ALEX'])
console.log(allUnisex['ALEKS'])