gadm-ts/dist/names.js
2026-03-23 17:35:02 +01:00

170 lines
15 KiB
JavaScript

/**
* Names lookup — port of Python pygadm.Names class.
*
* Searches the GADM parquet database for admin areas by name or GID code.
* Returns matching rows with NAME_{level} and GID_{level} columns.
*/
import { loadDatabase } from './database.js';
// ---------- helpers ----------
/** Simple Levenshtein distance for fuzzy matching */
function levenshtein(a, b) {
const m = a.length, n = b.length;
const dp = Array.from({ length: m + 1 }, () => Array(n + 1).fill(0));
for (let i = 0; i <= m; i++)
dp[i][0] = i;
for (let j = 0; j <= n; j++)
dp[0][j] = j;
for (let i = 1; i <= m; i++) {
for (let j = 1; j <= n; j++) {
dp[i][j] = a[i - 1] === b[j - 1]
? dp[i - 1][j - 1]
: 1 + Math.min(dp[i - 1][j], dp[i][j - 1], dp[i - 1][j - 1]);
}
}
return dp[m][n];
}
/** Find the N closest matches to `query` from a list of candidates */
function closestMatches(query, candidates, n = 5) {
const q = query.toLowerCase();
const scored = candidates.map(c => ({ val: c, dist: levenshtein(q, c.toLowerCase()) }));
scored.sort((a, b) => a.dist - b.dist);
return scored.slice(0, n).map(s => s.val);
}
// ---------- main function ----------
/**
* Look up administrative area names/codes in the GADM database.
*
* Port of Python `pygadm.Names(name, admin, content_level, complete)`.
*/
export async function getNames(opts = {}) {
const { name, admin, contentLevel: rawContentLevel = -1, complete = false } = opts;
if (name && admin) {
throw new Error('"name" and "admin" cannot be set at the same time.');
}
const db = await loadDatabase();
let contentLevel = rawContentLevel;
if (name || admin) {
const isName = !!name;
const id = (name || admin);
const colPrefix = isName ? 'NAME_' : 'GID_';
// Search all 6 levels for the id
const matchedLevel = findLevel(db, colPrefix, id);
if (matchedLevel === -1) {
// Not found — suggest closest matches
const allIds = collectAllIds(db, colPrefix);
const close = closestMatches(id, allIds, 5);
const formatted = isName
? close.map(c => capitalize(c))
: close.map(c => c.toUpperCase());
throw new Error(`The requested "${id}" is not part of GADM. ` +
`The closest matches are: ${formatted.join(', ')}.`);
}
const level = matchedLevel;
// Filter to rows matching this id at the found level
const col = `${colPrefix}${level}`;
let subDf = db.filter(r => caseEqual(r[col], id));
// Find max available level in this subset
const maxLevel = findMaxLevel(subDf);
// Resolve content level
if (contentLevel === -1) {
contentLevel = level;
}
else if (contentLevel < level) {
// Requested level higher than area — fallback
contentLevel = level;
}
if (contentLevel > maxLevel) {
contentLevel = maxLevel;
}
// Deduplicate at content level
const nameCol = `NAME_${contentLevel}`;
const gidCol = `GID_${contentLevel}`;
const seen = new Set();
subDf = subDf.filter(r => {
if (!r[nameCol])
return false; // skip empty
const key = `${r[nameCol]}|${r[gidCol]}`;
if (seen.has(key))
return false;
seen.add(key);
return true;
});
// Select columns
const columns = complete
? ['NAME_0', 'GID_0', 'NAME_1', 'GID_1', 'NAME_2', 'GID_2', 'NAME_3', 'GID_3', 'NAME_4', 'GID_4', 'NAME_5', 'GID_5']
.filter((_, i) => Math.floor(i / 2) <= contentLevel)
: [nameCol, gidCol];
const rows = complete ? subDf : subDf.map(r => {
const out = {};
for (const c of columns)
out[c] = r[c] ?? '';
return out;
});
return { rows, level: contentLevel, columns };
}
// No name/admin — return world-level data
contentLevel = contentLevel === -1 ? 0 : contentLevel;
const nameCol = `NAME_${contentLevel}`;
const gidCol = `GID_${contentLevel}`;
const seen = new Set();
const rows = db.filter(r => {
if (!r[nameCol])
return false;
const key = `${r[nameCol]}|${r[gidCol]}`;
if (seen.has(key))
return false;
seen.add(key);
return true;
});
const columns = [nameCol, gidCol];
const filtered = rows.map(r => {
const out = {};
for (const c of columns)
out[c] = r[c] ?? '';
return out;
});
return { rows: filtered, level: contentLevel, columns };
}
// ---------- internal helpers ----------
function caseEqual(a, b) {
if (!a)
return false;
return a.toLowerCase() === b.toLowerCase();
}
function capitalize(s) {
return s.charAt(0).toUpperCase() + s.slice(1);
}
/** Find which level (0-5) contains the given id */
function findLevel(db, colPrefix, id) {
const idLower = id.toLowerCase();
for (let level = 0; level < 6; level++) {
const col = `${colPrefix}${level}`;
if (db.some(r => r[col]?.toLowerCase() === idLower)) {
return level;
}
}
return -1;
}
/** Collect all unique ids across all levels for fuzzy matching */
function collectAllIds(db, colPrefix) {
const ids = new Set();
for (let level = 0; level < 6; level++) {
const col = `${colPrefix}${level}`;
for (const r of db) {
if (r[col])
ids.add(r[col].toLowerCase());
}
}
return [...ids];
}
/** Find the maximum level that has non-empty data */
function findMaxLevel(rows) {
for (let level = 5; level >= 0; level--) {
const col = `GID_${level}`;
if (rows.some(r => r[col] && r[col] !== '')) {
return level;
}
}
return 0;
}
//# sourceMappingURL=data:application/json;base64,{"version":3,"file":"names.js","sourceRoot":"","sources":["../src/names.ts"],"names":[],"mappings":"AAAA;;;;;GAKG;AACH,OAAO,EAAE,YAAY,EAAgB,MAAM,eAAe,CAAC;AAwB3D,gCAAgC;AAEhC,qDAAqD;AACrD,SAAS,WAAW,CAAC,CAAS,EAAE,CAAS;IACrC,MAAM,CAAC,GAAG,CAAC,CAAC,MAAM,EAAE,CAAC,GAAG,CAAC,CAAC,MAAM,CAAC;IACjC,MAAM,EAAE,GAAe,KAAK,CAAC,IAAI,CAAC,EAAE,MAAM,EAAE,CAAC,GAAG,CAAC,EAAE,EAAE,GAAG,EAAE,CAAC,KAAK,CAAC,CAAC,GAAG,CAAC,CAAC,CAAC,IAAI,CAAC,CAAC,CAAC,CAAC,CAAC;IACjF,KAAK,IAAI,CAAC,GAAG,CAAC,EAAE,CAAC,IAAI,CAAC,EAAE,CAAC,EAAE;QAAE,EAAE,CAAC,CAAC,CAAC,CAAC,CAAC,CAAC,GAAG,CAAC,CAAC;IAC1C,KAAK,IAAI,CAAC,GAAG,CAAC,EAAE,CAAC,IAAI,CAAC,EAAE,CAAC,EAAE;QAAE,EAAE,CAAC,CAAC,CAAC,CAAC,CAAC,CAAC,GAAG,CAAC,CAAC;IAC1C,KAAK,IAAI,CAAC,GAAG,CAAC,EAAE,CAAC,IAAI,CAAC,EAAE,CAAC,EAAE,EAAE,CAAC;QAC1B,KAAK,IAAI,CAAC,GAAG,CAAC,EAAE,CAAC,IAAI,CAAC,EAAE,CAAC,EAAE,EAAE,CAAC;YAC1B,EAAE,CAAC,CAAC,CAAC,CAAC,CAAC,CAAC,GAAG,CAAC,CAAC,CAAC,GAAG,CAAC,CAAC,KAAK,CAAC,CAAC,CAAC,GAAG,CAAC,CAAC;gBAC5B,CAAC,CAAC,EAAE,CAAC,CAAC,GAAG,CAAC,CAAC,CAAC,CAAC,GAAG,CAAC,CAAC;gBAClB,CAAC,CAAC,CAAC,GAAG,IAAI,CAAC,GAAG,CAAC,EAAE,CAAC,CAAC,GAAG,CAAC,CAAC,CAAC,CAAC,CAAC,EAAE,EAAE,CAAC,CAAC,CAAC,CAAC,CAAC,GAAG,CAAC,CAAC,EAAE,EAAE,CAAC,CAAC,GAAG,CAAC,CAAC,CAAC,CAAC,GAAG,CAAC,CAAC,CAAC,CAAC;QACrE,CAAC;IACL,CAAC;IACD,OAAO,EAAE,CAAC,CAAC,CAAC,CAAC,CAAC,CAAC,CAAC;AACpB,CAAC;AAED,sEAAsE;AACtE,SAAS,cAAc,CAAC,KAAa,EAAE,UAAoB,EAAE,CAAC,GAAG,CAAC;IAC9D,MAAM,CAAC,GAAG,KAAK,CAAC,WAAW,EAAE,CAAC;IAC9B,MAAM,MAAM,GAAG,UAAU,CAAC,GAAG,CAAC,CAAC,CAAC,EAAE,CAAC,CAAC,EAAE,GAAG,EAAE,CAAC,EAAE,IAAI,EAAE,WAAW,CAAC,CAAC,EAAE,CAAC,CAAC,WAAW,EAAE,CAAC,EAAE,CAAC,CAAC,CAAC;IACxF,MAAM,CAAC,IAAI,CAAC,CAAC,CAAC,EAAE,CAAC,EAAE,EAAE,CAAC,CAAC,CAAC,IAAI,GAAG,CAAC,CAAC,IAAI,CAAC,CAAC;IACvC,OAAO,MAAM,CAAC,KAAK,CAAC,CAAC,EAAE,CAAC,CAAC,CAAC,GAAG,CAAC,CAAC,CAAC,EAAE,CAAC,CAAC,CAAC,GAAG,CAAC,CAAC;AAC9C,CAAC;AAED,sCAAsC;AAEtC;;;;GAIG;AACH,MAAM,CAAC,KAAK,UAAU,QAAQ,CAAC,OAAqB,EAAE;IAClD,MAAM,EAAE,IAAI,EAAE,KAAK,EAAE,YAAY,EAAE,eAAe,GAAG,CAAC,CAAC,EAAE,QAAQ,GAAG,KAAK,EAAE,GAAG,IAAI,CAAC;IAEnF,IAAI,IAAI,IAAI,KAAK,EAAE,CAAC;QAChB,MAAM,IAAI,KAAK,CAAC,oDAAoD,CAAC,CAAC;IAC1E,CAAC;IAED,MAAM,EAAE,GAAG,MAAM,YAAY,EAAE,CAAC;IAChC,IAAI,YAAY,GAAG,eAAe,CAAC;IAEnC,IAAI,IAAI,IAAI,KAAK,EAAE,CAAC;QAChB,MAAM,MAAM,GAAG,CAAC,CAAC,IAAI,CAAC;QACtB,MAAM,EAAE,GAAG,CAAC,IAAI,IAAI,KAAK,CAAE,CAAC;QAC5B,MAAM,SAAS,GAAG,MAAM,CAAC,CAAC,CAAC,OAAO,CAAC,CAAC,CAAC,MAAM,CAAC;QAE5C,iCAAiC;QACjC,MAAM,YAAY,GAAG,SAAS,CAAC,EAAE,EAAE,SAAS,EAAE,EAAE,CAAC,CAAC;QAElD,IAAI,YAAY,KAAK,CAAC,CAAC,EAAE,CAAC;YACtB,sCAAsC;YACtC,MAAM,MAAM,GAAG,aAAa,CAAC,EAAE,EAAE,SAAS,CAAC,CAAC;YAC5C,MAAM,KAAK,GAAG,cAAc,CAAC,EAAE,EAAE,MAAM,EAAE,CAAC,CAAC,CAAC;YAC5C,MAAM,SAAS,GAAG,MAAM;gBACpB,CAAC,CAAC,KAAK,CAAC,GAAG,CAAC,CAAC,CAAC,EAAE,CAAC,UAAU,CAAC,CAAC,CAAC,CAAC;gBAC/B,CAAC,CAAC,KAAK,CAAC,GAAG,CAAC,CAAC,CAAC,EAAE,CAAC,CAAC,CAAC,WAAW,EAAE,CAAC,CAAC;YACtC,MAAM,IAAI,KAAK,CACX,kBAAkB,EAAE,yBAAyB;gBAC7C,4BAA4B,SAAS,CAAC,IAAI,CAAC,IAAI,CAAC,GAAG,CACtD,CAAC;QACN,CAAC;QAED,MAAM,KAAK,GAAG,YAAY,CAAC;QAE3B,qDAAqD;QACrD,MAAM,GAAG,GAAG,GAAG,SAAS,GAAG,KAAK,EAAE,CAAC;QACnC,IAAI,KAAK,GAAG,EAAE,CAAC,MAAM,CAAC,CAAC,CAAC,EAAE,CAAC,SAAS,CAAC,CAAC,CAAC,GAAG,CAAC,EAAE,EAAE,CAAC,CAAC,CAAC;QAElD,0CAA0C;QAC1C,MAAM,QAAQ,GAAG,YAAY,CAAC,KAAK,CAAC,CAAC;QAErC,wBAAwB;QACxB,IAAI,YAAY,KAAK,CAAC,CAAC,EAAE,CAAC;YACtB,YAAY,GAAG,KAAK,CAAC;QACzB,CAAC;aAAM,IAAI,YAAY,GAAG,KAAK,EAAE,CAAC;YAC9B,8CAA8C;YAC9C,YAAY,GAAG,KAAK,CAAC;QACzB,CAAC;QACD,IAAI,YAAY,GAAG,QAAQ,EAAE,CAAC;YAC1B,YAAY,GAAG,QAAQ,CAAC;QAC5B,CAAC;QAED,+BAA+B;QAC/B,MAAM,OAAO,GAAG,QAAQ,YAAY,EAAE,CAAC;QACvC,MAAM,MAAM,GAAG,OAAO,YAAY,EAAE,CAAC;QACrC,MAAM,IAAI,GAAG,IAAI,GAAG,EAAU,CAAC;QAC/B,KAAK,GAAG,KAAK,CAAC,MAAM,CAAC,CAAC,CAAC,EAAE;YACrB,IAAI,CAAC,CAAC,CAAC,OAAO,CAAC;gBAAE,OAAO,KAAK,CAAC,CAAC,aAAa;YAC5C,MAAM,GAAG,GAAG,GAAG,CAAC,CAAC,OAAO,CAAC,IAAI,CAAC,CAAC,MAAM,CAAC,EAAE,CAAC;YACzC,IAAI,IAAI,CAAC,GAAG,CAAC,GAAG,CAAC;gBAAE,OAAO,KAAK,CAAC;YAChC,IAAI,CAAC,GAAG,CAAC,GAAG,CAAC,CAAC;YACd,OAAO,IAAI,CAAC;QAChB,CAAC,CAAC,CAAC;QAEH,iBAAiB;QACjB,MAAM,OAAO,GAAG,QAAQ;YACpB,CAAC,CAAC,CAAC,QAAQ,EAAE,OAAO,EAAE,QAAQ,EAAE,OAAO,EAAE,QAAQ,EAAE,OAAO,EAAE,QAAQ,EAAE,OAAO,EAAE,QAAQ,EAAE,OAAO,EAAE,QAAQ,EAAE,OAAO,CAAC;iBAC/G,MAAM,CAAC,CAAC,CAAC,EAAE,CAAC,EAAE,EAAE,CAAC,IAAI,CAAC,KAAK,CAAC,CAAC,GAAG,CAAC,CAAC,IAAI,YAAY,CAAC;YACxD,CAAC,CAAC,CAAC,OAAO,EAAE,MAAM,CAAC,CAAC;QAExB,MAAM,IAAI,GAAG,QAAQ,CAAC,CAAC,CAAC,KAAK,CAAC,CAAC,CAAC,KAAK,CAAC,GAAG,CAAC,CAAC,CAAC,EAAE;YAC1C,MAAM,GAAG,GAAY,EAAE,CAAC;YACxB,KAAK,MAAM,CAAC,IAAI,OAAO;gBAAE,GAAG,CAAC,CAAC,CAAC,GAAG,CAAC,CAAC,CAAC,CAAC,IAAI,EAAE,CAAC;YAC7C,OAAO,GAAG,CAAC;QACf,CAAC,CAAC,CAAC;QAEH,OAAO,EAAE,IAAI,EAAE,KAAK,EAAE,YAAY,EAAE,OAAO,EAAE,CAAC;IAClD,CAAC;IAED,0CAA0C;IAC1C,YAAY,GAAG,YAAY,KAAK,CAAC,CAAC,CAAC,CAAC,CAAC,CAAC,CAAC,CAAC,CAAC,YAAY,CAAC;IACtD,MAAM,OAAO,GAAG,QAAQ,YAAY,EAAE,CAAC;IACvC,MAAM,MAAM,GAAG,OAAO,YAAY,EAAE,CAAC;IAErC,MAAM,IAAI,GAAG,IAAI,GAAG,EAAU,CAAC;IAC/B,MAAM,IAAI,GAAG,EAAE,CAAC,MAAM,CAAC,CAAC,CAAC,EAAE;QACvB,IAAI,CAAC,CAAC,CAAC,OAAO,CAAC;YAAE,OAAO,KAAK,CAAC;QAC9B,MAAM,GAAG,GAAG,GAAG,CAAC,CAAC,OAAO,CAAC,IAAI,CAAC,CAAC,MAAM,CAAC,EAAE,CAAC;QACzC,IAAI,IAAI,CAAC,GAAG,CAAC,GAAG,CAAC;YAAE,OAAO,KAAK,CAAC;QAChC,IAAI,CAAC,GAAG,CAAC,GAAG,CAAC,CAAC;QACd,OAAO,IAAI,CAAC;IAChB,CAAC,CAAC,CAAC;IAEH,MAAM,OAAO,GAAG,CAAC,OAAO,EAAE,MAAM,CAAC,CAAC;IAClC,MAAM,QAAQ,GAAG,IAAI,CAAC,GAAG,CAAC,CAAC,CAAC,EAAE;QAC1B,MAAM,GAAG,GAAY,EAAE,CAAC;QACxB,KAAK,MAAM,CAAC,IAAI,OAAO;YAAE,GAAG,CAAC,CAAC,CAAC,GAAG,CAAC,CAAC,CAAC,CAAC,IAAI,EAAE,CAAC;QAC7C,OAAO,GAAG,CAAC;IACf,CAAC,CAAC,CAAC;IAEH,OAAO,EAAE,IAAI,EAAE,QAAQ,EAAE,KAAK,EAAE,YAAY,EAAE,OAAO,EAAE,CAAC;AAC5D,CAAC;AAED,yCAAyC;AAEzC,SAAS,SAAS,CAAC,CAAqB,EAAE,CAAS;IAC/C,IAAI,CAAC,CAAC;QAAE,OAAO,KAAK,CAAC;IACrB,OAAO,CAAC,CAAC,WAAW,EAAE,KAAK,CAAC,CAAC,WAAW,EAAE,CAAC;AAC/C,CAAC;AAED,SAAS,UAAU,CAAC,CAAS;IACzB,OAAO,CAAC,CAAC,MAAM,CAAC,CAAC,CAAC,CAAC,WAAW,EAAE,GAAG,CAAC,CAAC,KAAK,CAAC,CAAC,CAAC,CAAC;AAClD,CAAC;AAED,mDAAmD;AACnD,SAAS,SAAS,CAAC,EAAa,EAAE,SAAiB,EAAE,EAAU;IAC3D,MAAM,OAAO,GAAG,EAAE,CAAC,WAAW,EAAE,CAAC;IACjC,KAAK,IAAI,KAAK,GAAG,CAAC,EAAE,KAAK,GAAG,CAAC,EAAE,KAAK,EAAE,EAAE,CAAC;QACrC,MAAM,GAAG,GAAG,GAAG,SAAS,GAAG,KAAK,EAAE,CAAC;QACnC,IAAI,EAAE,CAAC,IAAI,CAAC,CAAC,CAAC,EAAE,CAAC,CAAC,CAAC,GAAG,CAAC,EAAE,WAAW,EAAE,KAAK,OAAO,CAAC,EAAE,CAAC;YAClD,OAAO,KAAK,CAAC;QACjB,CAAC;IACL,CAAC;IACD,OAAO,CAAC,CAAC,CAAC;AACd,CAAC;AAED,kEAAkE;AAClE,SAAS,aAAa,CAAC,EAAa,EAAE,SAAiB;IACnD,MAAM,GAAG,GAAG,IAAI,GAAG,EAAU,CAAC;IAC9B,KAAK,IAAI,KAAK,GAAG,CAAC,EAAE,KAAK,GAAG,CAAC,EAAE,KAAK,EAAE,EAAE,CAAC;QACrC,MAAM,GAAG,GAAG,GAAG,SAAS,GAAG,KAAK,EAAE,CAAC;QACnC,KAAK,MAAM,CAAC,IAAI,EAAE,EAAE,CAAC;YACjB,IAAI,CAAC,CAAC,GAAG,CAAC;gBAAE,GAAG,CAAC,GAAG,CAAC,CAAC,CAAC,GAAG,CAAC,CAAC,WAAW,EAAE,CAAC,CAAC;QAC9C,CAAC;IACL,CAAC;IACD,OAAO,CAAC,GAAG,GAAG,CAAC,CAAC;AACpB,CAAC;AAED,qDAAqD;AACrD,SAAS,YAAY,CAAC,IAAe;IACjC,KAAK,IAAI,KAAK,GAAG,CAAC,EAAE,KAAK,IAAI,CAAC,EAAE,KAAK,EAAE,EAAE,CAAC;QACtC,MAAM,GAAG,GAAG,OAAO,KAAK,EAAE,CAAC;QAC3B,IAAI,IAAI,CAAC,IAAI,CAAC,CAAC,CAAC,EAAE,CAAC,CAAC,CAAC,GAAG,CAAC,IAAI,CAAC,CAAC,GAAG,CAAC,KAAK,EAAE,CAAC,EAAE,CAAC;YAC1C,OAAO,KAAK,CAAC;QACjB,CAAC;IACL,CAAC;IACD,OAAO,CAAC,CAAC;AACb,CAAC"}