-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathindex.js
52 lines (42 loc) · 1.24 KB
/
index.js
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
const path = require('path');
const lunr = require('lunr');
const esql = require('sql-extra');
// Lazily-populated module state: both stay null until load() runs.
// `corpus` holds the record collection required from './corpus';
// `index` holds the lunr search index built over it by createIndex().
let corpus = null;
let index = null;
/**
 * Builds a lunr search index over every record currently held in `corpus`.
 *
 * Records are keyed by their `sno` field and are searchable on `sno` and
 * `state`. The stop-word filter is removed from the indexing pipeline so
 * that no term is dropped as a stop word while records are added.
 *
 * Requires `corpus` to be populated first (load() does this).
 * NOTE(review): `corpus` looks like a Map (it is used via values()/get()) — confirm.
 *
 * @returns {object} the index produced by lunr().
 */
function createIndex() {
  // lunr invokes this callback with the index builder bound to `this`,
  // so it has to stay a regular function rather than an arrow function.
  return lunr(function configure() {
    const builder = this;
    builder.ref('sno');
    builder.field('sno');
    builder.field('state');
    builder.pipeline.remove(lunr.stopWordFilter);
    for (const record of corpus.values()) {
      builder.add(record);
    }
  });
}
/**
 * Loads the corpus and builds the search index on first use.
 *
 * Later calls are no-ops that hand back the already-loaded corpus.
 *
 * @returns {object} the corpus exported by './corpus'.
 */
function load() {
  if (!corpus) {
    corpus = require('./corpus');
    // The index is derived from the corpus, so it is built right after it.
    index = createIndex();
  }
  return corpus;
}
/**
 * Gives the path of the `index.csv` file that sits next to this module.
 *
 * @returns {string} `index.csv` joined onto this module's directory.
 */
function csv() {
  const fileName = 'index.csv';
  return path.join(__dirname, fileName);
}
/**
 * Delegates to `esql.setupTable` to set up a table for the corpus records.
 *
 * The corpus is required directly here (not through load()), so calling
 * this function does not build the lunr search index.
 *
 * @param {string} [tab='samplingunits'] table name passed to setupTable.
 * @param {object} [opt={}] option overrides; merged over the defaults
 *   `{pk: 'sno', index: true, tsvector: {sno: 'A', state: 'B'}}`.
 * @returns {*} whatever `esql.setupTable` returns
 *   (presumably SQL text — confirm against sql-extra).
 */
function sql(tab='samplingunits', opt={}) {
  const columns = {sno: 'TEXT', state: 'TEXT', districts: 'INT', selected: 'INT'};
  const rows = require('./corpus').values();
  const defaults = {pk: 'sno', index: true, tsvector: {sno: 'A', state: 'B'}};
  // Caller-supplied options win over the defaults.
  const options = Object.assign(defaults, opt);
  return esql.setupTable(tab, columns, rows, options);
}
/**
 * Searches the corpus for records matching the given text.
 *
 * Every non-word character in `txt` is replaced by a space before the text
 * is handed to the lunr index. Of the hits returned, only those whose match
 * metadata has the largest number of keys are kept.
 * NOTE(review): metadata keys are presumably the matched terms — confirm
 * against the lunr docs.
 *
 * The corpus and index are loaded on demand if load() has not run yet.
 *
 * @param {string} txt free-text query.
 * @returns {Array} corpus records for the best hits, in the order the index
 *   returned them; empty when nothing matches.
 */
function samplingUnits(txt) {
  if (!corpus) load();
  const query = txt.replace(/\W/g, ' ');
  const hits = index.search(query);
  // Metadata key count per hit; computed once and reused below.
  const termCounts = hits.map((hit) => Object.keys(hit.matchData.metadata).length);
  const best = termCounts.reduce((top, count) => Math.max(top, count), 0);
  return hits
    .filter((hit, i) => termCounts[i] === best)
    .map((hit) => corpus.get(hit.ref));
}
// The search function is the module's export; the helpers are attached to
// it as properties so callers can reach them from the same import.
Object.assign(samplingUnits, {load, csv, sql});
module.exports = samplingUnits;