1.0.0 • Published 7 years ago
term-vector v1.0.0
term-vector
A Node.js module that creates a term vector from tokenized text. Use term-vector
when implementing a vector space model.
Works with Unicode!
Does ngrams!
const tokens = 'this is really really really cool'.split(' ')
// just make a simple term vector
tv(tokens)
// [
// { term: [ 'cool' ], positions: [ 5 ] },
// { term: [ 'is' ], positions: [ 1 ] },
// { term: [ 'really' ], positions: [ 2, 3, 4 ] },
// { term: [ 'this' ], positions: [ 0 ] }
// ]
// make a term vector with ngrams of length 1 and 2
tv(tokens, { ngramLengths: [ 1, 2 ] })
// [
// { term: [ 'cool' ], positions: [ 5 ] },
// { term: [ 'is' ], positions: [ 1 ] },
// { term: [ 'is', 'really' ], positions: [ 1 ] },
// { term: [ 'really' ], positions: [ 2, 3, 4 ] },
// { term: [ 'really', 'really' ], positions: [ 2, 3 ] },
// { term: [ 'really', 'cool' ], positions: [ 4 ] },
// { term: [ 'this' ], positions: [ 0 ] },
// { term: [ 'this', 'is' ], positions: [ 0 ] }
// ]
1.0.0
7 years ago
0.1.2
9 years ago
0.1.1
9 years ago
0.0.18
9 years ago
0.0.17
9 years ago
0.0.16
9 years ago
0.0.15
9 years ago
0.0.14
9 years ago
0.0.13
9 years ago
0.0.12
10 years ago
0.0.11
10 years ago
0.0.10
10 years ago
0.0.9
10 years ago
0.0.8
10 years ago
0.0.7
10 years ago
0.0.6
10 years ago
0.0.5
10 years ago
0.0.4
10 years ago
0.0.3
10 years ago
0.0.2
10 years ago
0.0.1
10 years ago