summaryrefslogtreecommitdiff
path: root/src/tools/analysis/core.ts
blob: 20e5fa6c5167c03e2aa72e5e23fe8215326c85bb (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
const bayes = require('./naive-bayes.js');

const MeCab = require('./mecab');
import Post from '../../api/models/post';

/**
 * Learns from posts whose category has been verified and predicts the
 * category of a given post text.
 *
 * `init()` must be awaited before `predict()` is used.
 */
export default class Categorizer {
	private classifier: any;
	private mecab: any;

	constructor() {
		this.mecab = new MeCab();

		// The tokenizer is handed to the classifier as a bare callback, so it
		// has to be bound to keep access to `this.mecab`.
		this.tokenizer = this.tokenizer.bind(this);
	}

	/**
	 * Splits text into the tokens used as classifier features.
	 *
	 * Each entry returned by `mecab.parseSync` is treated as an indexable
	 * record: index 1 is compared against '名詞' (noun) and index 0 is the
	 * value that is kept.
	 *
	 * @param text Text to tokenize.
	 * @returns The index-0 values of all entries tagged as nouns.
	 */
	private tokenizer(text: string) {
		const tokens = this.mecab.parseSync(text)
			// Restrict to nouns only
			.filter(token => token[1] === '名詞')
			// Extract the token itself
			.map(token => token[0]);

		return tokens;
	}

	/**
	 * Builds a classifier and trains it on every post whose category has
	 * been verified (`is_category_verified: true`).
	 *
	 * The classifier is published on the instance only after training has
	 * completed, so `predict()` never observes a half-trained classifier and
	 * a failed fetch leaves a previously trained classifier untouched.
	 */
	public async init() {
		const classifier = bayes({
			tokenizer: this.tokenizer
		});

		// Fetch the training data
		const verifiedPosts = await Post.find({
			is_category_verified: true
		});

		// Train
		verifiedPosts.forEach(post => {
			// The tokenizer only accepts strings; skip posts without text
			if (typeof post.text !== 'string') return;

			classifier.learn(post.text, post.category);
		});

		this.classifier = classifier;
	}

	/**
	 * Predicts the category of the given text.
	 *
	 * @param text Text to categorize.
	 * @returns Whatever the classifier's `categorize` yields for the text.
	 * @throws Error if `init()` has not completed yet.
	 */
	public async predict(text) {
		if (this.classifier == null) {
			throw new Error('Categorizer is not initialized; call init() first');
		}

		return this.classifier.categorize(text);
	}
}