-
Notifications
You must be signed in to change notification settings - Fork 0
/
syllable.rb
52 lines (44 loc) · 955 Bytes
/
syllable.rb
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
# encoding: utf-8
require 'MeCab'
require 'mecab-modern'
module MeCab
class Node
  # Text of this node as it appears in the analysed input.
  #
  # @return [String] whatever +surface+ returns for this node
  def part
    surface
  end

  # Reads one column out of the comma-separated +feature+ string.
  #
  # NOTE(review): column 8 is presumably the pronunciation column of an
  # IPADIC-style dictionary -- confirm against the dictionary in use.
  #
  # @return [String, nil] the ninth field, or nil when the feature string
  #   has fewer than nine fields
  def kana
    fields = feature.split(",")
    fields[8]
  end
end
# Counts the kana units of a Japanese text by running it through MeCab and
# looking at the kana reading of every token.
#
# Each full-size katakana, the small "ッ" and the long-vowel mark "ー" count
# as one unit. The small vowels and small ya/yu/yo are dropped, so a pair
# such as "キャ" counts once.
class Syllable
  # Matches every character that is NOT counted as a unit of its own.
  # "ッ" lies inside the カ-モ range and is therefore kept.
  UNCOUNTED_CHARS = /[^アイウエオカ-モヤユヨラ-ロワヲンヴー]/

  # Placeholder that IPADIC-style dictionaries write into a feature field
  # they leave undefined.
  MISSING_FIELD = "*".freeze

  private_constant :UNCOUNTED_CHARS, :MISSING_FIELD

  # @param text [String] text to analyse; it is tokenised immediately
  def initialize(text)
    @syllables = split(text)
  end

  # @return [Integer] total number of counted kana over all tokens
  def count
    @syllables.flatten.size
  end

  private

  # Tokenises +text+ and collects the counted kana of every token.
  #
  # @param text [String]
  # @return [Array<Array<String>>] one array of single katakana per token
  def split(text)
    tagger = MeCab::Tagger.new
    syllables = []
    tagger.parseToNode(text).each do |node|
      surface = node.part
      # Nodes without a surface carry no text to count.
      next if surface.empty?

      syllables << select_syllable(reading_for(node.kana, surface))
    end
    syllables
  end

  # Picks the string the kana should be taken from.
  #
  # Falls back to the surface form when the dictionary supplies no reading,
  # i.e. the field is absent (nil) or holds the "*" placeholder. Without the
  # placeholder check a kana-only token with an undefined reading would be
  # counted as zero.
  #
  # @param kana [String, nil] reading reported by the node
  # @param surface [String] surface form of the node
  # @return [String]
  def reading_for(kana, surface)
    return surface if kana.nil? || kana == MISSING_FIELD

    kana
  end

  # Normalises +kana+ to katakana and keeps only the counted characters.
  #
  # @param kana [String] hiragana, katakana or arbitrary text
  # @return [Array<String>] one element per counted katakana
  def select_syllable(kana)
    hiragana_to_katakana(kana).gsub(UNCOUNTED_CHARS, "").split(//)
  end

  # Maps the hiragana range ぁ..ゔ onto the katakana range ァ..ヴ; every
  # other character is passed through unchanged.
  #
  # @param hiragana [String]
  # @return [String]
  def hiragana_to_katakana(hiragana)
    hiragana.tr("ぁ-ゔ", "ァ-ヴ")
  end
end
end