更新MS_OUTPUT_SIZE

nl8590687 · Oct 22, 2020 · 024dbcc
1 parent 053c990
commit 024dbcc
Show file tree

Hide file tree

Showing 11 changed files with 21 additions and 21 deletions.
diff --git a/SpeechModel24.py b/SpeechModel24.py
@@ -28,9 +28,9 @@ class ModelSpeech(): # 语音模型类
 	def __init__(self, datapath):
 		'''
 		初始化
-		默认输出的拼音的表示大小是1424，即1423个拼音+1个空白块
+		默认输出的拼音的表示大小是1428，即1427个拼音+1个空白块
 		'''
-		MS_OUTPUT_SIZE = 1424
+		MS_OUTPUT_SIZE = 1428
 		self.MS_OUTPUT_SIZE = MS_OUTPUT_SIZE # 神经网络最终输出的每一个字符向量维度的大小
 		#self.BATCH_SIZE = BATCH_SIZE # 一次训练的batch
 		self.label_max_string_length = 64

diff --git a/SpeechModel25.py b/SpeechModel25.py
@@ -28,9 +28,9 @@ class ModelSpeech(): # 语音模型类
 	def __init__(self, datapath):
 		'''
 		初始化
-		默认输出的拼音的表示大小是1424，即1423个拼音+1个空白块
+		默认输出的拼音的表示大小是1428，即1427个拼音+1个空白块
 		'''
-		MS_OUTPUT_SIZE = 1424
+		MS_OUTPUT_SIZE = 1428
 		self.MS_OUTPUT_SIZE = MS_OUTPUT_SIZE # 神经网络最终输出的每一个字符向量维度的大小
 		#self.BATCH_SIZE = BATCH_SIZE # 一次训练的batch
 		self.label_max_string_length = 64

diff --git a/SpeechModel251.py b/SpeechModel251.py
@@ -33,9 +33,9 @@ class ModelSpeech(): # 语音模型类
 	def __init__(self, datapath):
 		'''
 		初始化
-		默认输出的拼音的表示大小是1424，即1423个拼音+1个空白块
+		默认输出的拼音的表示大小是1428，即1427个拼音+1个空白块
 		'''
-		MS_OUTPUT_SIZE = 1424
+		MS_OUTPUT_SIZE = 1428
 		self.MS_OUTPUT_SIZE = MS_OUTPUT_SIZE # 神经网络最终输出的每一个字符向量维度的大小
 		#self.BATCH_SIZE = BATCH_SIZE # 一次训练的batch
 		self.label_max_string_length = 64

diff --git a/SpeechModel251_limitless.py b/SpeechModel251_limitless.py
@@ -32,9 +32,9 @@ class ModelSpeech(): # 语音模型类
 	def __init__(self, datapath):
 		'''
 		初始化
-		默认输出的拼音的表示大小是1424，即1423个拼音+1个空白块
+		默认输出的拼音的表示大小是1428，即1427个拼音+1个空白块
 		'''
-		MS_OUTPUT_SIZE = 1424
+		MS_OUTPUT_SIZE = 1428
 		self.MS_OUTPUT_SIZE = MS_OUTPUT_SIZE # 神经网络最终输出的每一个字符向量维度的大小
 		#self.BATCH_SIZE = BATCH_SIZE # 一次训练的batch
 		self.label_max_string_length = 64
@@ -429,7 +429,7 @@ def model(self):
 
 
 	#ms.LoadModel(modelpath + 'm251/speech_model251_e_0_step_100000.model')
-	#ms.TrainModel(datapath, epoch = 50, batch_size = 16, save_step = 500)
+	ms.TrainModel(datapath, epoch = 50, batch_size = 16, save_step = 500)
 
 	#t1=time.time()
 	#ms.TestModel(datapath, str_dataset='train', data_count = 128, out_report = True)

diff --git a/SpeechModel251_p.py b/SpeechModel251_p.py
@@ -32,9 +32,9 @@ class ModelSpeech(): # 语音模型类
 	def __init__(self, datapath):
 		'''
 		初始化
-		默认输出的拼音的表示大小是1424，即1423个拼音+1个空白块
+		默认输出的拼音的表示大小是1428，即1427个拼音+1个空白块
 		'''
-		MS_OUTPUT_SIZE = 1424
+		MS_OUTPUT_SIZE = 1428
 		self.MS_OUTPUT_SIZE = MS_OUTPUT_SIZE # 神经网络最终输出的每一个字符向量维度的大小
 		#self.BATCH_SIZE = BATCH_SIZE # 一次训练的batch
 		self.label_max_string_length = 64

diff --git a/SpeechModel252.py b/SpeechModel252.py
@@ -31,9 +31,9 @@ class ModelSpeech(): # 语音模型类
 	def __init__(self, datapath):
 		'''
 		初始化
-		默认输出的拼音的表示大小是1424，即1423个拼音+1个空白块
+		默认输出的拼音的表示大小是1428，即1427个拼音+1个空白块
 		'''
-		MS_OUTPUT_SIZE = 1424
+		MS_OUTPUT_SIZE = 1428
 		self.MS_OUTPUT_SIZE = MS_OUTPUT_SIZE # 神经网络最终输出的每一个字符向量维度的大小
 		#self.BATCH_SIZE = BATCH_SIZE # 一次训练的batch
 		self.label_max_string_length = 64

diff --git a/SpeechModel26.py b/SpeechModel26.py
@@ -29,9 +29,9 @@ class ModelSpeech(): # 语音模型类
 	def __init__(self, datapath):
 		'''
 		初始化
-		默认输出的拼音的表示大小是1424，即1423个拼音+1个空白块
+		默认输出的拼音的表示大小是1428，即1427个拼音+1个空白块
 		'''
-		MS_OUTPUT_SIZE = 1424
+		MS_OUTPUT_SIZE = 1428
 		self.MS_OUTPUT_SIZE = MS_OUTPUT_SIZE # 神经网络最终输出的每一个字符向量维度的大小
 		#self.BATCH_SIZE = BATCH_SIZE # 一次训练的batch
 		self.label_max_string_length = 64

diff --git a/SpeechModel261.py b/SpeechModel261.py
@@ -33,9 +33,9 @@ class ModelSpeech(): # 语音模型类
 	def __init__(self, datapath):
 		'''
 		初始化
-		默认输出的拼音的表示大小是1422，即1421个拼音+1个空白块
+		默认输出的拼音的表示大小是1428，即1427个拼音+1个空白块
 		'''
-		MS_OUTPUT_SIZE = 1424
+		MS_OUTPUT_SIZE = 1428
 		self.MS_OUTPUT_SIZE = MS_OUTPUT_SIZE # 神经网络最终输出的每一个字符向量维度的大小
 		#self.BATCH_SIZE = BATCH_SIZE # 一次训练的batch
 		self.label_max_string_length = 64

diff --git a/SpeechModel261_p.py b/SpeechModel261_p.py
@@ -33,9 +33,9 @@ class ModelSpeech(): # 语音模型类
 	def __init__(self, datapath):
 		'''
 		初始化
-		默认输出的拼音的表示大小是1422，即1421个拼音+1个空白块
+		默认输出的拼音的表示大小是1428，即1427个拼音+1个空白块
 		'''
-		MS_OUTPUT_SIZE = 1424
+		MS_OUTPUT_SIZE = 1428
 		self.MS_OUTPUT_SIZE = MS_OUTPUT_SIZE # 神经网络最终输出的每一个字符向量维度的大小
 		#self.BATCH_SIZE = BATCH_SIZE # 一次训练的batch
 		self.label_max_string_length = 64

diff --git a/test_mspeech.py b/test_mspeech.py
@@ -34,7 +34,7 @@
 
 system_type = plat.system() # 由于不同的系统的文件路径表示不一样，需要进行判断
 if(system_type == 'Windows'):
-	datapath = 'E:\\语音数据集'
+	datapath = 'D:\\SpeechData'
 	modelpath = modelpath + '\\'
 elif(system_type == 'Linux'):
 	datapath = 'dataset'

diff --git a/train_mspeech.py b/train_mspeech.py
@@ -33,7 +33,7 @@
 
 system_type = plat.system() # 由于不同的系统的文件路径表示不一样，需要进行判断
 if(system_type == 'Windows'):
-	datapath = 'E:\\语音数据集'
+	datapath = 'D:\\SpeechData'
 	modelpath = modelpath + '\\'
 elif(system_type == 'Linux'):
 	datapath = 'dataset'