From 1882ef669811cebbc1d9b04a75d2ed59a3d5e67d Mon Sep 17 00:00:00 2001 From: chen <15651730270@163.com> Date: Fri, 19 Nov 2021 14:06:54 +0800 Subject: [PATCH 1/2] Update run_ner_crf.py MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit Use hyphens instead of colons (:) in the log file timestamp; a log file whose name contains a colon cannot be created on some platforms (e.g. Windows), so the logger fails to initialize. --- pytorch_version/run_ner_crf.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/pytorch_version/run_ner_crf.py b/pytorch_version/run_ner_crf.py index 7e5bdac..55fb808 100755 --- a/pytorch_version/run_ner_crf.py +++ b/pytorch_version/run_ner_crf.py @@ -375,7 +375,7 @@ def main(): args.output_dir = args.output_dir + '{}'.format(args.model_type) if not os.path.exists(args.output_dir): os.mkdir(args.output_dir) - time_ = time.strftime("%Y-%m-%d-%H:%M:%S", time.localtime()) + time_ = time.strftime("%Y-%m-%d-%H-%M-%S", time.localtime()) init_logger(log_file=args.output_dir + f'/{args.model_type}-{args.task_name}-{time_}.log') if os.path.exists(args.output_dir) and os.listdir( args.output_dir) and args.do_train and not args.overwrite_output_dir: From f5e948958b20010e765cc80f8f71c9a720c8a16e Mon Sep 17 00:00:00 2001 From: chen <15651730270@163.com> Date: Fri, 19 Nov 2021 14:07:56 +0800 Subject: [PATCH 2/2] Update utils_ner.py MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit Open the input file with an explicit UTF-8 encoding so that a train.json containing Chinese text is read correctly regardless of the platform's default encoding. --- pytorch_version/processors/utils_ner.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/pytorch_version/processors/utils_ner.py b/pytorch_version/processors/utils_ner.py index 01f024b..6ea1fb4 100755 --- a/pytorch_version/processors/utils_ner.py +++ b/pytorch_version/processors/utils_ner.py @@ -48,7 +48,7 @@ def _read_tsv(cls, input_file, quotechar=None): @classmethod def _read_text(self,input_file): lines = [] - with open(input_file,'r') as f: + with open(input_file, 'r', encoding="utf-8") as f: words = [] labels = [] for line in f: