Skip to content

Commit

Permalink
scripts and config (#389)
Browse files (browse the repository at this point in the history)
  • Loading branch information
Eric8932 committed Aug 24, 2023
1 parent a68c3b3 commit d9cbbae
Show file tree
Hide file tree
Showing 10 changed files with 18 additions and 15 deletions.
3 changes: 2 additions & 1 deletion models/sbert/base_config.json
Original file line number Diff line number Diff line change
Expand Up @@ -29,7 +29,8 @@
"mask": "fully_visible"
},

- "embedding": "dual",
+ "dropout": 0.1,
+ "embedding": ["dual"],
"encoder": "dual",
"pooling": "first",
"tie_weights": true
Expand Down
3 changes: 2 additions & 1 deletion models/sbert/large_config.json
Original file line number Diff line number Diff line change
Expand Up @@ -29,7 +29,8 @@
"mask": "fully_visible"
},

- "embedding": "dual",
+ "dropout": 0.1,
+ "embedding": ["dual"],
"encoder": "dual",
"pooling": "first",
"tie_weights": true
Expand Down
3 changes: 2 additions & 1 deletion models/sbert/lstm_config.json
Original file line number Diff line number Diff line change
Expand Up @@ -19,7 +19,8 @@
"encoder": "lstm"
},

- "embedding": "dual",
+ "dropout": 0.1,
+ "embedding":["dual"],
"encoder": "dual",
"pooling": "mean",
"tie_weights": true
Expand Down
4 changes: 2 additions & 2 deletions scripts/convert_albert_from_huggingface_to_uer.py
Original file line number Diff line number Diff line change
Expand Up @@ -72,7 +72,7 @@
output_model["target.mlm.linear_1.bias"] = input_model["predictions.dense.bias"]
output_model["target.mlm.linear_2.weight"] = input_model["predictions.decoder.weight"]
output_model["target.mlm.linear_2.bias"] = input_model["predictions.bias"]
- output_model["target.layer_norm.gamma"] = input_model["predictions.LayerNorm.weight"]
- output_model["target.layer_norm.beta"] = input_model["predictions.LayerNorm.bias"]
+ output_model["target.mlm.layer_norm.gamma"] = input_model["predictions.LayerNorm.weight"]
+ output_model["target.mlm.layer_norm.beta"] = input_model["predictions.LayerNorm.bias"]

torch.save(output_model, args.output_model_path)
4 changes: 2 additions & 2 deletions scripts/convert_albert_from_original_tf_to_uer.py
Original file line number Diff line number Diff line change
Expand Up @@ -88,8 +88,8 @@ def main():
output_model["target.sp.linear_2.bias"] = input_model["cls/seq_relationship/output_bias"]
output_model["target.mlm.linear_1.weight"] = input_model["cls/predictions/transform/dense/kernel"]
output_model["target.mlm.linear_1.bias"] = input_model["cls/predictions/transform/dense/bias"]
- output_model["target.layer_norm.gamma"] = input_model["cls/predictions/transform/LayerNorm/gamma"]
- output_model["target.layer_norm.beta"] = input_model["cls/predictions/transform/LayerNorm/beta"]
+ output_model["target.mlm.layer_norm.gamma"] = input_model["cls/predictions/transform/LayerNorm/gamma"]
+ output_model["target.mlm.layer_norm.beta"] = input_model["cls/predictions/transform/LayerNorm/beta"]
output_model["target.mlm.linear_2.weight"] = input_model["bert/embeddings/word_embeddings"]
output_model["target.mlm.linear_2.bias"] = input_model["cls/predictions/output_bias"]

Expand Down
4 changes: 2 additions & 2 deletions scripts/convert_albert_from_uer_to_huggingface.py
Original file line number Diff line number Diff line change
Expand Up @@ -67,8 +67,8 @@
output_model["sop_classifier.classifier.bias"] = input_model["target.sp.linear_2.bias"]
output_model["predictions.dense.weight"] = input_model["target.mlm.linear_1.weight"]
output_model["predictions.dense.bias"] = input_model["target.mlm.linear_1.bias"]
- output_model["predictions.LayerNorm.weight"] = input_model["target.layer_norm.gamma"]
- output_model["predictions.LayerNorm.bias"] = input_model["target.layer_norm.beta"]
+ output_model["predictions.LayerNorm.weight"] = input_model["target.mlm.layer_norm.gamma"]
+ output_model["predictions.LayerNorm.bias"] = input_model["target.mlm.layer_norm.beta"]
output_model["predictions.decoder.weight"] = input_model["target.mlm.linear_2.weight"]
output_model["predictions.decoder.bias"] = input_model["target.mlm.linear_2.bias"]
output_model["predictions.bias"] = input_model["target.mlm.linear_2.bias"]
Expand Down
4 changes: 2 additions & 2 deletions scripts/convert_albert_from_uer_to_original_tf.py
Original file line number Diff line number Diff line change
Expand Up @@ -81,8 +81,8 @@ def main():
output_model["cls/seq_relationship/output_bias"] = input_model["target.sp.linear_2.bias"]
output_model["cls/predictions/transform/dense/kernel"] = input_model["target.mlm.linear_1.weight"]
output_model["cls/predictions/transform/dense/bias"] = input_model["target.mlm.linear_1.bias"]
- output_model["cls/predictions/transform/LayerNorm/gamma"] = input_model["target.layer_norm.gamma"]
- output_model["cls/predictions/transform/LayerNorm/beta"] = input_model["target.layer_norm.beta"]
+ output_model["cls/predictions/transform/LayerNorm/gamma"] = input_model["target.mlm.layer_norm.gamma"]
+ output_model["cls/predictions/transform/LayerNorm/beta"] = input_model["target.mlm.layer_norm.beta"]
output_model["bert/embeddings/word_embeddings"] = input_model["target.mlm.linear_2.weight"]
output_model["cls/predictions/output_bias"] = input_model["target.mlm.linear_2.bias"]

Expand Down
2 changes: 1 addition & 1 deletion scripts/extract_embeddings.py
Original file line number Diff line number Diff line change
Expand Up @@ -40,7 +40,7 @@
vocab.load(args.vocab_path)

pretrained_model = torch.load(args.load_model_path)
- embedding = pretrained_model["embedding.word_embedding.weight"]
+ embedding = pretrained_model["embedding.word.embedding.weight"]

with open(args.word_embedding_path, mode="w", encoding="utf-8") as f:
head = str(list(embedding.size())[0]) + " " + str(list(embedding.size())[1]) + "\n"
Expand Down
2 changes: 1 addition & 1 deletion scripts/topn_words_indep.py
Original file line number Diff line number Diff line change
Expand Up @@ -39,7 +39,7 @@
vocab.load(args.vocab_path)

pretrained_model = torch.load(args.load_model_path)
- embedding = pretrained_model["embedding.word_embedding.weight"]
+ embedding = pretrained_model["embedding.word.embedding.weight"]

with open(args.test_path, mode="r", encoding="utf-8") as f:
for line in f:
Expand Down
4 changes: 2 additions & 2 deletions uer/models/model.py
Original file line number Diff line number Diff line change
Expand Up @@ -21,10 +21,10 @@ def __init__(self, args, embedding, encoder, tgt_embedding, decoder, target):

if "mlm" in args.target and args.tie_weights:
self.target.mlm.linear_2.weight = self.embedding.word.embedding.weight
- elif "lm" in args.target and args.tie_weights and self.tgt_embedding is not None and "word" in self.tgt_embedding.embedding_name_list:
- self.target.lm.output_layer.weight = self.tgt_embedding.word.embedding.weight
elif "lm" in args.target and args.tie_weights and "word" in self.embedding.embedding_name_list:
self.target.lm.output_layer.weight = self.embedding.word.embedding.weight
+ elif "lm" in args.target and args.tie_weights and "word" in self.tgt_embedding.embedding_name_list:
+ self.target.lm.output_layer.weight = self.tgt_embedding.word.embedding.weight

if self.decoder is not None and args.share_embedding:
self.tgt_embedding.word.embedding.weight = self.embedding.word.embedding.weight
Expand Down

0 comments on commit d9cbbae

Please sign in to comment.