Skip to content

Commit

Permalink
Merge pull request #62 from farthur/master
Browse files (browse the repository at this point in the history)
Debug the Dummifier transform and add a seq_len parameter to the BERT model
  • Loading branch information
farthur committed Oct 7, 2020
2 parents a876d32 + 14240ca commit baf644f
Show file tree
Hide file tree
Showing 2 changed files with 2 additions and 1 deletion.
2 changes: 1 addition & 1 deletion melusine/models/train.py
Original file line number Diff line number Diff line change
Expand Up @@ -422,7 +422,7 @@ def _prepare_bert_sequences(self, X):
else:
sequence = X["clean_text"].values.tolist()
seqs = self.tokenizer.batch_encode_plus(
- sequence, max_length=100, pad_to_max_length=True
+ sequence, max_length=self.seq_size, pad_to_max_length=True
)

return (
Expand Down
1 change: 1 addition & 0 deletions melusine/prepare_email/metadata_engineering.py
Original file line number Diff line number Diff line change
Expand Up @@ -246,4 +246,5 @@ def transform(self, X, y=None):
X_ = X_.T.reindex(self.dummy_features).T.fillna(0)
return X_[self.dummy_features].to_dict(orient="records")[0]
else:
+ X_ = X_.T.reindex(self.dummy_features).T.fillna(0)
return X_[self.dummy_features]

0 comments on commit baf644f

Please sign in to comment.