Skip to content

Commit

Permalink
training data counts
Browse files: browse the repository at this point in the history
  • Loading branch information
sonalgoyal committed Jan 2, 2022
1 parent 6d9e7fb commit 28dc52b
Showing 1 changed file with 2 additions and 0 deletions.
2 changes: 2 additions & 0 deletions core/src/main/java/zingg/Trainer.java
Original file line number | Diff line number | Diff line change
Expand Up @@ -42,6 +42,8 @@ public void execute() throws ZinggClientException {
tra = tra.cache();
positives = tra.filter(tra.col(ColName.MATCH_FLAG_COL).equalTo(ColValues.MATCH_TYPE_MATCH));
negatives = tra.filter(tra.col(ColName.MATCH_FLAG_COL).equalTo(ColValues.MATCH_TYPE_NOT_A_MATCH));
LOG.warn("Training on positive pairs - " + positives.count());
LOG.warn("Training on negative pairs - " + negatives.count());

Dataset<Row> testData = PipeUtil.read(spark, true, args.getNumPartitions(), false, args.getData());
Tree<Canopy> blockingTree = BlockingTreeUtil.createBlockingTreeFromSample(testData, positives, 0.5,
Expand Down

0 comments on commit 28dc52b

Please sign in to comment.