/
BuildDocumentClassifier.java
71 lines (61 loc) · 3.75 KB
/
BuildDocumentClassifier.java
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
// Copyright (c) Microsoft Corporation. All rights reserved.
// Licensed under the MIT License.
package com.azure.ai.formrecognizer.administration;
import com.azure.ai.formrecognizer.documentanalysis.administration.DocumentModelAdministrationClient;
import com.azure.ai.formrecognizer.documentanalysis.administration.DocumentModelAdministrationClientBuilder;
import com.azure.ai.formrecognizer.documentanalysis.administration.models.BlobContentSource;
import com.azure.ai.formrecognizer.documentanalysis.administration.models.ClassifierDocumentTypeDetails;
import com.azure.ai.formrecognizer.documentanalysis.administration.models.DocumentClassifierDetails;
import com.azure.ai.formrecognizer.documentanalysis.models.OperationResult;
import com.azure.ai.formrecognizer.documentanalysis.administration.models.ContentSource;
import com.azure.core.credential.AzureKeyCredential;
import com.azure.core.util.polling.SyncPoller;
import java.util.HashMap;
/**
* Sample to build a classifier model with training data.
* For instructions on setting up documents for training in an Azure Storage Blob Container, see
* <a href="https://aka.ms/azsdk/formrecognizer/buildclassifiermodel">here</a>.
* <p>
* For this sample, you can use the training documents found in
* <a href="https://aka.ms/azsdk/formrecognizer/sampletrainingfiles">here</a>
* to create your own custom document analysis models.
* For instructions to create a label file for your training forms, please see:
* <a href="https://aka.ms/azsdk/formrecognizer/labelingtool">here</a>.
* <p>
* Further, see AnalyzeDocumentWithClassifier.java to analyze a document with your custom classifer built model.
*/
public class BuildDocumentClassifier {
/**
* Main method to invoke this demo.
*
* @param args Unused arguments to the program.
*/
public static void main(String[] args) {
// Instantiate a client that will be used to call the service.
DocumentModelAdministrationClient client = new DocumentModelAdministrationClientBuilder()
.credential(new AzureKeyCredential("{key}"))
.endpoint("https://{endpoint}.cognitiveservices.azure.com/")
.buildClient();
// Build custom classifier document model
String blobContainerUrl1040D = "{SAS_URL_of_your_container_in_blob_storage}";
String blobContainerUrl1040A = "{SAS_URL_of_your_container_in_blob_storage}";
ContentSource sourceA = new BlobContentSource(blobContainerUrl1040D);
ContentSource sourceB = new BlobContentSource(blobContainerUrl1040A);
HashMap<String, ClassifierDocumentTypeDetails> docTypes = new HashMap<>();
docTypes.put("1040-D", new ClassifierDocumentTypeDetails(sourceA));
docTypes.put("1040-A", new ClassifierDocumentTypeDetails(sourceB));
SyncPoller<OperationResult, DocumentClassifierDetails> buildOperationPoller
= client.beginBuildDocumentClassifier(docTypes);
DocumentClassifierDetails documentClassifierDetails = buildOperationPoller.getFinalResult();
System.out.printf("Classifier ID: %s%n", documentClassifierDetails.getClassifierId());
System.out.printf("Classifier description: %s%n", documentClassifierDetails.getDescription());
System.out.printf("Classifier created on: %s%n", documentClassifierDetails.getCreatedOn());
System.out.printf("Classifier expires on: %s%n", documentClassifierDetails.getExpiresOn());
documentClassifierDetails.getDocumentTypes().forEach((key, documentTypeDetails) -> {
if (documentTypeDetails.getContentSource() instanceof BlobContentSource) {
System.out.printf("Blob Source container Url: %s", ((BlobContentSource) documentTypeDetails
.getContentSource()).getContainerUrl());
}
});
}
}