forked from rai-project/evaluation
/
gpu_kernel_name_aggre_info.go
78 lines (67 loc) · 1.79 KB
/
gpu_kernel_name_aggre_info.go
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
package cmd
import (
"os"
"path/filepath"
"sort"
"strings"
"github.com/c3sr/evaluation"
"github.com/spf13/cobra"
)
// gpuKernelNameAggreInfoCmd implements the "name_aggre_info" subcommand. It
// fetches the selected evaluations, summarizes their GPU kernel information
// aggregated by kernel name, optionally sorts and truncates the result, and
// emits one row per entry through a Writer.
var gpuKernelNameAggreInfoCmd = &cobra.Command{
	Use:     "name_aggre_info",
	Aliases: []string{},
	Short:   "Get gpu information aggregated by name from system library traces in a database. Specify model name as `all` to list information of all the models.",
	// PreRunE fills in defaults for the database and output file, runs the
	// shared root setup, removes a pre-existing output when overwriting was
	// requested, and parses the comma-separated kernel name filter.
	PreRunE: func(cmd *cobra.Command, args []string) error {
		if databaseName == "" {
			databaseName = defaultDatabaseName["cuda_kernel"]
		}
		if err := rootSetup(); err != nil {
			return err
		}
		if modelName == "all" && outputFormat == "json" && outputFileName == "" {
			outputFileName = filepath.Join(mlArcWebAssetsPath, "cuda_kernel_launch")
		}
		if overwrite && isExists(outputFileName) {
			// Report a failed removal instead of silently continuing with
			// stale output still in place.
			if err := os.RemoveAll(outputFileName); err != nil {
				return err
			}
		}
		if kernelNameFilterString != "" {
			kernelNameFilterList = strings.Split(kernelNameFilterString, ",")
		}
		return nil
	},
	// RunE hands the per-invocation work to forallmodels.
	RunE: func(cmd *cobra.Command, args []string) error {
		run := func() error {
			evals, err := getEvaluations()
			if err != nil {
				return err
			}
			gpuKernelInfos, err := evals.SummaryGPUKernelNameAggreInformations(performanceCollection)
			if err != nil {
				return err
			}

			// A top-N request implies sorting; -1 means no limit was requested.
			if sortOutput || topKernels != -1 {
				sort.Sort(gpuKernelInfos)
			}
			// Truncate without writing back to the package-level topKernels:
			// run may be invoked repeatedly by forallmodels, and clamping the
			// shared value to a short result would shrink the limit for every
			// later invocation. Negative values never truncate, which also
			// avoids slicing with a negative bound.
			if topKernels >= 0 && topKernels < len(gpuKernelInfos) {
				gpuKernelInfos = gpuKernelInfos[:topKernels]
			}

			if len(gpuKernelInfos) == 0 {
				// Nothing to report: still create and close a writer built
				// from a zero-value summary.
				// NOTE(review): this uses SummaryGPUKernelInformation while the
				// non-empty path uses an element of the name-aggregated result;
				// confirm this is the intended type.
				writer := NewWriter(evaluation.SummaryGPUKernelInformation{})
				defer writer.Close()
				return nil
			}

			writer := NewWriter(gpuKernelInfos[0])
			defer writer.Close()
			for _, info := range gpuKernelInfos {
				writer.Row(info)
			}
			return nil
		}
		return forallmodels(run)
	},
}