-
Notifications
You must be signed in to change notification settings - Fork 376
/
TabularDataResourceFormatter.cs
155 lines (128 loc) · 6.16 KB
/
TabularDataResourceFormatter.cs
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
// Copyright(c).NET Foundation and contributors. All rights reserved.
// Licensed under the MIT license. See LICENSE file in the project root for full license information.
using System;
using System.Collections.Generic;
using System.Linq;
using System.Text.Encodings.Web;
using System.Text.Json;
using System.Text.Json.Serialization;
namespace Microsoft.DotNet.Interactive.Formatting.TabularData
{
public static class TabularDataResourceFormatter
{
// https://specs.frictionlessdata.io/table-schema/#language
public const string MimeType = "application/table-schema+json";
static TabularDataResourceFormatter()
{
JsonSerializerOptions = new JsonSerializerOptions(JsonFormatter.SerializerOptions)
{
WriteIndented = true,
NumberHandling = JsonNumberHandling.AllowReadingFromString | JsonNumberHandling.AllowNamedFloatingPointLiterals,
Encoder = JavaScriptEncoder.UnsafeRelaxedJsonEscaping,
ReferenceHandler = null,
Converters =
{
new TableSchemaFieldTypeConverter(),
new TabularDataResourceConverter(),
new DataDictionaryConverter()
}
};
}
public static JsonSerializerOptions JsonSerializerOptions { get; }
internal static ITypeFormatter[] DefaultFormatters { get; } = DefaultTabularDataFormatterSet.DefaultFormatters;
public static TabularDataResource ToTabularDataResource<T>(this IEnumerable<T> source)
{
var (schema, data) = Generate(source);
return new TabularDataResource(schema, data);
}
private static (TableSchema schema, IEnumerable<IDictionary<string, object>> data) Generate<T>(IEnumerable<T> source)
{
var fields = new Dictionary<string, TableSchemaFieldType?>();
var data = new List<IDictionary<string, object>>();
IDestructurer destructurer = default;
foreach (var item in source)
{
switch (item)
{
case IEnumerable<(string name, object value)> valueTuples:
{
var tuples = valueTuples.ToArray();
EnsureFieldsAreInitializedFromValueTuples(tuples);
var obj = new Dictionary<string, object>();
foreach (var (name, value) in tuples)
{
obj.Add(name, value);
}
data.Add(obj);
}
break;
case IEnumerable<KeyValuePair<string, object>> keyValuePairs:
{
var pairs = keyValuePairs.ToArray();
EnsureFieldsAreInitializedFromKeyValuePairs(pairs);
var obj = new Dictionary<string, object>();
foreach (var pair in pairs)
{
obj.Add(pair.Key, pair.Value);
}
data.Add(obj);
}
break;
default:
{
destructurer ??= Destructurer.GetOrCreate(item.GetType());
var dict = destructurer.Destructure(item);
EnsureFieldsAreInitializedFromKeyValuePairs(dict);
data.Add(dict);
}
break;
}
}
var schema = new TableSchema();
foreach (var field in fields)
{
schema.Fields.Add(new TableSchemaFieldDescriptor(field.Key, field.Value));
}
return (schema, data);
void EnsureFieldsAreInitializedFromKeyValuePairs(IEnumerable<KeyValuePair<string, object>> keyValuePairs)
{
foreach (var keyValuePair in keyValuePairs)
{
if (!fields.ContainsKey(keyValuePair.Key))
{
fields.Add(keyValuePair.Key, InferTableSchemaFieldTypeFromValue(keyValuePair.Value));
}
else if (InferTableSchemaFieldTypeFromValue(keyValuePair.Value) is {} type &&
type != TableSchemaFieldType.Null)
{
fields[keyValuePair.Key] = type;
}
}
}
void EnsureFieldsAreInitializedFromValueTuples(IEnumerable<(string name, object value)> valueTuples) => EnsureFieldsAreInitializedFromKeyValuePairs(valueTuples.Select(t => new KeyValuePair<string, object>(t.name, t.value)));
TableSchemaFieldType? InferTableSchemaFieldTypeFromValue(object value) =>
value switch
{
null => null,
_ => value.GetType().ToTableSchemaFieldType()
};
}
public static TableSchemaFieldType ToTableSchemaFieldType(this Type type) =>
type switch
{
{ } t when t == typeof(bool) => TableSchemaFieldType.Boolean,
{ } t when t == typeof(DateTime) => TableSchemaFieldType.DateTime,
{ } t when t == typeof(int) => TableSchemaFieldType.Integer,
{ } t when t == typeof(ushort) => TableSchemaFieldType.Integer,
{ } t when t == typeof(uint) => TableSchemaFieldType.Integer,
{ } t when t == typeof(ulong) => TableSchemaFieldType.Integer,
{ } t when t == typeof(long) => TableSchemaFieldType.Integer,
{ } t when t == typeof(float) => TableSchemaFieldType.Number,
{ } t when t == typeof(double) => TableSchemaFieldType.Number,
{ } t when t == typeof(decimal) => TableSchemaFieldType.Number,
{ } t when t == typeof(string) => TableSchemaFieldType.String,
{ } t when t == typeof(ReadOnlyMemory<char>) => TableSchemaFieldType.String,
_ => TableSchemaFieldType.Any
};
}
}