-
Notifications
You must be signed in to change notification settings - Fork 13k
/
MapOperator.java
91 lines (80 loc) · 3.51 KB
/
MapOperator.java
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
/*
* Licensed to the Apache Software Foundation (ASF) under one
* or more contributor license agreements. See the NOTICE file
* distributed with this work for additional information
* regarding copyright ownership. The ASF licenses this file
* to you under the Apache License, Version 2.0 (the
* "License"); you may not use this file except in compliance
* with the License. You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package org.apache.flink.api.java.operators;
import org.apache.flink.annotation.Public;
import org.apache.flink.api.common.functions.MapFunction;
import org.apache.flink.api.common.operators.Operator;
import org.apache.flink.api.common.operators.UnaryOperatorInformation;
import org.apache.flink.api.common.operators.base.MapOperatorBase;
import org.apache.flink.api.common.typeinfo.TypeInformation;
import org.apache.flink.api.java.DataSet;
/**
 * A DataSet operator that applies a user-supplied "map" function to its input and stands for the
 * data set which that function produces.
 *
 * @param <IN> The element type of the data set consumed by the operator.
 * @param <OUT> The element type of the data set created by the operator.
 * @see org.apache.flink.api.common.functions.MapFunction
 * @deprecated All Flink DataSet APIs are deprecated since Flink 1.18 and will be removed in a
 *     future Flink major version. You can still build your application in DataSet, but you should
 *     move to either the DataStream and/or Table API.
 * @see <a href="https://cwiki.apache.org/confluence/pages/viewpage.action?pageId=158866741">
 *     FLIP-131: Consolidate the user-facing Dataflow SDKs/APIs (and deprecate the DataSet
 *     API)</a>
 */
@Deprecated
@Public
public class MapOperator<IN, OUT> extends SingleInputUdfOperator<IN, OUT, MapOperator<IN, OUT>> {

    /** The map function returned by {@link #getFunction()} and handed to the translated operator. */
    protected final MapFunction<IN, OUT> function;

    /** Appended to {@code "Map at "} to form the operator name when no explicit name is set. */
    protected final String defaultName;

    /**
     * Creates a map operator over the given input.
     *
     * @param input The data set this operator consumes; forwarded to the superclass constructor.
     * @param resultType Type information of the produced elements; forwarded to the superclass
     *     constructor.
     * @param function The map function this operator wraps.
     * @param defaultName Text used to build the fallback operator name ({@code "Map at " +
     *     defaultName}).
     */
    public MapOperator(
            DataSet<IN> input,
            TypeInformation<OUT> resultType,
            MapFunction<IN, OUT> function,
            String defaultName) {
        super(input, resultType);
        this.function = function;
        this.defaultName = defaultName;
    }

    /**
     * Returns the map function this operator was constructed with.
     *
     * @return The wrapped map function.
     */
    @Override
    protected MapFunction<IN, OUT> getFunction() {
        return function;
    }

    /**
     * Builds the {@link MapOperatorBase} that corresponds to this operator and wires it to the
     * given input.
     *
     * <p>The translated operator is named after {@code getName()} when that is non-null, and
     * {@code "Map at " + defaultName} otherwise. Its parallelism is this operator's parallelism if
     * that is positive; otherwise it is taken from the input operator.
     *
     * @param input The already translated input operator.
     * @return The configured map operator.
     */
    @Override
    protected MapOperatorBase<IN, OUT, MapFunction<IN, OUT>> translateToDataFlow(
            Operator<IN> input) {
        // Prefer an explicitly set name; otherwise derive one from the default name.
        final String name;
        if (getName() != null) {
            name = getName();
        } else {
            name = "Map at " + defaultName;
        }

        // Describe the input and output types of the unary operator.
        UnaryOperatorInformation<IN, OUT> operatorInfo =
                new UnaryOperatorInformation<>(getInputType(), getResultType());

        MapOperatorBase<IN, OUT, MapFunction<IN, OUT>> mapOperator =
                new MapOperatorBase<>(function, operatorInfo, name);
        mapOperator.setInput(input);

        // Without an explicitly specified (positive) parallelism, adopt the parallelism of the
        // input operator to enable chaining.
        mapOperator.setParallelism(
                getParallelism() > 0 ? getParallelism() : input.getParallelism());

        return mapOperator;
    }
}