TransposeVertexGroupItems.java
/*
* Copyright © 2014 - 2021 Leipzig University (Database Research Group)
*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package org.gradoop.flink.model.impl.operators.grouping.functions;
import org.apache.flink.api.common.functions.GroupReduceFunction;
import org.apache.flink.api.java.functions.FunctionAnnotation;
import org.apache.flink.api.java.tuple.Tuple2;
import org.apache.flink.util.Collector;
import org.gradoop.common.model.impl.id.GradoopId;
import org.gradoop.common.model.impl.id.GradoopIdSet;
import org.gradoop.flink.model.impl.operators.grouping.tuples.LabelGroup;
import org.gradoop.flink.model.impl.operators.grouping.tuples.VertexGroupItem;
import org.gradoop.common.model.impl.properties.PropertyValueList;
import org.gradoop.flink.model.impl.tuples.IdWithIdSet;
import java.util.HashSet;
import java.util.Set;
/**
 * Takes a group of {@link VertexGroupItem} as input where each item represents
 * the same group but stores a unique super vertex id. This function creates
 * a single {@link VertexGroupItem} that represents the whole group and also
 * outputs a set containing all the super vertex ids of the incoming items.
 *
 * Example input:
 * (1,A)
 * (2,A)
 * (3,B)
 * (4,B)
 *
 * Example output:
 * ((10,A),(10,[1,2]))
 * ((20,B),(20,[3,4]))
 */
@FunctionAnnotation.ForwardedFields(
  // NOTE(review): reduce() hands a newly obtained id to createSuperVertexTuple as its
  // first argument; confirm that f0 of the input really is forwarded unchanged.
  "f0->f0.f0;" + // vertexId
  "f2->f0.f2;" + // label
  "f3->f0.f3;" + // properties
  "f6->f0.f6" // label group
)
@FunctionAnnotation.ReadFields("f4")
public class TransposeVertexGroupItems
  extends ReduceVertexGroupItemBase
  implements GroupReduceFunction<VertexGroupItem, Tuple2<VertexGroupItem, IdWithIdSet>> {
  /**
   * Output tuple, created once and reused for every call of
   * {@link #reduce(Iterable, Collector)} to reduce object instantiation.
   */
  private final Tuple2<VertexGroupItem, IdWithIdSet> reuseOuterTuple;
  /**
   * Second field of the output tuple (id with the set of collected super vertex ids),
   * created once and reused to reduce object instantiation.
   */
  private final IdWithIdSet reuseInnerTuple;

  /**
   * Creates group reduce function.
   *
   * @param useLabel true, iff labels are used for grouping
   */
  public TransposeVertexGroupItems(boolean useLabel) {
    super(useLabel);
    this.reuseOuterTuple = new Tuple2<>();
    this.reuseInnerTuple = new IdWithIdSet();
  }

  /**
   * Reduces all items of one group to a single output tuple.
   *
   * The group label, the grouping values and the label group are taken from the first
   * item of the group. For every item, its super vertex id is collected and its
   * aggregate values are aggregated into that label group. If the input contains no
   * items, nothing is emitted.
   *
   * @param vertexGroupItems items belonging to the same group
   * @param out              collector receiving at most one tuple: the item representing
   *                         the whole group and the id of that item together with the
   *                         super vertex ids of all incoming items
   * @throws Exception declared by {@link GroupReduceFunction#reduce(Iterable, Collector)}
   */
  @Override
  public void reduce(Iterable<VertexGroupItem> vertexGroupItems,
    Collector<Tuple2<VertexGroupItem, IdWithIdSet>> out)
    throws Exception {
    GradoopId superVertexId = null;
    String groupLabel = null;
    PropertyValueList groupPropertyValues = null;
    LabelGroup vertexLabelGroup = null;
    boolean isFirst = true;
    Set<GradoopId> superVertexIds = new HashSet<>();

    for (VertexGroupItem groupItem : vertexGroupItems) {
      if (isFirst) {
        // the first item determines the group description; the id obtained here
        // identifies the item that represents the whole group
        superVertexId = GradoopId.get();
        groupLabel = groupItem.getGroupLabel();
        groupPropertyValues = groupItem.getGroupingValues();
        vertexLabelGroup = groupItem.getLabelGroup();
        isFirst = false;
      }
      // store the super vertex id created in the previous combiner
      superVertexIds.add(groupItem.getSuperVertexId());
      vertexLabelGroup.aggregate(groupItem.getAggregateValues());
    }

    if (isFirst) {
      // no item was seen: there is no group to describe, and the label group is still
      // null, so building an output item would fail with a NullPointerException
      return;
    }

    reuseInnerTuple.setId(superVertexId);
    reuseInnerTuple.setIdSet(GradoopIdSet.fromExisting(superVertexIds));

    reuseOuterTuple.f0 = createSuperVertexTuple(superVertexId, groupLabel,
      groupPropertyValues, vertexLabelGroup.getAggregateValueList());
    reuseOuterTuple.f0.setSuperVertexId(superVertexId);
    reuseOuterTuple.f0.setLabelGroup(vertexLabelGroup);
    reuseOuterTuple.f1 = reuseInnerTuple;

    // the aggregate values were handed to createSuperVertexTuple above; the label group
    // is reset before the item is emitted
    // (presumably so no aggregate state leaks into later use of the label group - confirm)
    reuseOuterTuple.f0.getLabelGroup().resetAggregateValues();
    // collect single item representing the whole group
    out.collect(reuseOuterTuple);
  }
}