Commit

DRILL-3071: fix memory leak in RecordBatchLoader#load
Hanifi Gunes committed May 14, 2015
1 parent 583ca4a commit f7f6efc
Showing 1 changed file with 62 additions and 52 deletions.
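Before the diff itself, a minimal, self-contained sketch (not Drill code) of the cleanup-on-failure pattern this commit introduces into RecordBatchLoader#load: new resources built inside a try are released and the original cause rethrown if construction fails partway, and leftover old resources are always released in a finally. All names here (Resource, rebuild, failMidway) are hypothetical stand-ins for illustration only.

// Minimal sketch of the pattern in this commit; all names are hypothetical.
import java.util.ArrayList;
import java.util.List;

public final class CleanupOnFailureSketch {

  /** Hypothetical stand-in for a buffer-owning object such as a ValueVector. */
  static final class Resource {
    private final String name;
    Resource(String name) { this.name = name; }
    void clear() { System.out.println("released " + name); }
  }

  /**
   * Mirrors the shape of the fixed load(): build new resources inside try,
   * clear the partially built set and rethrow on any failure, and always
   * clear leftover old resources in finally.
   */
  static List<Resource> rebuild(List<Resource> oldResources, boolean failMidway) {
    final List<Resource> fresh = new ArrayList<>();
    try {
      for (int i = 0; i < 3; i++) {
        fresh.add(new Resource("new-" + i));
        if (failMidway && i == 1) {
          throw new IllegalStateException("simulated failure while loading");
        }
      }
      return fresh;
    } catch (final Throwable cause) {
      // Release everything created so far, then pass the original cause on;
      // without this, an exception mid-loop would leak the new resources.
      for (final Resource r : fresh) {
        r.clear();
      }
      throw cause; // compiles without "throws Throwable" via Java 7 precise rethrow
    } finally {
      // Old resources not carried over must be released on every exit path.
      // (In the real method, only vectors left behind in the oldFields map remain.)
      for (final Resource r : oldResources) {
        r.clear();
      }
    }
  }

  public static void main(String[] args) {
    final List<Resource> old = new ArrayList<>();
    old.add(new Resource("old-0"));
    try {
      rebuild(old, true);
    } catch (IllegalStateException expected) {
      System.out.println("caught: " + expected.getMessage());
    }
  }
}

The full diff follows.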
@@ -34,18 +34,19 @@
 
 import com.google.common.base.Preconditions;
 import com.google.common.collect.Maps;
+import org.slf4j.Logger;
+import org.slf4j.LoggerFactory;
 
 public class RecordBatchLoader implements VectorAccessible, Iterable<VectorWrapper<?>>{
-  static final org.slf4j.Logger logger = org.slf4j.LoggerFactory.getLogger(RecordBatchLoader.class);
+  private final static Logger logger = LoggerFactory.getLogger(RecordBatchLoader.class);
 
-  private VectorContainer container = new VectorContainer();
   private final BufferAllocator allocator;
+  private VectorContainer container = new VectorContainer();
   private int valueCount;
   private BatchSchema schema;
 
   public RecordBatchLoader(BufferAllocator allocator) {
-    super();
-    this.allocator = allocator;
+    this.allocator = Preconditions.checkNotNull(allocator);
   }
 
   /**
@@ -60,66 +61,75 @@ public RecordBatchLoader(BufferAllocator allocator) {
    * TODO: Clean: DRILL-2933 load(...) never actually throws SchemaChangeException.
    */
   public boolean load(RecordBatchDef def, DrillBuf buf) throws SchemaChangeException {
-//    logger.debug("Loading record batch with def {} and data {}", def, buf);
+    if (logger.isTraceEnabled()) {
+      logger.trace("Loading record batch with def {} and data {}", def, buf);
+      logger.trace("Load, ThreadID: {}", Thread.currentThread().getId(), new RuntimeException("For Stack Trace Only"));
+    }
     container.zeroVectors();
-    this.valueCount = def.getRecordCount();
+    valueCount = def.getRecordCount();
     boolean schemaChanged = schema == null;
-//    logger.info("Load, ThreadID: {}", Thread.currentThread().getId(), new RuntimeException("For Stack Trace Only"));
-//    System.out.println("Load, ThreadId: " + Thread.currentThread().getId());
-    Map<MaterializedField, ValueVector> oldFields = Maps.newHashMap();
-    for(VectorWrapper<?> w : container){
-      ValueVector v = w.getValueVector();
-      oldFields.put(v.getField(), v);
-    }
 
-    VectorContainer newVectors = new VectorContainer();
+    final Map<MaterializedField, ValueVector> oldFields = Maps.newHashMap();
+    for (final VectorWrapper wrapper : container) {
+      final ValueVector vector = wrapper.getValueVector();
+      oldFields.put(vector.getField(), vector);
+    }
 
-    List<SerializedField> fields = def.getFieldList();
-
-    int bufOffset = 0;
-    for (SerializedField fmd : fields) {
-      MaterializedField fieldDef = MaterializedField.create(fmd);
-      ValueVector vector = oldFields.remove(fieldDef);
-
-      if (vector == null) {
-        schemaChanged = true;
-        vector = TypeHelper.getNewVector(fieldDef, allocator);
-      } else if (!vector.getField().getType().equals(fieldDef.getType())) {
-        // clear previous vector
-        vector.clear();
-        schemaChanged = true;
-        vector = TypeHelper.getNewVector(fieldDef, allocator);
-      }
-
-      if (fmd.getValueCount() == 0 && (!fmd.hasGroupCount() || fmd.getGroupCount() == 0)) {
-        AllocationHelper.allocate(vector, 0, 0, 0);
-      } else {
-        vector.load(fmd, buf.slice(bufOffset, fmd.getBufferLength()));
-      }
-      bufOffset += fmd.getBufferLength();
-      newVectors.add(vector);
-    }
-
-    Preconditions.checkArgument(buf == null || bufOffset == buf.capacity());
-
-    if(!oldFields.isEmpty()){
-      schemaChanged = true;
-      for(ValueVector v : oldFields.values()){
-        v.close();
-      }
-    }
-
-    // rebuild the schema.
-    SchemaBuilder b = BatchSchema.newBuilder();
-    for(VectorWrapper<?> v : newVectors){
-      b.addField(v.getField());
-    }
-    b.setSelectionVectorMode(BatchSchema.SelectionVectorMode.NONE);
-    this.schema = b.build();
-    newVectors.buildSchema(BatchSchema.SelectionVectorMode.NONE);
-    container = newVectors;
+    final VectorContainer newVectors = new VectorContainer();
+    try {
+      final List<SerializedField> fields = def.getFieldList();
+      int bufOffset = 0;
+      for (final SerializedField field : fields) {
+        final MaterializedField fieldDef = MaterializedField.create(field);
+        ValueVector vector = oldFields.remove(fieldDef);
+
+        if (vector == null) {
+          schemaChanged = true;
+          vector = TypeHelper.getNewVector(fieldDef, allocator);
+        } else if (!vector.getField().getType().equals(fieldDef.getType())) {
+          // clear previous vector
+          vector.clear();
+          schemaChanged = true;
+          vector = TypeHelper.getNewVector(fieldDef, allocator);
+        }
+
+        if (field.getValueCount() == 0 && (!field.hasGroupCount() || field.getGroupCount() == 0)) {
+          AllocationHelper.allocate(vector, 0, 0, 0);
+        } else {
+          vector.load(field, buf.slice(bufOffset, field.getBufferLength()));
+        }
+        bufOffset += field.getBufferLength();
+        newVectors.add(vector);
+      }
+
+      Preconditions.checkArgument(buf == null || bufOffset == buf.capacity());
+
+      // rebuild the schema.
+      final SchemaBuilder builder = BatchSchema.newBuilder();
+      for (VectorWrapper<?> v : newVectors) {
+        builder.addField(v.getField());
+      }
+      builder.setSelectionVectorMode(BatchSchema.SelectionVectorMode.NONE);
+      schema = builder.build();
+      newVectors.buildSchema(BatchSchema.SelectionVectorMode.NONE);
+      container = newVectors;
+    } catch (final Throwable cause) {
+      // We have to clean up new vectors created here and pass over the actual cause. It is upper layer who should
+      // adjudicate to call upper layer specific clean up logic.
+      for (final VectorWrapper wrapper:newVectors) {
+        wrapper.getValueVector().clear();
+      }
+      throw cause;
+    } finally {
+      if (!oldFields.isEmpty()) {
+        schemaChanged = true;
+        for (final ValueVector vector:oldFields.values()) {
+          vector.clear();
+        }
+      }
+    }
     return schemaChanged;
-
   }
 
   public TypedFieldId getValueVectorId(SchemaPath path) {
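Why this fixes the leak: previously, an exception thrown mid-load (for example from vector.load or the Preconditions.checkArgument buffer-length check) abandoned the partially populated newVectors container and skipped the close() loop over leftover old vectors, so their buffers were never released. After this change, the catch block clears every vector already added to newVectors and rethrows the original cause for the caller to handle, while the finally block clears any old vectors that were not carried over, on every exit path. One language note: "throw cause" compiles even though load() declares only SchemaChangeException, because Java 7's precise-rethrow analysis applies to the final catch parameter.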
