Skip to content

Commit

Permalink
Fix for bug that causes memory overrun and adds more rows than it should
Browse files Browse the repository at this point in the history
  • Loading branch information
Arnab Gupta committed Jun 10, 2020
1 parent 641cdbc commit caec575
Show file tree
Hide file tree
Showing 2 changed files with 10 additions and 6 deletions.
12 changes: 9 additions & 3 deletions lib/writer.js
Original file line number Diff line number Diff line change
Expand Up @@ -94,8 +94,11 @@ class ParquetWriter {
parquet_shredder.shredRecord(this.schema, row, this.rowBuffer);

if (this.rowBuffer.rowCount >= this.rowGroupSize) {
await this.envelopeWriter.writeRowGroup(this.rowBuffer);
let to_write = this.rowBuffer;
let rowCount = this.rowBuffer.rowCount;
this.rowBuffer = {};
to_write.rowCount = rowCount;
await this.envelopeWriter.writeRowGroup(to_write);
}
}

Expand All @@ -112,9 +115,12 @@ class ParquetWriter {

this.closed = true;

if (this.rowBuffer.rowCount > 0 || this.rowBuffer.rowCount >= this.rowGroupSize) {
await this.envelopeWriter.writeRowGroup(this.rowBuffer);
if (this.rowBuffer.rowCount > 0) {
let to_write = this.rowBuffer;
let rowCount = this.rowBuffer.rowCount;
this.rowBuffer = {};
to_write.rowCount = rowCount;
await this.envelopeWriter.writeRowGroup(to_write);
}

await this.envelopeWriter.writeFooter(this.userMetadata);
Expand Down
4 changes: 1 addition & 3 deletions test/integration.js
Original file line number Diff line number Diff line change
Expand Up @@ -105,9 +105,7 @@ async function writeTestFile(opts) {

let rows = mkTestRows(opts);

for (let row of rows) {
await writer.appendRow(row);
}
rows.forEach(async row => await writer.appendRow(row));

await writer.close();
}
Expand Down

0 comments on commit caec575

Please sign in to comment.