I'm writing a large file with node.js using a writable stream:
var fs = require('fs');
var stream = fs.createWriteStream('someFile.txt', { flags: 'w' });

var lines;
while (lines = getLines()) {
    for (var i = 0; i < lines.length; i++) {
        stream.write(lines[i]);
    }
}
I'm wondering if this scheme is safe without using the drain event? If it is not (which I think is the case), what is the pattern for writing arbitrarily large amounts of data to a file?
That's how I finally did it. The idea is to create a readable stream that implements the ReadStream interface and then use the pipe() method to pipe the data into the writable stream.
var fs = require('fs');
var writeStream = fs.createWriteStream('someFile.txt', { flags: 'w' });
var readStream = new MyReadStream();

readStream.pipe(writeStream);
writeStream.on('close', function () {
    console.log('All done!');
});
An example of such a MyReadStream class can be taken from the mongoose QueryStream.
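For illustration only, here is a minimal sketch of what such a class could look like using the built-in stream.Readable base class; the names MyReadStream and getLines are assumptions carried over from the question, not an existing API:

var Readable = require('stream').Readable;
var util = require('util');

// Hypothetical readable stream that feeds lines from getLines(), which is
// assumed to return a falsy value once there is no more data.
function MyReadStream(options) {
    Readable.call(this, options);
}
util.inherits(MyReadStream, Readable);

// _read() is called by the stream machinery whenever it wants more data;
// push(null) signals end-of-stream.
MyReadStream.prototype._read = function () {
    var lines = getLines();
    if (!lines) {
        this.push(null);
        return;
    }
    for (var i = 0; i < lines.length; i++) {
        this.push(lines[i]);
    }
};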
The idea behind drain is that you would use it to test here:
var fs = require('fs');
var stream = fs.createWriteStream('someFile.txt', { flags: 'w' });

var lines;
while (lines = getLines()) {
    for (var i = 0; i < lines.length; i++) {
        stream.write(lines[i]); // <-- the place to test
    }
}
which you are not doing. So you would need to rearchitect it to make it "reentrant".
var fs = require('fs');
var stream = fs.createWriteStream('someFile.txt', { flags: 'w' });

var lines;
while (lines = getLines()) {
    for (var i = 0; i < lines.length; i++) {
        var written = stream.write(lines[i]); // <-- the place to test
        if (!written) {
            // do something here to wait till you can safely write again
            // this means prepare a buffer and wait till you can come back to finish
            //   lines[i] -> remainder
        }
    }
}
However, does this mean that you need to keep buffering getLines as well while you wait?
var fs = require('fs');
var stream = fs.createWriteStream('someFile.txt', { flags: 'w' });

var lines;
var buffer = { remainingLines: [] };

while (lines = getLines()) {
    for (var i = 0; i < lines.length; i++) {
        var written = stream.write(lines[i]); // <-- the place to test
        if (!written) {
            // the chunk was still buffered, but the internal buffer is full,
            // so keep the rest and wait for 'drain' before writing again
            buffer.remainingLines = lines.slice(i + 1);
            break; // notice there's no way to re-run this once we leave here
        }
    }
}

stream.on('drain', function () {
    if (buffer.remainingLines.length) {
        for (var i = 0; i < buffer.remainingLines.length; i++) {
            var written = stream.write(buffer.remainingLines[i]);
            if (!written) {
                // still over the high-water mark: keep what is left and
                // wait for the next 'drain'
                buffer.remainingLines = buffer.remainingLines.slice(i + 1);
                break;
            }
        }
    }
});
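For comparison, the same back-pressure idea can be written more compactly on current Node.js versions. This is only a sketch, assuming the same hypothetical getLines() helper from the question: it checks the return value of write() and waits for a single 'drain' event whenever the internal buffer is full.

const fs = require('fs');
const { once } = require('events');

async function writeAllLines() {
    const stream = fs.createWriteStream('someFile.txt', { flags: 'w' });
    let lines;
    while ((lines = getLines())) {
        for (const line of lines) {
            if (!stream.write(line)) {
                // back-pressure: the chunk was accepted but buffered, so wait
                // until the internal buffer has drained before writing more
                await once(stream, 'drain');
            }
        }
    }
    stream.end();
    await once(stream, 'finish');
}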