Javascript 使用 node.js 下载大文件避免高内存消耗

Question

提问by Carlosedp

I`m trying to create a file downloader as a background service but when a large file is scheduled, it's first put in memory and then, at the end of the download the file is written to disk.

我正在尝试创建一个文件下载器作为后台服务，但是当一个大文件被安排时，它首先被放入内存中，然后在下载结束时将文件写入磁盘。

How can I make the file be wrote gradually to the disk preserving memory considering that I may have lots of files being downloaded at the same time?

考虑到我可能同时下载很多文件，如何使文件逐渐写入磁盘保存内存？

Here's the code I`m using:

这是我正在使用的代码：

var sys = require("sys"),
    http = require("http"),
    url = require("url"),
    path = require("path"),
    fs = require("fs"),
    events = require("events");

var downloadfile = "http://nodejs.org/dist/node-v0.2.6.tar.gz";

var host = url.parse(downloadfile).hostname
var filename = url.parse(downloadfile).pathname.split("/").pop()

var theurl = http.createClient(80, host);
var requestUrl = downloadfile;
sys.puts("Downloading file: " + filename);
sys.puts("Before download request");
var request = theurl.request('GET', requestUrl, {"host": host});
request.end();

var dlprogress = 0;


setInterval(function () {
   sys.puts("Download progress: " + dlprogress + " bytes");
}, 1000);


request.addListener('response', function (response) {
    response.setEncoding('binary')
    sys.puts("File size: " + response.headers['content-length'] + " bytes.")
    var body = '';
    response.addListener('data', function (chunk) {
        dlprogress += chunk.length;
        body += chunk;
    });
    response.addListener("end", function() {
        fs.writeFileSync(filename, body, 'binary');
        sys.puts("After download finished");
    });

});

Answer 1

采纳答案by Carlosedp

I changed the callback to:

我将回调更改为：

request.addListener('response', function (response) {
        var downloadfile = fs.createWriteStream(filename, {'flags': 'a'});
        sys.puts("File size " + filename + ": " + response.headers['content-length'] + " bytes.");
        response.addListener('data', function (chunk) {
            dlprogress += chunk.length;
            downloadfile.write(chunk, encoding='binary');
        });
        response.addListener("end", function() {
            downloadfile.end();
            sys.puts("Finished downloading " + filename);
        });

    });

This worked perfectly.

这工作得很好。

Answer 2

回答by LeeGee

Take a look at http-request:

看看http-request：

// shorthand syntax, buffered response
http.get('http://localhost/get', function (err, res) {
    if (err) throw err;
    console.log(res.code, res.headers, res.buffer.toString());
});

// save the response to 'myfile.bin' with a progress callback
http.get({
    url: 'http://localhost/get',
    progress: function (current, total) {
        console.log('downloaded %d bytes from %d', current, total);
    }
}, 'myfile.bin', function (err, res) {
    if (err) throw err;
    console.log(res.code, res.headers, res.file);
});

Answer 3

回答by Carter Cole

does the request package work for your uses?

请求包是否适合您的用途？

it lets you do things like this:

它可以让你做这样的事情：

request(downloadurl).pipe(fs.createWriteStream(downloadtohere))

Answer 4

回答by Munipratap

When downloading large file please use fs.writeand not writeFileas it will override the previous content.

下载大文件时请使用fs.write而不是writeFile因为它会覆盖以前的内容。

function downloadfile(res) {
    var requestserver = http.request(options, function(r) {
        console.log('STATUS: ' + r.statusCode);
        console.log('HEADERS: ' + JSON.stringify(r.headers));

        var fd = fs.openSync('sai.tar.gz', 'w');

        r.on('data', function (chunk) {
            size += chunk.length;
            console.log(size+'bytes received');
            sendstatus(res,size);
            fs.write(fd, chunk, 0, chunk.length, null, function(er, written) {
            });
        });
        r.on('end',function(){
            console.log('\nended from server');
            fs.closeSync(fd);
            sendendstatus(res);
        });
    });
}

Answer 5

回答by mhitza

Instead of holding the content into memory in the "data"event listener you should write to the file in append mode.

"data"您应该以追加模式写入文件，而不是在事件侦听器中将内容保存到内存中。

Answer 6

回答by Noah

Use streams like Carter Cole suggested. Here is a more complete example

使用 Carter Cole 建议的流。这是一个更完整的例子

var inspect = require('eyespect').inspector();
var request = require('request');
var filed = require('filed');
var temp = require('temp');
var downloadURL = 'http://upload.wikimedia.org/wikipedia/commons/e/ec/Hazard_Creek_Kayaker.JPG';
var downloadPath = temp.path({prefix: 'singlePageRaw', suffix: '.jpg'});

var downloadFile = filed(downloadPath);
var r = request(downloadURL).pipe(downloadFile);


r.on('data', function(data) {
  inspect('binary data received');
});
downloadFile.on('end', function () {
  inspect(downloadPath, 'file downloaded to path');
});

downloadFile.on('error', function (err) {
  inspect(err, 'error downloading file');
});

You may need to install modules which you can do via npm install filed request eyespect temp

您可能需要安装模块，您可以通过 npm install filed request eyespect temp

Javascript 使用 node.js 下载大文件避免高内存消耗

提问by Carlosedp

采纳答案by Carlosedp

回答by LeeGee

回答by Carter Cole

回答by Munipratap

回答by mhitza

回答by Noah

相关推荐

最近更新

标签

Javascript 使用 node.js 下载大文件避免高内存消耗

提问by Carlosedp

采纳答案by Carlosedp

回答by LeeGee

回答by Carter Cole

回答by Munipratap

回答by mhitza

回答by Noah

相关推荐

Javascript - 重新索引数组

Javascript toBe(true) vs toBeTruthy() vs toBeTrue()

仅使用 Javascript 使用 Bit.ly API 缩小 URL

使用 javascript 从谷歌图片中获取随机图片

相关推荐

最近更新

标签