我需要从URL(PDF)获取文件并保存它们,然后存储在使用缓冲区的备用文件系统中。我发现get适用于url,文件保存在本地,但当我尝试获取缓冲区时,缓冲区是空的。
当我第二次运行时,文件已经保存,然后它就可以工作了。我认为这与以某种方式关闭文件有关。有人有什么想法吗?我的代码如下-
function savefile(filename, url) { const file = fs.createWriteStream(filename); const request = https.get(url, function(response) { response.pipe(file); console.log("file saved"); return file; });; } app.post('/addfile', function(req, res) { var filename = req.body.filename; var url = req.body.url; var file = savefile(filename, url); let testFile = fs.readFileSync(filename); let testBuffer = new Buffer(testFile); // process testBuffer
我认为这里的问题是,当您调用savefile时,它会在数据被读取并保存到磁盘之前返回。
这意味着当您调用fs.readFileSync时,文件数据尚不存在。文件出现之前可能还需要几百毫秒。请记住,https.get函数是非阻塞的(就像Node.js中的大多数I/O函数一样)。
因此,最好的方法是使用回调函数来指示何时完成,或者使用promise。我通常更喜欢后者,因为代码语法更简洁。
例如(使用promise的版本):
/**
 * Downloads `url` over HTTPS and writes the response body to `filename`.
 *
 * @param {string} filename - Path of the file to write (created or overwritten).
 * @param {string|URL} url - HTTPS URL to download.
 * @returns {Promise<string>} Resolves with "File end" once the write stream
 *   has closed, i.e. all data has been flushed and the file can be read back.
 *   Rejects if the request fails, the server answers with a non-2xx status,
 *   the response is cut short, or the file cannot be written.
 */
function savefileWithPromise(filename, url) {
  return new Promise((resolve, reject) => {
    let failed = false;
    const file = fs.createWriteStream(filename);

    // Single failure path: release the file handle and reject. Calling
    // reject/destroy more than once is harmless, but the flag also tells the
    // 'close' handler below not to report success.
    const fail = (err) => {
      if (failed) {
        return;
      }
      failed = true;
      file.destroy();
      reject(err);
    };

    file.on('error', fail);
    file.on('close', () => {
      if (failed) {
        // Best-effort removal of the empty/partial file; a failure here is
        // deliberately ignored because the original error was already reported.
        fs.unlink(filename, () => {});
        return;
      }
      resolve("File end");
    });

    try {
      https.get(url, (response) => {
        const { statusCode } = response;
        if (statusCode < 200 || statusCode >= 300) {
          // Drain the body so the socket is released, then report the failure
          // instead of saving an error page (or an empty redirect) as the file.
          response.resume();
          fail(new Error(`Request for ${url} failed with status code ${statusCode}`));
          return;
        }
        response.on('error', fail);
        response.on('close', () => {
          // 'close' without a complete message means the connection dropped
          // mid-download; pipe() would otherwise leave the file open forever.
          if (!response.complete) {
            fail(new Error(`Connection closed before the full response for ${url} was received`));
          }
        });
        response.pipe(file);
      }).on('error', fail);
    } catch (err) {
      // https.get throws synchronously for e.g. an invalid URL; make sure the
      // already-opened write stream is released as well.
      fail(err);
    }
  });
}
/**
 * POST /addfile — downloads req.body.url to req.body.filename, reads the saved
 * file back into a Buffer and replies "ok"; replies 500 if any step fails.
 */
app.post('/addfile', async (req, res) => {
  try {
    // NOTE(review): filename and url come straight from the request body. If
    // this endpoint is reachable by untrusted clients, validate both (path
    // traversal / arbitrary outbound requests) before using them.
    const { filename, url } = req.body;
    console.log(`/addfile: Reading from url: ${url}, writing to file ${filename}...`);
    await savefileWithPromise(filename, url);
    // readFile resolves with a Buffer; the async variant avoids blocking the
    // event loop while the file is read.
    const testFile = await fs.promises.readFile(filename);
    console.log(`File length: ${testFile.length} byte(s).`);
    res.status(200).send("ok");
  } catch (err) {
    // Without this catch a failure would surface as an unhandled rejection
    // and the client would never receive a response.
    console.error('/addfile: failed to download or read the file:', err);
    res.status(500).send('An error occurred');
  }
});
我们还可以对回调执行相同的操作:
/**
 * Downloads `url` over HTTPS and writes the response body to `filename`,
 * reporting the outcome through `callback` exactly once.
 *
 * @param {string} filename - Path of the file to write (created or overwritten).
 * @param {string|URL} url - HTTPS URL to download.
 * @param {function(string|Error): void} callback - Called with the string
 *   "File end" once the write stream has closed (unchanged success contract),
 *   or with an Error instance if the request, the response or the file write
 *   fails. Callers can tell the two apart with `instanceof Error`.
 */
function savefileWithCallback(filename, url, callback) {
  let failed = false;
  let reported = false;
  const file = fs.createWriteStream(filename);

  // Guarantees the callback runs at most once, whatever order events arrive in.
  const report = (value) => {
    if (reported) {
      return;
    }
    reported = true;
    callback(value);
  };

  const fail = (err) => {
    failed = true;
    file.destroy();
    report(err);
  };

  file.on('error', fail);
  file.on('close', () => {
    if (failed) {
      // Best-effort removal of the empty/partial file; a failure here is
      // deliberately ignored because the original error was already reported.
      fs.unlink(filename, () => {});
      return;
    }
    report("File end");
  });

  try {
    https.get(url, (response) => {
      const { statusCode } = response;
      if (statusCode < 200 || statusCode >= 300) {
        // Drain the body so the socket is released, then report the failure
        // instead of saving an error page (or an empty redirect) as the file.
        response.resume();
        fail(new Error(`Request for ${url} failed with status code ${statusCode}`));
        return;
      }
      response.on('error', fail);
      response.on('close', () => {
        // 'close' without a complete message means the connection dropped
        // mid-download; pipe() would otherwise leave the file open forever.
        if (!response.complete) {
          fail(new Error(`Connection closed before the full response for ${url} was received`));
        }
      });
      response.pipe(file);
    }).on('error', fail);
  } catch (err) {
    // https.get throws synchronously for e.g. an invalid URL. Keep that throw
    // visible to the caller as before, but release the opened write stream.
    failed = true;
    file.destroy();
    throw err;
  }
}
/**
 * POST /addfile — callback flavour: downloads req.body.url to
 * req.body.filename, reads the saved file back into a Buffer and replies
 * "ok"; replies 500 if the download or the read fails.
 */
app.post('/addfile', (req, res) => {
  // NOTE(review): filename and url come straight from the request body. If
  // this endpoint is reachable by untrusted clients, validate both (path
  // traversal / arbitrary outbound requests) before using them.
  const { filename, url } = req.body;
  console.log(`/addfile: Reading from url: ${url}, writing to file ${filename}...`);
  savefileWithCallback(filename, url, (result) => {
    // Defensive: treat an Error handed to the callback as a failed download
    // rather than going on to read a missing or partial file.
    if (result instanceof Error) {
      console.error('/addfile: download failed:', result);
      res.status(500).send('An error occurred');
      return;
    }
    // readFile yields a Buffer. A throw inside this asynchronous callback
    // would be an uncaught exception, so read errors are handled explicitly.
    fs.readFile(filename, (err, testFile) => {
      if (err) {
        console.error('/addfile: reading the saved file failed:', err);
        res.status(500).send('An error occurred');
        return;
      }
      console.log(`File length: ${testFile.length} byte(s).`);
      res.status(200).send("ok");
    });
  });
});
或者,也可以不经过磁盘,直接把url数据读入缓冲区:
/**
 * Downloads `url` over HTTPS and collects the whole response body in memory.
 *
 * @param {string|URL} url - HTTPS URL to download.
 * @returns {Promise<Buffer>} Resolves with the concatenated body once the
 *   response has ended. Rejects if the request fails, the server answers with
 *   a non-2xx status, or the response stream errors or is cut short.
 */
function readUrlDataToBuffer(url) {
  return new Promise((resolve, reject) => {
    https.get(url, (response) => {
      const { statusCode } = response;
      if (statusCode < 200 || statusCode >= 300) {
        // Drain the body so the socket is released; an error page (or an
        // empty redirect) must not be handed back as if it were the file.
        response.resume();
        reject(new Error(`Request for ${url} failed with status code ${statusCode}`));
        return;
      }

      const chunks = [];
      response.on('data', (chunk) => {
        chunks.push(chunk);
      });
      response.on('end', () => {
        resolve(Buffer.concat(chunks));
      });
      response.on('error', reject);
      response.on('close', () => {
        // 'close' without a complete message means the connection dropped
        // mid-download; without this the promise would never settle. After a
        // normal 'end' the promise is already resolved and this is a no-op.
        if (!response.complete) {
          reject(new Error(`Connection closed before the full response for ${url} was received`));
        }
      });
    }).on('error', reject);
  });
}
/**
 * POST /addfile — in-memory flavour: reads req.body.url straight into a
 * Buffer (no file is written) and replies "ok"; replies 500 on failure.
 */
app.post('/addfile', async (req, res) => {
  try {
    // NOTE(review): url comes straight from the request body. If this
    // endpoint is reachable by untrusted clients, validate it before making
    // an outbound request on their behalf.
    const { url } = req.body;
    console.log(`/addfile: Reading from url: ${url}..`);
    const buffer = await readUrlDataToBuffer(url);
    console.log(`Buffer length: ${buffer.length} byte(s).`);
    res.send('ok');
  } catch (error) {
    // Log the cause before answering; otherwise the reason is lost entirely.
    console.error('/addfile: failed to read url data:', error);
    res.status(500).send('An error occurred');
  }
});