首页 > 解决方案 > 如何在异步函数中创建 AWS S3 对象的读取流?

问题描述

如何在异步函数中创建 AWS S3 对象的读取流?

如果我尝试

// Non-working attempt, kept exactly as posted: `.promise()` returns a Promise,
// and a Promise has no `createReadStream` method, so the chained call throws
// "(intermediate value).createReadStream is not a function" before `await`
// is ever applied. `s3`, `bucket` and `filename` are not defined in this snippet.
exports.handler = async (event) => {
  var csvreadstream = await s3.getObject({ Bucket: bucket, Key: filename }).promise().createReadStream()
}

或者

// Non-working attempt, kept exactly as posted: awaiting `.promise()` yields the
// resolved response data (the object whose `Body` holds the content), not the
// request object, so `createReadStream` does not exist on `s3Object` and the
// call fails with a "... is not a function" TypeError.
exports.handler = async (event) => {
  var s3Object = await s3.getObject({ Bucket: bucket, Key: filename }).promise();
  var csvreadstream = s3Object.createReadStream();
}

我得到以下错误:

{
  "errorType": "TypeError",
  "errorMessage": "(intermediate value).createReadStream is not a function",
  "trace": [
    "TypeError: (intermediate value).createReadStream is not a function",
    "    at Runtime.exports.handler (/var/task/app.js:29:86)",
    "    at processTicksAndRejections (internal/process/task_queues.js:94:5)"
  ]
}

谁能建议如何在异步(async/await)函数中从 S3 对象创建读取流?谢谢!

感谢 Mark B,我有了进一步的进展:

const AWS = require('aws-sdk');
const utils = require('./utils');
const csv = require('fast-csv');
const stream = require('stream');
const s3 = new AWS.S3();

/**
 * S3-triggered handler, kept exactly as posted in the question. It does not
 * behave as the author intended; see the NOTE(review) comments below.
 *
 * It downloads the uploaded object, feeds its body through the fast-csv
 * parser, calls `utils.filterLogic` for every parsed row and, on stream end,
 * calls `utils.writeErrorReport` with the collected `errors`.
 *
 * @param {object} event - Invocation event; only `event.Records[0].s3` is read.
 * @returns {Promise<undefined>} Resolves once the stream listeners are
 *   attached; nothing here waits for the stream to finish.
 */
exports.handler = async (event) => {
    console.log("Incoming Event: ", JSON.stringify(event));
    const bucket = event.Records[0].s3.bucket.name;
    // '+' characters in the object key are turned into spaces, then the key is URI-decoded.
    const filename = decodeURIComponent(event.Records[0].s3.object.key.replace(/\+/g, ' '));
    const message = `File is uploaded in - ${bucket} -> ${filename}`;
    console.log(message);
    
    // Shared accumulator handed to both utils.filterLogic and utils.writeErrorReport.
    var errors = [];

    // Report name is "<first segment>Report.<second segment>" of the key split on '.'.
    // NOTE(review): only the first two segments are used, so a key with more than
    // one dot loses its tail, and a key without a dot yields "...Report.undefined".
    const splittedFilename = filename.split('.');
    const reportFilename = splittedFilename[0] + "Report." + splittedFilename[1];
    const reportBucket = 'external.transactions.reports';
    
    // The whole object is downloaded first; `s3object.Body` holds its content.
    var s3object = (await s3.getObject({ Bucket: bucket, Key: filename }).promise());
    // Wrap the already-downloaded body in a hand-made Readable with a no-op `_read`.
    // NOTE(review): `push(null)` is never called, so this stream never signals
    // end-of-data and the 'end' listener below presumably never fires.
    var csvreadstream = new stream.Readable();
    csvreadstream._read = () => {};
    csvreadstream.push(s3object.Body);
   
    // NOTE(review): nothing awaits the pipeline, so the async handler's promise
    // resolves right after the listeners are attached. In Lambda this likely ends
    // the invocation before any 'data'/'end' callback runs - confirm.
    csvreadstream
    .pipe(csv.parse({ headers: true }))
    // A `function` expression (not an arrow) so `this` is the stream the listener
    // is attached to; it is paused while the async per-row work runs.
    .on('data', async function(data){
        this.pause();
        // NOTE(review): with `headers: true` rows are presumably objects, so this
        // string concatenation would log "DATA: [object Object]" - verify.
        console.log("DATA: " + data);
        await utils.filterLogic(data, errors);
        this.resume();
    })
    .on('end', async function(){
        console.log("END");
        await utils.writeErrorReport(errors, s3, reportBucket, reportFilename);
    })
};

但是,流似乎没有得到处理,例如 .on() 的回调没有被调用。有人能建议如何在异步函数中处理读取流吗?非常感谢您的帮助。

标签: node.js, amazon-web-services, amazon-s3, aws-lambda, async-await

解决方案


虽然回答得有点晚,但我相信你只需要这样做:

// createReadStream() is called on the request object returned by getObject()
// and hands back a readable stream synchronously, so no `await` (and no
// `.promise()`) is needed; the object is streamed instead of being buffered.
const readableStream = s3.getObject({ Bucket: bucket, Key: filename }).createReadStream();

这会直接返回一个可读流,而不必先用 .promise() 下载整个对象并等待其解析,再在整个缓冲区下载完成后手动将其转换为可读流。


推荐阅读