使用Node JS在Lambda中解析CSV

时间:2017-03-14 16:16:28

标签: node.js csv npm aws-lambda

我正在尝试在 AWS Lambda 上运行的 Node JS 中解析 S3 里的 CSV 文件。我尝试过 fast-csv 和 csv-parser 这两个 npm 包。但是,这两种方案都会抛出 Error: write after end,导致 Lambda 函数失败。谢谢你的帮助。

编辑:我在处理程序中声明了流变量。更新了代码。

// dependencies
const csv = require('fast-csv');
const parse = require('csv-parser')
const aws = require('aws-sdk');
const s3 = new aws.S3({ apiVersion: '2006-03-01' });
const uuidv4 = require('uuid/v4');

exports.handler = (event, context, callback) => {
  // read S3 object stream
  var s3Stream = s3.getObject(params, (err, data) => {
    if (err) {
        console.log(err);
        const message = `Error getting object ${key} from bucket ${bucket}. Make sure they exist and your bucket is in the same region as this function.`;
        console.log(message);
        callback(message);
    } else {
        console.log('CONTENT TYPE:', data.ContentType);
        callback(null, data.ContentType);
    }
  }).createReadStream();


  // read CSV with fast-csv
  // options for fast-csv npm
  var options = {
    headers:true,
    escape:'\\',
    trim:true,
  };

  csv.fromStream(s3Stream, options).on("data", function(data) {
    data.id = uuidv4();
    data.createDate = new Date().toISOString();
    console.log(data);
  }).on("error", function(data) {
    console.error("Got an error: " + data);
  }).on("end", function() {
    console.log("Done reading.");
  });


  // read CSV with csv-parser
  var otherOptions = {
    columns : true,
    auto_parse : true,
    escape : '\\',
    trim : true,
  };
  var parser = parse(otherOptions);
  parser.on('data', function(data) {
    data.id = uuidv4();
    data.createDate = new Date().toISOString();
    console.log(data);
  })
  .on('end',function(data) {
    //do something wiht csvData
    console.log(data);
  });
  s3Stream.pipe(parser);
};

1 个答案:

答案 0 :(得分:3)

通过删除回调来修复它:

// No callback is passed to getObject(); the read stream is created directly
// from the request object it returns.
var s3Stream = s3.getObject(params).createReadStream();

我真希望他们能在文档里把这一点写清楚。