首页 > 解决方案 > DynamoDB // Lambda // 不一致的记录


我们根据事件将数据从我们的应用程序推送到 DynamoDB。我们编写了一个映射到这个 DynamoDB 表的 Lambda 函数。我们在应用程序中更新的记录都能成功发送到 DynamoDB。但是,Lambda 收到的记录数经常比实际的少。

如果我们的应用程序中更新了 3 条记录,则所有 3 条记录都会被推送到 Dynamo,但 lambda 有时只给出两条或一条。

我们在 lambda 函数中构建了一个 csv 文件,因此 csv 文件的记录数也更少。

我可以分享一些代码片段,但我不确定这个问题是与 Lambda 配置有关,还是与我们用来将数据推送到 DynamoDB 的 API 有关。

以下是 Lambda 代码:

// Lambda request handler that receives a DynamodbEvent and returns a String.
// NOTE(review): this snippet appears to have lost lines during extraction (closing
// braces are missing throughout and some statements are cut off), so it does not
// compile as shown; comments below describe only what is visible.
public class ProductLambda implements RequestHandler<DynamodbEvent, String> {
    // Name of the key attribute used by getModelDetails when querying FT_TABLE.
    private static final String M_NUM = "number";
    // Name of the table that getModelDetails reads from.
    private static final String FT_TABLE = "table";
    // S3 client handed to createFolder by handleRequest.
    // NOTE(review): the initializer expression is cut off in this snippet.
    private AmazonS3 s3 = 
    // Bucket name and object key that handleRequest passes to createFolder.
    private static final String S3_BUCKET = "bucket";
    private static final String S3_FOLDER = "folder";

// No-argument constructor.
// NOTE(review): the constructor body and its closing brace are missing from this snippet.
public ProductLambda() {

// Entry point invoked with a batch of DynamoDB stream records.
// Visible flow: create the S3 "folder" object, walk every record's new image,
// build an ordered column map per record, then call buildAndUploadCSV.
// Returns "Total records are: N", where N is the number of records in the event.
// NOTE(review): no visible statement ever adds staticColumnRecord to changedRecords;
// the add call is presumably among the lines lost from this snippet. As shown,
// buildAndUploadCSV would always receive an empty list - confirm against the real source.
public String handleRequest(DynamodbEvent event, Context context) {
    // Column lists that fix which attributes are copied (and in what order) for each table.
    String[] appcol = new String[] {"COL1", "COL2", "COL3", "COL4", "COL1", "COL2", "COL3", "COL4", "COL1", "COL2", "COL3", "COL4", "COL1", "COL2", "COL3", "COL4", "COL1", "COL2", "COL3", "COL4", "COL1", "COL2", "COL3", "COL4", "COL1", "COL2", "COL3", "COL4", "COL1", "COL2", "COL3", "COL4", "COL1", "COL2", "COL3", "COL4"};
    String[] fttcol = new String[] {"COL1", "COL2", "COL3", "COL4", "COL1", "COL2", "COL3", "COL4", "COL1", "COL2", "COL3", "COL4", "COL1", "COL2", "COL3", "COL4", "COL1", "COL2", "COL3", "COL4", "COL1", "COL2", "COL3", "COL4", "COL1", "COL2", "COL3", "COL4", "COL1", "COL2", "COL3", "COL4", "COL1", "COL2", "COL3", "COL4"};
    // Runs on every invocation, before any record is inspected.
    createFolder(S3_BUCKET, S3_FOLDER, s3);
    List<DynamodbStreamRecord> records = event.getRecords();
    try {
        List<LinkedHashMap<String, AttributeValue>> changedRecords = new ArrayList<LinkedHashMap<String, AttributeValue>>();
        // Declared outside the loop, so after the loop it holds the table name taken
        // from the last record that had a non-null ARN.
        String ddbTable = "";
        for (DynamodbStreamRecord record : records) {
            String modelNumber = "";
            String ddbARN = record.getEventSourceARN();
            if (ddbARN != null) {
                // Table name is the segment after the first "/" of the event source ARN.
                ddbTable = ddbARN.split("/")[1];
            // NOTE(review): record was already dereferenced by getEventSourceARN() above,
            // so this null check cannot protect that call.
            if (record != null) {
                Map<String, AttributeValue> changedRec = record.getDynamodb().getNewImage();
                // Records whose new image is null are skipped entirely.
                if (changedRec != null) {
                    if (ddbTable.equalsIgnoreCase("table1")) {
                        LinkedHashMap<String, AttributeValue> staticColumnRecord = new LinkedHashMap<String, AttributeValue>();
                        List<String> list1 = new ArrayList<String>(Arrays.asList(appcol));
                        for (String key : list1) {
                            AttributeValue value = changedRec.get(key);
                            if (value != null) {
                                staticColumnRecord.put(key, value);
                            } else {
                                // Missing attributes are stored as the literal string "null".
                                staticColumnRecord.put(key, new AttributeValue().withS("null"));
                    if (ddbTable.equalsIgnoreCase("table2")) {
                        LinkedHashMap<String, AttributeValue> staticColumnRecord = new LinkedHashMap<String, AttributeValue>();
                        List<String> list2 = new ArrayList<String>(Arrays.asList(fttcol));
                        for (String key : list2) {
                            AttributeValue value = changedRec.get(key);
                                // NOTE(review): value is dereferenced here before the null check on the
                                // next line; the indentation suggests an enclosing guard (presumably on
                                // key) was lost from this snippet - confirm.
                                modelNumber = value.getS();
                            if (value != null) {
                                staticColumnRecord.put(key, value);
                            } else {
                                // Missing attributes are stored as the literal string "null".
                                staticColumnRecord.put(key, new AttributeValue().withS("null"));
                        // Adds columns looked up by model number to the same map.
                        staticColumnRecord = getModelDetails(staticColumnRecord,modelNumber);
        context.getLogger().log("[DEBUG] - Total Records Changed: " + changedRecords.size());
        buildAndUploadCSV(changedRecords, context, ddbTable);
    // Each failure type is logged and not rethrown, so as shown the handler still
    // falls through to the return statement after an error.
    } catch (AmazonServiceException e) {
        context.getLogger().log("[ERROR] - AmazonServiceException " + e);
    } catch (AmazonClientException e) {
        context.getLogger().log("[ERROR] - AmazonClientException " + e);
    } catch (IOException e) {
        context.getLogger().log("[ERROR] - IOException " + e);
    // Reports the size of the incoming batch, not the number of rows written to the CSV.
    context.getLogger().log("[DEBUG] - Total Records are: " + records.size());
    return "Total records are: " + records.size();

/**
 * @param staticColumnRecord
 * @param modelNumber
 * @param context
 * @return
 */
// Looks up the item in FT_TABLE whose M_NUM key equals modelNumber and copies the
// modcol attributes from it into staticColumnRecord, which is then returned.
// When modelNumber is empty no lookup is made and the map is returned as received.
// NOTE(review): a null modelNumber would throw at isEmpty(); callers in this snippet
// initialise it to "" first.
private LinkedHashMap<String, AttributeValue> getModelDetails(LinkedHashMap<String, AttributeValue> staticColumnRecord,
        String modelNumber) {

    // Attributes to copy from the looked-up item, in output order.
    String[] modcol = new String[] { "COL1", "COL2", "COL3", "COL4", "COL1", "COL2", "COL3", "COL4", "COL1", "COL2", "COL3", "COL4", "COL1", "COL2", "COL3", "COL4", "COL1", "COL2", "COL3", "COL4", "COL1", "COL2", "COL3", "COL4", "COL1", "COL2", "COL3", "COL4", "COL1", "COL2", "COL3", "COL4", "COL1", "COL2", "COL3", "COL4" };
    if (!modelNumber.isEmpty()) {
        // A new DynamoDB client is built on every call with a non-empty model number.
        AmazonDynamoDB dynamoClient = AmazonDynamoDBClientBuilder.standard().build();
        GetItemRequest getItemRequest = new GetItemRequest().withTableName(FT_TABLE)
                .addKeyEntry(M_NUM, new AttributeValue().withS(modelNumber));
        Map<String, AttributeValue> responseItem = dynamoClient.getItem(getItemRequest).getItem();
        List<String> sf_mode_col = new ArrayList<String>(Arrays.asList(modcol));
        // A null response item leaves the map untouched.
        if (responseItem != null) {
            for (String key : sf_mode_col) {
                AttributeValue val = responseItem.get(key);
                if (val != null) {
                    staticColumnRecord.put(key, val);
                } else {
                    // Missing attributes are stored as the literal string "null".
                    staticColumnRecord.put(key, new AttributeValue().withS("null"));
    return staticColumnRecord;

/**
 * Creates a folder in the S3 bucket.
 */
// Uploads a zero-byte object to bucketName under the key folderName using client.
// NOTE(review): the key is passed through unchanged (no trailing "/" is appended here);
// confirm this is the intended folder-marker key.
private static void createFolder(String bucketName, String folderName, AmazonS3 client) {
    ObjectMetadata metadata = new ObjectMetadata();
    // Empty payload: the object exists only as a placeholder.
    InputStream emptyContent = new ByteArrayInputStream(new byte[0]);
    PutObjectRequest putObjectRequest = new PutObjectRequest(bucketName, folderName, emptyContent, metadata);
    // The returned result is not used in the visible code.
    PutObjectResult result = client.putObject(putObjectRequest);

/**
 * Build CSV file of changed data and upload to S3 bucket.
 */
// Builds CSV content from changedRecords, writes via a file under /tmp, and prepares
// an S3 PutObjectRequest for it.
// NOTE(review): several statements in this method are cut off in the snippet (the
// stream pipeline, loop bodies, and the actual putObject call are not visible).
private void buildAndUploadCSV(List<LinkedHashMap<String, AttributeValue>> changedRecords, Context context, String tableName)
        throws IOException {
    Calendar calendar = Calendar.getInstance();
    // File name is "<tableName>_<yyyyMMddHHmmss>.csv".
    // NOTE(review): the timestamp has one-second resolution, so two invocations for the
    // same table within the same second produce the same name; since the S3 key below is
    // derived from it, a later upload would presumably replace the earlier one - confirm.
    SimpleDateFormat formatter = new SimpleDateFormat("yyyyMMddHHmmss");
    String outputName = tableName + "_" + formatter.format(calendar.getTime()) + ".csv";
    // Header columns: the distinct keys found across all record maps.
    // NOTE(review): the rest of this statement (terminal operation) is missing.
    List<String> headers = changedRecords.stream().flatMap(map -> map.keySet().stream()).distinct()
    Path filePath = Paths.get("/tmp", outputName);
    // Writer over the /tmp file, encoded as UTF-8 and closed by try-with-resources.
    try (OutputStreamWriter bw = new OutputStreamWriter(new FileOutputStream(filePath.toFile()), StandardCharsets.UTF_8)) 
        StringBuffer headerContent = new StringBuffer();
        for (String string : headers) {
        // Drop a trailing comma left by the header loop.
        if (headerContent.length() > 0  && headerContent.charAt(headerContent.length() - 1) == ',')
            headerContent.setLength( headerContent.length() - 1 );

        StringBuffer strBuilder = new StringBuffer();
        for (LinkedHashMap<String, AttributeValue> lmap : changedRecords) {
            StringBuilder stringBuilder = new StringBuilder("");
            // Separator is empty before the first value and "," afterwards.
            String sep = "";
            for (Entry<String, AttributeValue> string2 : lmap.entrySet()) {
                // Only the string (S) form of each attribute is read.
                String value = string2.getValue().getS();
                sep = ",";
            if (!stringBuilder.toString().isEmpty()) {
        // NOTE(review): as shown, the upload stream is built from headerContent only and
        // getBytes() is called without an explicit charset, unlike the UTF-8 writer above.
        ByteArrayInputStream contentsAsStream = new ByteArrayInputStream(headerContent.toString().getBytes());
        ObjectMetadata md = new ObjectMetadata();   
        // Bucket and folder are hard-coded literals here rather than S3_BUCKET / S3_FOLDER.
        PutObjectRequest request = new PutObjectRequest("bucket", "folder/" + outputName,
                contentsAsStream, md);
    // IOException is logged and not rethrown, even though the method declares throws IOException.
    } catch (IOException e) {
        context.getLogger().log("[ERROR] - IOException " + e);


标签: aws-lambda, amazon-dynamodb, aws-java-sdk

