简体   繁体   English

MongoDB聚合两个不同的组

[英]MongoDB Aggregate two different groups

I have data set and i need two diffrent group by values from that data set. 我有数据集,我需要该数据集的两个不同的按值分组。 please find the data set below, 请在下面找到数据集,

[{
    "ASSIGN_ID": "583f84bce58725f76b322398",
    "SPEC_ID": "58411772",
    "STATUS": 1,
    "UPDATE_DATE": ISODate("2016-12-21T04:10:23.000Z")
  },
  {
    "ASSIGN_ID": "583f84bce58725f76b322398",
    "SPEC_ID": "58411772",
    "STATUS": 4,
    "UPDATE_DATE": ISODate("2016-12-22T04:10:23.000Z")
  },
  {
    "ASSIGN_ID": "583f84bce58725f76b322398",
    "SPEC_ID": "58411772",
    "STATUS": 4,
    "UPDATE_DATE": ISODate("2016-12-23T04:10:23.000Z")
  },
  {
    "ASSIGN_ID": "583f84bce58725f76b322398",
    "SPEC_ID": "58411774",
    "STATUS": 3,
    "UPDATE_DATE": ISODate("2016-12-24T04:10:23.000Z")
  },
  {
    "ASSIGN_ID": "583f84bce58725f76b322311",
    "SPEC_ID": "58411775",
    "STATUS": 1,
    "UPDATE_DATE": ISODate("2016-12-25T04:10:23.000Z")
  },
  {
    "ASSIGN_ID": "583f84bce58725f76b322311",
    "SPEC_ID": "58411775",
    "STATUS": 3,
    "UPDATE_DATE": ISODate("2016-12-23T04:10:23.000Z")
  },
  {
    "ASSIGN_ID": "583f84bce58725f76b322322",
    "SPEC_ID": "58411774",
    "STATUS": 1,
    "UPDATE_DATE": ISODate("2016-12-20T04:10:23.000Z")
  },
  {
    "ASSIGN_ID": "583f84bce58725f76b322322",
    "SPEC_ID": "58411778",
    "STATUS": 4,
    "UPDATE_DATE": ISODate("2016-12-21T04:10:23.000Z")
  }
]

I want to group this by using ASSIGN_ID and STATUS and also inside each ASSIGN_ID group I need SPEC_ID and also by STATUS . 我想通过使用ASSIGN_IDSTATUS对此进行分组 ,并且在每个ASSIGN_ID组内部也需要SPEC_ID并通过STATUS进行分组。 please find the expected output below, 请在下面找到预期的输出,

[{
    "ASSIGN_ID": "583f84bce58725f76b322398",
    "ASSIGN_GROUP": [{
        "STATUS": 1,
        "COUNT": 1
      },
      {
        "STATUS": 3,
        "COUNT": 1
      },
      {
        "STATUS": 4,
        "COUNT": 2
      }
    ],
    "SPEC_ARRAY": [{
        "SPEC_ID": "58411772",
        "SPEC_GROUP": [{
            "STATUS": 1,
            "COUNT": 1
          },
          {
            "STATUS": 4,
            "COUNT": 2
          }
        ]
      },
      {
        "SPEC_ID": "58411774",
        "SPEC_GROUP": [{
          "STATUS": 3,
          "COUNT": 1
        }]
      }
    ]
  },
  {
    "ASSIGN_ID": "583f84bce58725f76b322311",
    "ASSIGN_GROUP": [{
        "STATUS": 1,
        "COUNT": 1
      },
      {
        "STATUS": 3,
        "COUNT": 1
      }
    ],
    "SPEC_ARRAY": [{
      "SPEC_ID": "58411775",
      "SPEC_GROUP": [{
          "STATUS": 1,
          "COUNT": 1
        },
        {
          "STATUS": 3,
          "COUNT": 1
        }
      ]
    }]
  },
  {
    "ASSIGN_ID": "583f84bce58725f76b322322",
    "ASSIGN_GROUP": [{
        "STATUS": 1,
        "COUNT": 1
      },
      {
        "STATUS": 4,
        "COUNT": 1
      }
    ],
    "SPEC_ARRAY": [{
        "SPEC_ID": "58411774",
        "SPEC_GROUP": [{
          "STATUS": 1,
          "COUNT": 1
        }]
      },
      {
        "SPEC_ID": "58411778",
        "SPEC_GROUP": [{
          "STATUS": 4,
          "COUNT": 1
        }]
      }
    ]
  }
]

currently, what I did so far is just group the ASSIGN_ID and by STATUS please find the code below, 目前,我到目前为止所做的只是将ASSIGN_ID分组 ,按STATUS,请找到下面的代码,

Modal.aggregate([
  {
    "$group": {
      "_id": {
        "INSPECTED_BY": "$INSPECTED_BY",
        "STATUS": "$STATUS"
      },
      "spec_id": "$SPEC_ID",
      "total": {
        "$sum": 1
      }
    }
  }, {
    "$group": {
      "_id": "$_id.INSPECTED_BY",
      "data": {
        "$push": {
          "STATUS": "$_id.STATUS",
          "total": "$total"
        }
      }
    }
  }
]);

and the result is 结果是

[
  {
    "_id": "583f84bce58725f76b322398",
    "data": [
      {
        "STATUS": 1,
        "COUNT": 1
      }, {
        "STATUS": 3,
        "COUNT": 1
      }, {
        "STATUS": 4,
        "COUNT": 2
      }
    ]
  }, {
    "_id": "583f84bce58725f76b322311",
    "data": [
      {
        "STATUS": 1,
        "COUNT": 1
      }, {
        "STATUS": 3,
        "COUNT": 1
      }
    ]
  }, {
    "_id": "583f84bce58725f76b322322",
    "data": [
      {
        "STATUS": 1,
        "COUNT": 1
      }, {
        "STATUS": 4,
        "COUNT": 1
      }
    ]
  }
]

please, provide me a suitable solution get the expected result. 请为我提供合适的解决方案,以达到预期的效果。

You can try the alternative aggregation below for version 3.2. 您可以尝试以下3.2版的替代聚合。

Modal.aggregate([{
    $group: {
        _id: {
            ASSIGN_ID: "$ASSIGN_ID",
            SPEC_ID: "$SPEC_ID",
            STATUS: "$STATUS"
        },
        COUNT: {
            $sum: 1
        }
    }
}, {
    $group: {
        _id: {
            ASSIGN_ID: "$_id.ASSIGN_ID",
            SPEC_ID: "$_id.SPEC_ID"
        },
        SPEC_GROUP: {
            $push: {
                STATUS: "$_id.STATUS",
                COUNT: "$COUNT"
            }
        }
    }
}, {
    $group: {
        _id: "$_id.ASSIGN_ID",
        SPEC_ARRAY: {
            $push: {
                SPEC_ID: "$_id.SPEC_ID",
                SPEC_GROUP: "$SPEC_GROUP"
            }
        }
    }
}, {
    $project: {
        ASSIGN_ID: "$_id",
        ASSIGN_GROUP: "$SPEC_ARRAY.SPEC_GROUP",
        SPEC_ARRAY: 1
    }
}, {
    $unwind: "$ASSIGN_GROUP"
}, {
    $unwind: "$ASSIGN_GROUP"
}, {
    $group: {
        _id: "$ASSIGN_ID",
        ASSIGN_GROUP: {
            $push: "$ASSIGN_GROUP"
        },
        SPEC_ARRAY: {
            $first: "$SPEC_ARRAY"
        }
    }
}])

Replace last four stages with $reduce for version 3.4 将3.4版的$reduce替换为最后四个阶段

{
    $project: {
        _id: 0,
        ASSIGN_ID: "$_id",
        SPEC_ARRAY: 1,
        ASSIGN_GROUP: {
            $reduce: {
                input: "$SPEC_ARRAY.SPEC_GROUP",
                initialValue: [],
                in: {
                    $concatArrays: ["$$value", "$$this"]
                }
            }
        }
    }
}

It's a multi-pass pipeline; 这是一个多通道管道; if required to fetch two different sets of grouping within same pass; 如果需要在同一遍中获取两组不同的分组; will have to group for one set first. 首先必须分组。 Once that set is arrived, keep the data required for next set of grouping. 到达该组后,保留下一组分组所需的数据。

Pipeline involved: 涉及的管道:
group :(1) Group By ASSIGN_ID, SPEC_ID, STATUS - get the count for this combination group :(1)按ASSIGN_ID,SPEC_ID,STATUS分组-获取此组合的计数
group :(2) Group By ASSIGN_ID, SPEC_ID - prepare SPEC_GROUP Array group :(2)按ASSIGN_ID,SPEC_ID分组-准备SPEC_GROUP阵列
group :(3) Group By ASSIGN_ID - prepare SPEC_ARRAY Array of objects group :(3)按ASSIGN_ID分组-准备SPEC_ARRAY对象数组
project : Select ASSIGN_ID, SPEC_ARRAY, a copy of SPEC_ARRAY data for preparing grouping by STATUS project :选择ASSIGN_ID,SPEC_ARRAY,SPEC_ARRAY数据的副本以准备按STATUS进行分组
unwind : Unwind SPEC Array elements to get data for each spec_id separated unwindunwind SPEC数组元素以获取每个分隔的spec_id的数据
unwind : Unwind SPEC Array. unwindunwind SPEC阵列。 SPEC_GROUP elements to get data for each spec_id /status separated SPEC_GROUP元素获取每个单独的spec_id / status的数据
group :(4) Group By ASSIGN_ID,STATUS - get the count per status [When getting the count ADD counts corresponding to each status since we already grouped by SPEC_ID], select SPEC_ARRAY from first row as that is repeating all across group :(4)按ASSIGN_ID,STATUS分组-获取每个状态的计数[由于我们已经按SPEC_ID分组,因此当获取与每个状态相对应的计数ADD计数时,请从第一行中选择SPEC_ARRAY,因为这将重复
group :(5) Group By ASSIGN_ID - get the assign group array, select SPEC_ARRAY from first row as that is repeating all across group :(5)按ASSIGN_ID分组-获取分配组数组,从第一行中选择SPEC_ARRAY,因为这将重复

db.Modal.aggregate([ {
    $group : {
        _id : {
            ASSIGN_ID : "$ASSIGN_ID",
            SPEC_ID : "$SPEC_ID",
            STATUS : "$STATUS"
        },
        a_s_cnt : {
            $sum : 1
        }
    }
}, {
    $group : {
        _id : {
            ASSIGN_ID : "$_id.ASSIGN_ID",
            SPEC_ID : "$_id.SPEC_ID"
        },
        SPEC_GROUP : {
            $push : {
                STATUS : "$_id.STATUS",
                COUNT : "$a_s_cnt"
            }
        }
    }
}, {
    $group : {
        _id : "$_id.ASSIGN_ID",
        SPEC_ARRAY : {
            $push : {
                SPEC_ID : "$_id.SPEC_ID",
                SPEC_GROUP : "$SPEC_GROUP"
            }
        }
    }
}, {
    $project : {
        _id : 0,
        ASSIGN_ID : "$_id",
        SPEC_ARRAY : "$SPEC_ARRAY",
        forStatus : "$SPEC_ARRAY"
    }
}, {
    $unwind : "$forStatus"
}, {
    $unwind : "$forStatus.SPEC_GROUP"
}, {
    $group : {
        _id : {
            ASSIGN_ID : "$ASSIGN_ID",
            STATUS : "$forStatus.SPEC_GROUP.STATUS"
        },
        statusCount : {
            $sum : "$forStatus.SPEC_GROUP.COUNT"
        },
        SPEC_ARRAY : {
            $first : "$SPEC_ARRAY"
        }
    }
}, {
    $group : {
        _id : "$_id.ASSIGN_ID",
        ASSIGN_GROUP : {
            $push : {
                STATUS : "$_id.STATUS",
                COUNT : "$statusCount"
            }
        },
        SPEC_ARRAY : {
            $first : "$SPEC_ARRAY"
        }
    }
}, {
    $project : {
        _id : 0,
        ASSIGN_ID : "$_id",
        ASSIGN_GROUP : "$ASSIGN_GROUP",
        SPEC_ARRAY : "$SPEC_ARRAY"
    }
} ])

Use This Aggregate Command, Tested with your Sample data, 使用此汇总命令,并通过示例数据进行测试,

        db.test.aggregate([{
    $group: {
        _id: {
            ASSIGN_ID: "$ASSIGN_ID",
            STATUS: "$STATUS",
            SPEC_ID: "$SPEC_ID"
        },
        count: {
            "$sum": 1
        }
    }
}, {
    $group: {
        _id: "$_id.ASSIGN_ID",
        ASSIGN_GROUP: {
            $push: {
                STATUS: "$_id.STATUS",
                count: "$count"
            }
        },
        SPEC_ARRAY: {
            $push: {
                SPEC_ID: "$_id.SPEC_ID",
                STATUS: "$_id.STATUS",
                count: "$count"
            }
        }
    }
}, {
    $unwind: "$SPEC_ARRAY"
}, {
    $group: {
        _id: {
            ASSIGN_ID: "$_id",
            SPEC_ID: "$SPEC_ARRAY.SPEC_ID"
        },
        ASSIGN_GROUP: {
            $first: "$ASSIGN_GROUP"
        },
        SPEC_GROUP: {
            $push: {
                "STATUS": "$SPEC_ARRAY.STATUS",
                count: "$SPEC_ARRAY.count"
            }
        }
    }
}, {
    $group: {
        _id: "$_id.ASSIGN_ID",
        ASSIGN_GROUP: {
            $first: "$ASSIGN_GROUP"
        },
        SPEC_ARRAY: {
            $push: {
                SPEC_ID: "$_id.SPEC_ID",
                SPEC_GROUP: "$SPEC_GROUP"
            }
        }
    }
}

]).pretty()

声明:本站的技术帖子网页,遵循CC BY-SA 4.0协议,如果您需要转载,请注明本站网址或者原文地址。任何问题请咨询:yoyou2525@163.com.

 
粤ICP备18138465号  © 2020-2024 STACKOOM.COM