尝试读取BigQuery表中的JSON结构时出错

尝试读取BigQuery表中的JSON结构时出错,json,google-bigquery,Json,Google Bigquery,下面是我试图阅读的JSON以及供您阅读的代码: 我只是在阅读“fieldorders”部分时遇到了问题,因为它没有任何值。如果它没有任何结构,我仍然需要向它们显示空白值。我能够阅读其他几个有多个部分的对象,没有任何问题。当我们有一个没有任何值的对象时,我有一个问题,我需要只放置空值,以防我在该对象中找不到任何值 Getting the below Error: **Failed to coerce output value false to type ARRAY** 我用于读取数据的示例JS

下面是我试图阅读的JSON以及供您阅读的代码:

我只在读取“fieldorders”部分时遇到了问题,因为它没有任何值。即使它没有任何内容,我仍然需要为它显示空值。我可以毫无问题地读取其他几个包含多个元素的对象。当遇到一个没有任何值的对象时就会出问题;如果在该对象中找不到任何值,我需要只填入空值

出现以下错误:

**Failed to coerce output value false to type ARRAY**
我用于读取数据的示例JSON文件:

{
  "projectnumber": "X.6001877",
  "operationnumber": "O.6001877.01",
  "opactivitynumber": "B.6001877.01.01",
  "jobtypes": null,
  "jobtypesinfo": [
    {
      "jobtype": "CC-SERV",
      "jobgroup": "CPS-CC",
      "staticattributes": [
        {
          "name": "OAJTOPT",
          "description": "OA Job Type OPT",
          "type": "Double",
          "value": 0.0,
          "uom": null
        }
      ]
    }
  ],
  "actualactivitystartdate": "2018-01-17T05:00:00",
  "actualactivityenddate": "2018-01-29T05:00:00",
  "serverdatetime": null,
  "ServerDateTime": "2019-01-20T16:36:48.106",
  "projectSettings": null,
  "customerContacts": null,
  "actualequipments": null,
  "welldetails": [
    {
      "Number": "1-1IH",
      "Name": "XXXX 58-4X",
      "State": "PL",
      "Country": "Col",
      "Field": "LABCD",
      "Uwi": null,
      "Environment": "Land",
      "WellId": "0065",
      "Latitude": 3.8,
      "Longitude": -72.2,
      "Type": null,
      "WaterDepth": null,
      "WellPlaceholderId": null,
      "IsNonMasteredWell": false
    }
  ],
  "lastopeventid": null,
  "personnelassignmentinfo": null,
  "status": null,
  "accountingunit": null,
  "erpsystem": "ITT",
  "CreatedDate": "2020-01-20T16:36:48.106",
  "CreatedBy": "ABCD11",
  "LastModifiedDate": "2020-01-20T16:36:48.106",
  "LastModifiedBy": "ABCD11",
  "Id": "A.6001877.01.01",
  "country": {
    "Code": "CO",
    "Name": "CoOOOOOO"
  },
  "attributes": {
    "Attributes": [
      {
        "AttributeName": "OAOPDXAS",
        "AttributeDescription": "Activity OPD",
        "DataType": "Integer",
        "UOMType": "Dimensionless",
        "BaseUnit": "",
        "IsCalculated": true,
        "Values": null
      },
      {
        "AttributeName": "OpActOPTime",
        "AttributeDescription": "OA Operating Time - OPT (HRS)",
        "DataType": "Float",
        "UOMType": "Dimensionless",
        "BaseUnit": "",
        "IsCalculated": true,
        "Values": null
      }
    ],
    "DailyAttributes": null,
    "MultiAttributes": null,
    "Id": "A.6001877.01.01"
  },
  "operationalevent": [
    {
      "operatingevent": {
        "projectnumber": "C.6001877",
        "operationnumber": "O.6001877.01",
        "operationactivitynumber": "X.6001877.01.01",
        "operationaleventdetails": {
          "status": null,
          "description": "Non-Operational Event",
          "plannedeventid": null,
          "jobgroup": null,
          "jobtype": null,
          "startdatetime": "2020-01-18T05:00:00",
          "enddatetime": "2020-01-15T05:00:00",
          "comments": "Non-Operational Event",
          "eventtype": "Project",
          "isdeleted": false,
          "category": "NonOperational",
          "islocked": false,
          "lockedon": "0001-01-01T05:00:00",
          "lockedby": null,
          "audittrailinfo": {
            "CreatedDate": "2020-01-20T15:36:17.816",
            "CreatedBy": "ABCD11",
            "LastModifiedDate": "2020-01-20T15:36:17.816",
            "LastModifiedBy": "ABCD1111",
            "Id": null
          },
          "personnel": {
            "assignment": [

            ]
          },
          "serverdatetime": "2018-01-20T16:36:56.185",
          "equipmentdata": {
            "equipmentassignments": [

            ]
          },
          "eventtypeattributes": null,
          "id": "E97A5DBC",
          "oesummary": null,
          "journal": null,
          "well": null,
          "isactive": true,
          "externaltransactionhistoryinfo": [
            {
              "status": "Pending",
              "message": null,
              "type": "MPT",
              "riteservicereporturl": null,
              "CreatedDate": "0001-01-01T00:00:00",
              "CreatedBy": null,
              "LastModifiedDate": "0001-01-01T00:00:00",
              "LastModifiedBy": null,
              "Id": null
            }
          ],
          "pnmconsumptiondata": {
            "pnmconsumptions": [

            ]
          }
        },
        "CreatedDate": "2018-01-20T16:36:56.185",
        "CreatedBy": "ABCD11",
        "LastModifiedDate": "2020-01-20T16:36:56.185",
        "LastModifiedBy": "ABCD11",
        "Id": "A.6001877.01.01_OperationalEvent_E97A5DBC"
      },
      "attributes": null
    }
  ],
  "attendance": [

  ],
  "fieldorders": [

  ]
}
BigQuery SQL代码:

    -- CUSTOM_JSON_EXTRACT(json, json_path): JavaScript UDF that parses `json` with
    -- JSON.parse and evaluates the JSONPath expression `json_path` against it by
    -- calling jsonPath() from the library listed in OPTIONS. Declared to return
    -- ARRAY<STRING>.
    -- NOTE(review): the jsonPath() result is returned unchanged. The reported error
    -- ("Failed to coerce output value false to type ARRAY") indicates that the value
    -- `false` reaches BigQuery when the path has no matches (e.g. the empty
    -- "fieldorders" array); that case needs an explicit empty-array fallback.
    CREATE TEMPORARY FUNCTION CUSTOM_JSON_EXTRACT(json STRING, json_path STRING)
    RETURNS ARRAY<STRING>
    LANGUAGE js AS """
            return jsonPath(JSON.parse(json), json_path);
    """
    OPTIONS (
        library="gs://json_temp/jsonpath-0.8.0.js"
    );

    -- Flattens several JSON arrays stored in lz.json_actuals.conv_column into rows.
    -- Each UNNEST below is comma-joined (cross join) to the table row, so one output
    -- row is produced per combination of extracted values.
    SELECT job_id,oe_descr,
    attr_name,
    well_name,
    job_type,
    -- field_id is disabled here together with its UNNEST below.
    --field_id

    from lz.json_actuals,
    UNNEST(CUSTOM_JSON_EXTRACT(conv_column, '$.operationalevent[*].operatingevent.operationaleventdetails.description')) oe_descr  with offset oedescr,
    UNNEST(CUSTOM_JSON_EXTRACT(conv_column, '$.attributes.Attributes[*].AttributeName')) attr_name with offset attrb,
    UNNEST(CUSTOM_JSON_EXTRACT(conv_column, '$.welldetails[*].Name')) Well_name with offset wll,
    UNNEST(CUSTOM_JSON_EXTRACT(conv_column, '$.jobtypesinfo[*].jobtype')) job_type with offset jt,
    -- Disabled: extracting from the empty "fieldorders" array is the case the question reports as failing.
    -- NOTE(review): with this line commented out the FROM list ends in a trailing comma - confirm it parses.
    --UNNEST(CUSTOM_JSON_EXTRACT(conv_column, '$.fieldorders[*].id')) field_id WITH OFFSET fld

  ;
创建临时函数CUSTOM_JSON_EXTRACT(JSON字符串,JSON_路径字符串)
返回数组
语言js为“”
返回jsonPath(JSON.parse(JSON),JSON_path);
"""
选择权(
library=“gs://json\u temp/jsonpath-0.8.0.js”
);
选择作业id、oe描述、,
属性名称,
嗯,你的名字,
工作类型,
--字段id
从lz.json_实际值,
UNNEST(自定义JSON提取(conv_列,'$.operationalevent[*].operationalevent.operationaleventdetails.description'))带有偏移量oedescr的oe描述,
UNNEST(自定义的JSON提取(conv_列,'$.attributes.attributes[*].AttributeName'))attr_名称和偏移量attrb,
UNNEST(自定义_JSON_提取(conv_列,'$.welldetails[*].Name'))带有偏移量wll的井名称,
UNNEST(自定义JSON提取(conv_列,'$.jobtypesinfo[*].jobtype'))带有偏移量jt的作业类型,
--UNNEST(自定义_JSON_提取(conv_列,'$.fieldorders[*].id'))字段_id和偏移量fld
;

下面是BigQuery标准SQL,应该可以解决空对象的问题

#standardSQL
-- CUSTOM_JSON_EXTRACT(json, json_path)
--   json      : JSON document as a STRING.
--   json_path : JSONPath expression evaluated against the parsed document.
-- Returns the values matched by json_path as ARRAY<STRING>. When jsonPath()
-- yields a falsy result, an empty array is returned instead, so the output can
-- always be coerced to ARRAY and passed to UNNEST.
CREATE TEMP FUNCTION CUSTOM_JSON_EXTRACT(json STRING, json_path STRING)
RETURNS ARRAY<STRING>
LANGUAGE js AS """
  // Fall back to [] whenever jsonPath() produces a falsy value.
  return jsonPath(JSON.parse(json), json_path) || [];
"""
OPTIONS (
  library = "gs://json_temp/jsonpath-0.8.0.js"
);
-- Flattens the JSON arrays stored in conv_column into rows: one output row per
-- combination of extracted values (the arrays are expanded independently).
--
-- Every array is attached with LEFT JOIN UNNEST rather than a comma (cross)
-- join. A cross join against an empty array removes the source row entirely,
-- whereas LEFT JOIN keeps the row and yields NULL for that column. Any of these
-- arrays may be empty, not only "fieldorders", so all of them are treated alike.
-- CUSTOM_JSON_EXTRACT must return [] (not false) for a path with no matches.
SELECT
  -- job_id,  -- re-enable if lz.json_actuals exposes a job_id column
  oe_descr,
  attr_name,
  well_name,
  job_type,
  field_id
FROM `lz.json_actuals`
LEFT JOIN UNNEST(CUSTOM_JSON_EXTRACT(conv_column, '$.operationalevent[*].operatingevent.operationaleventdetails.description')) AS oe_descr WITH OFFSET AS oedescr
LEFT JOIN UNNEST(CUSTOM_JSON_EXTRACT(conv_column, '$.attributes.Attributes[*].AttributeName')) AS attr_name WITH OFFSET AS attrb
LEFT JOIN UNNEST(CUSTOM_JSON_EXTRACT(conv_column, '$.welldetails[*].Name')) AS well_name WITH OFFSET AS wll
LEFT JOIN UNNEST(CUSTOM_JSON_EXTRACT(conv_column, '$.jobtypesinfo[*].jobtype')) AS job_type WITH OFFSET AS jt
LEFT JOIN UNNEST(CUSTOM_JSON_EXTRACT(conv_column, '$.fieldorders[*].id')) AS field_id WITH OFFSET AS fld

仅仅说您无法针对您的具体案例采用其他解决方案并没有帮助——您应该提供所有相关细节!非常感谢你的回复,米哈伊尔。我将举例说明它在哪里起作用,在哪里不起作用。你应该用你想问的问题的所有细节更新你的问题。你应该发布文本而不是图片,这样我们就可以使用你的数据复现你的用例,最重要的是能够帮到你。@MikhailBerlyant——我试图以文本的形式发布我的问题,并提供了示例JSON和我在BigQuery中执行的代码。看起来版主正在删除它们,我不确定我是否违反了此处的任何政策。请您帮忙指导我。不要把内容作为问题的答案发布——您应该更新您的问题。非常感谢您在这方面的帮助。这解决了我的问题。对于所有字段,我都使用了左联接,因为任何列都可能遇到空数组;我测试过了,它工作得很好。
Row oe_descr                    attr_name   well_name   job_type    field_id     
1   Non-Operational Event       OAOPDXAS    XXXX 58-4X  CC-SERV     null     
2   Non-Operational Event       OpActOPTime XXXX 58-4X  CC-SERV     null