尝试读取BigQuery表中的JSON结构时出错
下面是我要读取的 JSON 以及我使用的代码。我只在读取 "fieldorders" 部分时遇到问题,因为该数组是空的,没有任何值。即使它没有任何内容,我仍然需要为它显示空值(NULL)。其他包含多个元素的对象我都能正常读取;问题只出现在对象没有任何值的情况:当在该对象中找不到任何值时,我需要只输出空值。(标签:json、google-bigquery)
Getting the below Error:
**Failed to coerce output value false to type ARRAY**
我用于读取数据的示例JSON文件:
{
"projectnumber": "X.6001877",
"operationnumber": "O.6001877.01",
"opactivitynumber": "B.6001877.01.01",
"jobtypes": null,
"jobtypesinfo": [
{
"jobtype": "CC-SERV",
"jobgroup": "CPS-CC",
"staticattributes": [
{
"name": "OAJTOPT",
"description": "OA Job Type OPT",
"type": "Double",
"value": 0.0,
"uom": null
}
]
}
],
"actualactivitystartdate": "2018-01-17T05:00:00",
"actualactivityenddate": "2018-01-29T05:00:00",
"serverdatetime": null,
"ServerDateTime": "2019-01-20T16:36:48.106",
"projectSettings": null,
"customerContacts": null,
"actualequipments": null,
"welldetails": [
{
"Number": "1-1IH",
"Name": "XXXX 58-4X",
"State": "PL",
"Country": "Col",
"Field": "LABCD",
"Uwi": null,
"Environment": "Land",
"WellId": "0065",
"Latitude": 3.8,
"Longitude": -72.2,
"Type": null,
"WaterDepth": null,
"WellPlaceholderId": null,
"IsNonMasteredWell": false
}
],
"lastopeventid": null,
"personnelassignmentinfo": null,
"status": null,
"accountingunit": null,
"erpsystem": "ITT",
"CreatedDate": "2020-01-20T16:36:48.106",
"CreatedBy": "ABCD11",
"LastModifiedDate": "2020-01-20T16:36:48.106",
"LastModifiedBy": "ABCD11",
"Id": "A.6001877.01.01",
"country": {
"Code": "CO",
"Name": "CoOOOOOO"
},
"attributes": {
"Attributes": [
{
"AttributeName": "OAOPDXAS",
"AttributeDescription": "Activity OPD",
"DataType": "Integer",
"UOMType": "Dimensionless",
"BaseUnit": "",
"IsCalculated": true,
"Values": null
},
{
"AttributeName": "OpActOPTime",
"AttributeDescription": "OA Operating Time - OPT (HRS)",
"DataType": "Float",
"UOMType": "Dimensionless",
"BaseUnit": "",
"IsCalculated": true,
"Values": null
}
],
"DailyAttributes": null,
"MultiAttributes": null,
"Id": "A.6001877.01.01"
},
"operationalevent": [
{
"operatingevent": {
"projectnumber": "C.6001877",
"operationnumber": "O.6001877.01",
"operationactivitynumber": "X.6001877.01.01",
"operationaleventdetails": {
"status": null,
"description": "Non-Operational Event",
"plannedeventid": null,
"jobgroup": null,
"jobtype": null,
"startdatetime": "2020-01-18T05:00:00",
"enddatetime": "2020-01-15T05:00:00",
"comments": "Non-Operational Event",
"eventtype": "Project",
"isdeleted": false,
"category": "NonOperational",
"islocked": false,
"lockedon": "0001-01-01T05:00:00",
"lockedby": null,
"audittrailinfo": {
"CreatedDate": "2020-01-20T15:36:17.816",
"CreatedBy": "ABCD11",
"LastModifiedDate": "2020-01-20T15:36:17.816",
"LastModifiedBy": "ABCD1111",
"Id": null
},
"personnel": {
"assignment": [
]
},
"serverdatetime": "2018-01-20T16:36:56.185",
"equipmentdata": {
"equipmentassignments": [
]
},
"eventtypeattributes": null,
"id": "E97A5DBC",
"oesummary": null,
"journal": null,
"well": null,
"isactive": true,
"externaltransactionhistoryinfo": [
{
"status": "Pending",
"message": null,
"type": "MPT",
"riteservicereporturl": null,
"CreatedDate": "0001-01-01T00:00:00",
"CreatedBy": null,
"LastModifiedDate": "0001-01-01T00:00:00",
"LastModifiedBy": null,
"Id": null
}
],
"pnmconsumptiondata": {
"pnmconsumptions": [
]
}
},
"CreatedDate": "2018-01-20T16:36:56.185",
"CreatedBy": "ABCD11",
"LastModifiedDate": "2020-01-20T16:36:56.185",
"LastModifiedBy": "ABCD11",
"Id": "A.6001877.01.01_OperationalEvent_E97A5DBC"
},
"attributes": null
}
],
"attendance": [
],
"fieldorders": [
]
}
BigQuery SQL代码:
-- Temporary JavaScript UDF: parses `json` and evaluates the JSONPath expression
-- `json_path` against it with jsonPath() from the external jsonpath-0.8.0.js
-- library, declaring the result as ARRAY<STRING>.
-- NOTE(review): the value of jsonPath() is returned unchecked. The reported
-- error ("Failed to coerce output value false to type ARRAY") suggests that
-- jsonPath() yields false when the path matches nothing (e.g. an empty
-- "fieldorders" array) -- confirm against the library.
CREATE TEMPORARY FUNCTION CUSTOM_JSON_EXTRACT(json STRING, json_path STRING)
RETURNS ARRAY<STRING>
LANGUAGE js AS """
return jsonPath(JSON.parse(json), json_path);
"""
OPTIONS (
library="gs://json_temp/jsonpath-0.8.0.js"
);
-- Flattens values extracted from the JSON in conv_column: each UNNEST in the
-- comma-separated FROM list is joined against the source row, so the output
-- has one row per combination of extracted values.
-- The field_id column and its UNNEST are commented out; per the question,
-- reading "fieldorders" is the part that fails when that array is empty.
-- NOTE(review): with the last UNNEST commented out, the comma after `jt`
-- is left dangling before `;` -- this looks like a syntax error as written.
SELECT job_id,oe_descr,
attr_name,
well_name,
job_type,
--field_id
from lz.json_actuals,
UNNEST(CUSTOM_JSON_EXTRACT(conv_column, '$.operationalevent[*].operatingevent.operationaleventdetails.description')) oe_descr with offset oedescr,
UNNEST(CUSTOM_JSON_EXTRACT(conv_column, '$.attributes.Attributes[*].AttributeName')) attr_name with offset attrb,
UNNEST(CUSTOM_JSON_EXTRACT(conv_column, '$.welldetails[*].Name')) Well_name with offset wll,
UNNEST(CUSTOM_JSON_EXTRACT(conv_column, '$.jobtypesinfo[*].jobtype')) job_type with offset jt,
--UNNEST(CUSTOM_JSON_EXTRACT(conv_column, '$.fieldorders[*].id')) field_id WITH OFFSET fld
;
创建临时函数CUSTOM_JSON_EXTRACT(JSON字符串,JSON_路径字符串)
返回数组
语言js为“”
返回jsonPath(JSON.parse(JSON),JSON_path);
"""
选择权(
library=“gs://json\u temp/jsonpath-0.8.0.js”
);
选择作业id、oe描述、,
属性名称,
嗯,你的名字,
工作类型,
--字段id
从lz.json_实际值,
UNNEST(自定义JSON提取(conv_列,'$.operationalevent[*].operationalevent.operationaleventdetails.description'))带有偏移量oedescr的oe描述,
UNNEST(自定义的JSON提取(conv_列,'$.attributes.attributes[*].AttributeName'))attr_名称和偏移量attrb,
UNNEST(自定义_JSON_提取(conv_列,'$.welldetails[*].Name'))带有偏移量wll的井名称,
UNNEST(自定义JSON提取(conv_列,'$.jobtypesinfo[*].jobtype'))带有偏移量jt的作业类型,
--UNNEST(自定义_JSON_提取(conv_列,'$.fieldorders[*].id'))字段_id和偏移量fld
;
下面是BigQuery标准SQL,应该可以解决空对象的问题
#standardSQL
-- Temporary JavaScript UDF: evaluates the JSONPath expression `json_path`
-- against the JSON document in `json` (via jsonPath() from the external
-- jsonpath-0.8.0.js library) and returns the matches as ARRAY<STRING>.
-- A falsy jsonPath() result is replaced by an empty array so the return
-- value can always be coerced to ARRAY.
CREATE TEMP FUNCTION CUSTOM_JSON_EXTRACT(json STRING, json_path STRING)
RETURNS ARRAY<STRING>
LANGUAGE js
OPTIONS (
  library="gs://json_temp/jsonpath-0.8.0.js"
)
AS """
  var matches = jsonPath(JSON.parse(json), json_path);
  return matches || [];
""";
-- Flattens the values extracted from the JSON in conv_column into rows:
-- one row per combination of operational-event description, attribute name,
-- well name, job type and field-order id.
--
-- Every array is LEFT JOINed (not comma/cross joined) so that an empty or
-- missing array at ANY path yields NULL in its column instead of silently
-- dropping the whole source row. Previously only `fieldorders` was protected.
-- For rows where all arrays are non-empty the result is unchanged.
--
-- The WITH OFFSET aliases were removed because no offset was ever selected
-- or used in a join condition.
-- NOTE(review): job_id is left out exactly as in the original query; add it
-- back to the select list if the table exposes that column.
SELECT
    oe_descr,
    attr_name,
    well_name,
    job_type,
    field_id
FROM `lz.json_actuals` AS src
-- A LEFT JOIN against a correlated UNNEST needs no ON clause in BigQuery.
LEFT JOIN UNNEST(CUSTOM_JSON_EXTRACT(src.conv_column, '$.operationalevent[*].operatingevent.operationaleventdetails.description')) AS oe_descr
LEFT JOIN UNNEST(CUSTOM_JSON_EXTRACT(src.conv_column, '$.attributes.Attributes[*].AttributeName')) AS attr_name
LEFT JOIN UNNEST(CUSTOM_JSON_EXTRACT(src.conv_column, '$.welldetails[*].Name')) AS well_name
LEFT JOIN UNNEST(CUSTOM_JSON_EXTRACT(src.conv_column, '$.jobtypesinfo[*].jobtype')) AS job_type
LEFT JOIN UNNEST(CUSTOM_JSON_EXTRACT(src.conv_column, '$.fieldorders[*].id')) AS field_id
仅仅说其他解决方案不适用于您的具体情况并没有帮助——您应该提供所有相关细节!
非常感谢你的回复,Mikhail。我会举例说明它在哪些情况下有效、在哪些情况下无效。
你应该把问题的所有细节补充到你的提问中。请不要张贴图片,而应张贴文本,这样我们才能使用你的数据、复现你的用例,最重要的是才能帮到你。
@MikhailBerlyant——我尝试以文本形式发布我的问题,并提供了示例 JSON 以及我在 BigQuery 中执行的代码。看起来版主正在删除它们,我不确定自己是否违反了这里的某项规定。请您帮忙指导我。
请不要以“回答”的形式发布对问题的补充——您应该更新您的问题。
非常感谢您的帮助,这解决了我的问题。我对所有字段都使用了 LEFT JOIN,因为任何一列都可能遇到空数组;经过测试,运行良好。
Row oe_descr attr_name well_name job_type field_id
1 Non-Operational Event OAOPDXAS XXXX 58-4X CC-SERV null
2 Non-Operational Event OpActOPTime XXXX 58-4X CC-SERV null