JSON 转换的 U-SQL 脚本
U-SQL script for JSON's transformation
我有多个级别的 JSON 文件,需要在 Azure Data Lake Analytics 中对其进行转换,以从 "vin" 级别(包括)
开始获取所有数据
截取的json为:
"vehicleStatusResponse": {
"vehicleStatuses": [
{
"vin": "ABC1234567890",
"triggerType": {
"triggerType": "TIMER",
"context": "RFMS",
"driverId": {
"tachoDriverIdentification": {
"driverIdentification": "123456789",
"cardIssuingMemberState": "BRA",
"driverAuthenticationEquipment": "CARD",
"cardReplacementIndex": "0",
"cardRenewalIndex": "1"
}
}
},
"receivedDateTime": "2020-02-12T04:11:19.221Z",
"hrTotalVehicleDistance": 103306960,
"totalEngineHours": 3966.6216666666664,
"driver1Id": {
"tachoDriverIdentification": {
"driverIdentification": "BRA1234567"
}
},
"engineTotalFuelUsed": 48477520,
"accumulatedData": {
"durationWheelbaseSpeedOverZero": 8309713,
"distanceCruiseControlActive": 8612200,
"durationCruiseControlActive": 366083,
"fuelConsumptionDuringCruiseActive": 3064170,
"durationWheelbaseSpeedZero": 5425783,
"fuelWheelbaseSpeedZero": 3332540,
"fuelWheelbaseSpeedOverZero": 44709670,
"ptoActiveClass": [
{
"label": "wheelbased speed >0",
"seconds": 16610,
"meters": 29050,
"milliLitres": 26310
},
{
"label": "wheelbased speed =0",
"seconds": 457344,
"milliLitres": 363350
这个案例有一个脚本:
CREATE ASSEMBLY IF NOT EXISTS [Newtonsoft.Json] FROM "adl://#####.azuredatalakestore.net/Newtonsoft.Json.dll";
CREATE ASSEMBLY IF NOT EXISTS [Microsoft.Analytics.Samples.Formats] FROM "adl://#####.azuredatalakestore.net/Microsoft.Analytics.Samples.Formats.dll";
REFERENCE ASSEMBLY [Newtonsoft.Json];
REFERENCE ASSEMBLY [Microsoft.Analytics.Samples.Formats];
USING Microsoft.Analytics.Samples.Formats.Json;
DECLARE @InputFile string = "response.json";
DECLARE @OutputFile string = "response.csv";
@json =
EXTRACT
vin string,
triggerType string,
driverIdentification string,
receivedDateTime DateTime,
hrTotalVehicleDistance int,
totalEngineHours float,
engineTotalFuelUsed int,
durationWheelbaseSpeedOverZero int,
distanceCruiseControlActive int,
durationCruiseControlActive int,
fuelConsumptionDuringCruiseActive int,
durationWheelbaseSpeedZero int,
fuelWheelbaseSpeedZero int
ptoActiveClass string
label string
seconds int
meters int
millilitres int
FROM
@InputFile
USING new MultiLevelJsonExtractor("vehicleStatusResponse.vehicleStatuses.vin[*]",
true,
"vin",
"triggerType",
"driverIdentification",
"receivedDateTime",
"hrTotalVehicleDistance",
"totalEngineHours",
"engineTotalFuelUsed",
"durationWheelbaseSpeedOverZero",
"distanceCruiseControlActive",
"durationCruiseControlActive",
"fuelConsumptionDuringCruiseActive",
"durationWheelbaseSpeedZero",
"fuelWheelbaseSpeedZero",
"ptoActiveClass",
"label",
"seconds",
"meters",
"millilitres"
);
@new =
SELECT
vin,
triggerType,
driverIdentification,
receivedDateTime,
hrTotalVehicleDistance,
totalEngineHours,
engineTotalFuelUsed,
durationWheelbaseSpeedOverZero,
distanceCruiseControlActive,
durationCruiseControlActive,
fuelConsumptionDuringCruiseActive,
durationWheelbaseSpeedZero,
fuelWheelbaseSpeedZero,
ptoActiveClass,
label,
seconds,
meters,
millilitres
FROM @json;
OUTPUT @new
TO @OutputFile
USING Outputters.Csv();
无论如何,我只得到空白 response.csv,没有任何数据。我的脚本有什么问题?如果您有其他方法来转换分层 json 数据,将会很有趣。
您没有正确提取 JSON。您需要像这样使用它:
FROM
@InputFile
USING new MultiLevelJsonExtractor("vehicleStatusResponse.vehicleStatuses.vin[*]",
true,
"tachoDriverIdentification.driverIdentification"
);
您可以使用 U-SQL
here.
阅读更多关于 JSON 高级 JSON 操作的信息
我有多个级别的 JSON 文件,需要在 Azure Data Lake Analytics 中对其进行转换,以从 "vin" 级别(包括)
开始获取所有数据截取的json为:
"vehicleStatusResponse": {
"vehicleStatuses": [
{
"vin": "ABC1234567890",
"triggerType": {
"triggerType": "TIMER",
"context": "RFMS",
"driverId": {
"tachoDriverIdentification": {
"driverIdentification": "123456789",
"cardIssuingMemberState": "BRA",
"driverAuthenticationEquipment": "CARD",
"cardReplacementIndex": "0",
"cardRenewalIndex": "1"
}
}
},
"receivedDateTime": "2020-02-12T04:11:19.221Z",
"hrTotalVehicleDistance": 103306960,
"totalEngineHours": 3966.6216666666664,
"driver1Id": {
"tachoDriverIdentification": {
"driverIdentification": "BRA1234567"
}
},
"engineTotalFuelUsed": 48477520,
"accumulatedData": {
"durationWheelbaseSpeedOverZero": 8309713,
"distanceCruiseControlActive": 8612200,
"durationCruiseControlActive": 366083,
"fuelConsumptionDuringCruiseActive": 3064170,
"durationWheelbaseSpeedZero": 5425783,
"fuelWheelbaseSpeedZero": 3332540,
"fuelWheelbaseSpeedOverZero": 44709670,
"ptoActiveClass": [
{
"label": "wheelbased speed >0",
"seconds": 16610,
"meters": 29050,
"milliLitres": 26310
},
{
"label": "wheelbased speed =0",
"seconds": 457344,
"milliLitres": 363350
这个案例有一个脚本:
CREATE ASSEMBLY IF NOT EXISTS [Newtonsoft.Json] FROM "adl://#####.azuredatalakestore.net/Newtonsoft.Json.dll";
CREATE ASSEMBLY IF NOT EXISTS [Microsoft.Analytics.Samples.Formats] FROM "adl://#####.azuredatalakestore.net/Microsoft.Analytics.Samples.Formats.dll";
REFERENCE ASSEMBLY [Newtonsoft.Json];
REFERENCE ASSEMBLY [Microsoft.Analytics.Samples.Formats];
USING Microsoft.Analytics.Samples.Formats.Json;
DECLARE @InputFile string = "response.json";
DECLARE @OutputFile string = "response.csv";
@json =
EXTRACT
vin string,
triggerType string,
driverIdentification string,
receivedDateTime DateTime,
hrTotalVehicleDistance int,
totalEngineHours float,
engineTotalFuelUsed int,
durationWheelbaseSpeedOverZero int,
distanceCruiseControlActive int,
durationCruiseControlActive int,
fuelConsumptionDuringCruiseActive int,
durationWheelbaseSpeedZero int,
fuelWheelbaseSpeedZero int
ptoActiveClass string
label string
seconds int
meters int
millilitres int
FROM
@InputFile
USING new MultiLevelJsonExtractor("vehicleStatusResponse.vehicleStatuses.vin[*]",
true,
"vin",
"triggerType",
"driverIdentification",
"receivedDateTime",
"hrTotalVehicleDistance",
"totalEngineHours",
"engineTotalFuelUsed",
"durationWheelbaseSpeedOverZero",
"distanceCruiseControlActive",
"durationCruiseControlActive",
"fuelConsumptionDuringCruiseActive",
"durationWheelbaseSpeedZero",
"fuelWheelbaseSpeedZero",
"ptoActiveClass",
"label",
"seconds",
"meters",
"millilitres"
);
@new =
SELECT
vin,
triggerType,
driverIdentification,
receivedDateTime,
hrTotalVehicleDistance,
totalEngineHours,
engineTotalFuelUsed,
durationWheelbaseSpeedOverZero,
distanceCruiseControlActive,
durationCruiseControlActive,
fuelConsumptionDuringCruiseActive,
durationWheelbaseSpeedZero,
fuelWheelbaseSpeedZero,
ptoActiveClass,
label,
seconds,
meters,
millilitres
FROM @json;
OUTPUT @new
TO @OutputFile
USING Outputters.Csv();
无论如何,我只得到空白 response.csv,没有任何数据。我的脚本有什么问题?如果您有其他方法来转换分层 json 数据,将会很有趣。
您没有正确提取 JSON。您需要像这样使用它:
FROM
@InputFile
USING new MultiLevelJsonExtractor("vehicleStatusResponse.vehicleStatuses.vin[*]",
true,
"tachoDriverIdentification.driverIdentification"
);
您可以使用 U-SQL
here.