Parquet Parser
7 min
This connector reads a Parquet file and converts it into a JSON object, which can then be ingested by downstream applications.

Metadata

Sample metadata returned:

"metadata": {
  "num rows": 156,
  "num columns": 20,
  "column names": ["metadata", "cloud", "src endpoint", "dst endpoint", "connection info", "traffic", "time", "start time", "end time", "severity id", "severity", "class name", "class uid", "category name", "category uid", "activity name", "activity id", "type uid", "type name", "unmapped"],
  "column types": {"metadata": "object", "cloud": "object", "src endpoint": "object", "dst endpoint": "object", "connection info": "object", "traffic": "object", "time": "int64", "start time": "int64", "end time": "int64", "severity id": "int32", "severity": "object", "class name": "object", "class uid": "int32", "category name": "object", "category uid": "int32", "activity name": "object", "activity id": "int32", "type uid": "int32", "type name": "object", "unmapped": "object"},
  "memory usage": 279461,
  "describe": {
    "time": [156.0, 1678822323576.923, 92110.1751558733, 1678822108000.0, 1678822249500.0, 1678822323000.0, 1678822398750.0, 1678822494000.0],
    "start time": [156.0, 1678822323576.923, 92110.1751558733, 1678822108000.0, 1678822249500.0, 1678822323000.0, 1678822398750.0, 1678822494000.0],
    "end time": [156.0, 1678822342006.4102, 91207.1372981708, 1678822139000.0, 1678822270750.0, 1678822335000.0, 1678822420000.0, 1678822503000.0],
    "severity id": [156.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0],
    "class uid": [156.0, 4001.0, 0.0, 4001.0, 4001.0, 4001.0, 4001.0, 4001.0],
    "category uid": [156.0, 4.0, 0.0, 4.0, 4.0, 4.0, 4.0, 4.0],
    "activity id": [156.0, 0.5064102564102564, 0.5015690847060224, 0.0, 0.0, 1.0, 1.0, 1.0],
    "type uid": [156.0, 400100.50641025644, 0.5015690847060224, 400100.0, 400100.0, 400101.0, 400101.0, 400101.0]
  }
},

Actions

Parse Parquet

Parse a Parquet file.

Endpoint method: GET

Input argument name, type, required, description:
metadata boolean optional include metadata
attachments array required file to be analysed
attachments file string optional parameter for parse parquet
attachments file name string optional name of the resource

Input example:

{"metadata": true, "attachments": [{"file": "string", "file name": "example name"}]}

Output parameter, type, description:
metadata object response data
metadata num rows number response data
metadata num columns number response data
metadata column names array response data
metadata column types object response data
metadata column types metadata string response data
metadata column types cloud string response data
metadata column types src endpoint string response data
metadata column types dst endpoint string response data
metadata column types connection info string response data
metadata column types traffic string response data
metadata column types time string response data
metadata column types start time string response data
metadata column types end time string response data
metadata column types severity id string response data
metadata column types severity string response data
metadata column types class name string response data
metadata column types class uid string response data
metadata column types category name string response data
metadata column types category uid string response data
metadata column types activity name string response data
metadata column types activity id string response data
metadata column types type uid string response data
metadata column types type name string response data
metadata column types unmapped string response data

Output example:

{"metadata": {"num rows": 156, "num columns": 20, "column names": ["metadata", "cloud", "src endpoint"], "column types": {"metadata": "object", "cloud": "object", "src endpoint": "object", "dst endpoint": "object", "connection info": "object", "traffic": "object", "time": "int64", "start time": "int64", "end time": "int64", "severity id": "int32", "severity": "object", "class name": "object", "class uid": "int32", "category name": "object", "category uid": "int32"}, "memory usage": 279461, "describe": {"time": [], "start time": [], "end time": []}}}

Response headers

Header, description, example:
Content-Type: the media type of the resource (example: application/json)
Date: the date and time at which the message was originated (example: Thu, 01 Jan 2024 00:00:00 GMT)