in athena_glue_service_logs/cloudtrail.py [0:0]
def _build_storage_descriptor(self, partition_values=None):
    """Return the storage descriptor dict for the Parquet-backed CloudTrail table.

    The returned dict uses the key layout of an AWS Glue ``StorageDescriptor``
    (``Columns``, ``Location``, ``InputFormat``, ``OutputFormat``,
    ``SerdeInfo``, ``BucketColumns``, ``Parameters``).

    Args:
        partition_values: Partition values forwarded unchanged to
            ``self.partitioner.build_partitioned_path`` to compute
            ``Location``. ``None`` (the default) is treated as an empty list.

    Returns:
        dict: A newly built descriptor on every call.
    """
    if partition_values is None:
        partition_values = []

    # (column name, column type) pairs, in table column order.
    column_specs = (
        ("eventversion", "string"),
        ("json_useridentity", "string"),
        ("eventtime", "timestamp"),
        ("eventsource", "string"),
        ("eventname", "string"),
        ("awsregion", "string"),
        ("sourceipaddress", "string"),
        ("useragent", "string"),
        ("json_requestparameters", "string"),
        ("json_responseelements", "string"),
        ("requestid", "string"),
        ("eventid", "string"),
        ("eventtype", "string"),
        ("recipientaccountid", "string"),
        ("errorcode", "string"),
        ("errormessage", "string"),
        ("apiversion", "string"),
        ("json_additionaleventdata", "string"),
        ("vpcendpointid", "string"),
        ("readonly", "boolean"),
        ("resources", "array<struct<arn:string,accountid:string,type:string>>"),
    )

    return {
        "Columns": [
            {"Type": column_type, "Name": column_name}
            for column_name, column_type in column_specs
        ],
        "Location": self.partitioner.build_partitioned_path(partition_values),
        "InputFormat": "org.apache.hadoop.hive.ql.io.parquet.MapredParquetInputFormat",
        # Must be the Parquet counterpart of InputFormat and the SerDe below;
        # the text output format does not describe a Parquet table.
        "OutputFormat": "org.apache.hadoop.hive.ql.io.parquet.MapredParquetOutputFormat",
        "SerdeInfo": {
            "SerializationLibrary": "org.apache.hadoop.hive.ql.io.parquet.serde.ParquetHiveSerDe",
            "Parameters": {},
        },
        "BucketColumns": [],  # Required or SHOW CREATE TABLE fails
        "Parameters": {},  # Required or create_dynamic_frame.from_catalog fails for partitions
    }