in rawdataprocessor/RawDataProcesser.py [0:0]
def writePreparedDataForModel(mconfig):
    """Write the model config and the target/related CSV files, then upload them to S3.

    Three files are produced under ``/tmp`` and uploaded to ``S3BucketName``
    under the key prefix ``DatasetGroups/<datasetGroupName>/``:

    * ``config.json`` -- ``mconfig`` serialized as JSON, extended with the
      data and forecast date ranges.
    * ``target.csv``  -- one row per entry of ``vars.FullHistoryList`` holding
      columns 0, 1 and 2 of the entry.
    * ``related.csv`` -- one row per entry of ``vars.FullHistoryList`` holding
      columns 0, 1 and 3 of the entry, followed by one row per item in
      ``vars.ItemList`` for every day of the forecast window.

    Args:
        mconfig: Mapping that provides ``mconfig["modelName"]`` and
            ``mconfig["preditor"]["ForecastHorizon"]`` (a number of days).
            It is mutated in place: the keys ``data_starttime``,
            ``data_endtime``, ``forecast_starttime`` and ``forecast_endtime``
            are set before it is dumped to JSON.
    """
    logger.debug(mconfig)

    # The same two dates are formatted repeatedly below; do it once.
    # NOTE(review): assumes tranformDateToString is a pure formatter -- confirm.
    startDateText = tranformDateToString(vars.StartDate)
    endDateText = tranformDateToString(vars.EndDate)

    # The dataset group name must have 1 to 63 characters.
    # Valid characters: a-z, A-Z, 0-9, and _  -- hence the "-" is stripped
    # from the date strings before they are embedded in the name.
    datasetGroupName = (
        mconfig["modelName"]
        + "_" + startDateText.replace("-", "")
        + "_" + endDateText.replace("-", "")
    )
    s3KeyPrefix = "DatasetGroups/" + datasetGroupName

    targetFilePath = "/tmp/" + "history.target." + startDateText + "." + endDateText + ".csv"
    relatedFilePath = "/tmp/" + "history.related." + startDateText + "." + endDateText + ".csv"
    modelconfigfile = "/tmp/" + datasetGroupName + ".json"

    # The forecast window starts the day after the last day of data and spans
    # ForecastHorizon days (both ends inclusive).
    simulateStartDate = vars.EndDate + timedelta(days=1)
    simulateEndDate = vars.EndDate + timedelta(days=mconfig["preditor"]["ForecastHorizon"])

    mconfig["data_starttime"] = startDateText
    mconfig["data_endtime"] = endDateText
    mconfig["forecast_starttime"] = tranformDateToString(simulateStartDate)
    mconfig["forecast_endtime"] = tranformDateToString(simulateEndDate)

    with open(modelconfigfile, 'w') as outfile:
        json.dump(mconfig, outfile)
    # Upload only after the file has been closed so the complete JSON document
    # is guaranteed to be on disk.
    s3_client.upload_file(modelconfigfile, S3BucketName, s3KeyPrefix + "/config.json")
    logger.info(
        "Dataset Group config config.json uploaded to bucket=%s, under path key=%s",
        S3BucketName,
        s3KeyPrefix,
    )

    # Context managers make sure both CSV files are closed (and flushed) even
    # if writing a row or looking up a related value raises.
    with open(targetFilePath, 'w', newline='') as targetFile, \
            open(relatedFilePath, 'w', newline='') as relatedFile:
        csvWritertarget = csv.writer(targetFile)
        csvWriterRelated = csv.writer(relatedFile)

        # History: columns 0 and 1 go to both files, column 2 to the target
        # file and column 3 to the related file.
        for item in vars.FullHistoryList:
            csvWritertarget.writerow([item[0], item[1], item[2]])
            csvWriterRelated.writerow([item[0], item[1], item[3]])

        # Forecast window: the related file additionally gets one row per
        # item per future day. The value is always looked up for vars.EndDate
        # (the last day of data), not for the future day itself.
        currentDay = simulateStartDate
        while currentDay <= simulateEndDate:
            currentDayText = tranformDateToString(currentDay)
            for item in vars.ItemList:
                csvWriterRelated.writerow([
                    currentDayText,
                    item,
                    getRowValueForTheDay(vars.EndDate, item, "relatedValue1"),
                ])
            currentDay = currentDay + timedelta(days=1)

    s3_client.upload_file(targetFilePath, S3BucketName, s3KeyPrefix + "/target.csv")
    s3_client.upload_file(relatedFilePath, S3BucketName, s3KeyPrefix + "/related.csv")
    logger.info(
        "processed data uploaded to bucket=%s, under path key=%s",
        S3BucketName,
        s3KeyPrefix,
    )