Skip to content
Snippets Groups Projects
Commit 70277c4f authored by David Verelst's avatar David Verelst
Browse files

prepost.dlctemplate: add option to merge postpro_node into one DataFrame

parent 95b1f01d
No related branches found
No related tags found
No related merge requests found
Pipeline #
...@@ -19,15 +19,14 @@ import socket ...@@ -19,15 +19,14 @@ import socket
from argparse import ArgumentParser from argparse import ArgumentParser
from sys import platform from sys import platform
#import numpy as np import numpy as np
#import pandas as pd import pandas as pd
from matplotlib import pyplot as plt from matplotlib import pyplot as plt
#import matplotlib as mpl #import matplotlib as mpl
from wetb.prepost import Simulations as sim from wetb.prepost import Simulations as sim
from wetb.prepost import dlcdefs from wetb.prepost import (dlcdefs, dlcplots, windIO)
from wetb.prepost import dlcplots from wetb.prepost.simchunks import (create_chunks_htc_pbs, AppendDataFrames)
from wetb.prepost.simchunks import create_chunks_htc_pbs
from wetb.prepost.GenerateDLCs import GenerateDLCCases from wetb.prepost.GenerateDLCs import GenerateDLCCases
plt.rc('font', family='serif') plt.rc('font', family='serif')
...@@ -459,6 +458,56 @@ def post_launch(sim_id, statistics=True, rem_failed=True, check_logs=True, ...@@ -459,6 +458,56 @@ def post_launch(sim_id, statistics=True, rem_failed=True, check_logs=True,
return df_stats, df_AEP, df_Leq return df_stats, df_AEP, df_Leq
def postpro_node_merge():
    """Merge the per-case postpro_node .csv files into single tables.

    Operates on the module-level ``P_RUN``, ``POST_DIR`` and ``sim_id`` and
    writes all results into ``POST_DIR``:

    * ``<sim_id>_ErrorLogs.csv`` and ``.h5``: built from the files matching
      ``P_RUN/logfiles/*/*.csv``.
    * ``<sim_id>_statistics.csv`` and ``.h5``: built from the files matching
      ``P_RUN/res/*/*.csv``, after which a selection of case tags is merged
      onto the statistics using the ``[case_id]`` column.

    Returns nothing; the results only exist on disk.
    """
    # -------------------------------------------------------------------------
    # MERGE POSTPRO ON NODE APPROACH INTO ONE DataFrame: log file analysis
    # -------------------------------------------------------------------------
    lf = windIO.LogFile()
    path_pattern = os.path.join(P_RUN, 'logfiles', '*', '*.csv')
    fcsv = os.path.join(POST_DIR, '%s_ErrorLogs.csv' % sim_id)
    mdf = AppendDataFrames(tqdm=False)
    # individual log file analysis does not have header, make sure to include
    # a line for the header
    mdf.txt2txt(fcsv, path_pattern, tarmode='r:xz', header=None,
                header_fjoined=lf._header(), recursive=True)
    # convert from CSV to DataFrame. Only swap the file extension: a plain
    # str.replace would also rewrite '.csv' occurring elsewhere in the path.
    df = lf.csv2df(fcsv)
    df.to_hdf(os.path.splitext(fcsv)[0] + '.h5', key='table')

    # -------------------------------------------------------------------------
    # statistics
    # -------------------------------------------------------------------------
    path_pattern = os.path.join(P_RUN, 'res', '*', '*.csv')
    fcsv = os.path.join(POST_DIR, '%s_statistics.csv' % sim_id)
    mdf = AppendDataFrames(tqdm=True)
    # unlike the log files, the statistics files are read with header=0 and
    # no separate header line is supplied for the joined file
    mdf.txt2txt(fcsv, path_pattern, tarmode='r:xz', header=0, sep=',',
                header_fjoined=None, recursive=True, fname_col='[case_id]')

    # and convert to df: takes 2 minutes
    fdf = os.path.splitext(fcsv)[0] + '.h5'
    colnames = ['channel', 'max', 'min', 'mean', 'std', 'range',
                'absmax', 'rms', 'int', 'm=3', 'm=4', 'm=6', 'm=8', 'm=10',
                'm=12', 'intabs', '[case_id]']
    # everything is numeric except the channel name and the case identifier
    dtypes = {col: np.float64 for col in colnames}
    dtypes['channel'] = str
    dtypes['[case_id]'] = str
    # `format` is not an HDFStore constructor argument (recent pandas raises
    # a ValueError when it is passed), so it is not forwarded here. The
    # context manager closes the store even when the conversion fails.
    with pd.HDFStore(fdf, mode='w', complevel=9, complib='zlib') as store:
        mdf.csv2df_chunks(store, fcsv, chunksize=300000, min_itemsize={},
                          sep=',', colnames=colnames, dtypes=dtypes, header=0)

    # -------------------------------------------------------------------------
    # merge missing cols onto stats
    # -------------------------------------------------------------------------
    required = ['[DLC]', '[run_dir]', '[wdir]', '[Windspeed]', '[res_dir]',
                '[case_id]']
    df = pd.read_hdf(fdf, key='table')
    cc = sim.Cases(POST_DIR, sim_id)
    df_tags = cc.cases2df()[required]
    df_stats = pd.merge(df, df_tags, on=['[case_id]'])
    # both statistics files are overwritten with the tag-enriched table
    df_stats.to_hdf(fdf, key='table')
    df_stats.to_csv(fcsv)
if __name__ == '__main__': if __name__ == '__main__':
parser = ArgumentParser(description = "pre- or post-processes DLC's") parser = ArgumentParser(description = "pre- or post-processes DLC's")
...@@ -516,6 +565,12 @@ if __name__ == '__main__': ...@@ -516,6 +565,12 @@ if __name__ == '__main__':
dest='postpro_node', help='Perform the log analysis ' dest='postpro_node', help='Perform the log analysis '
'and stats calculation on the node right after the ' 'and stats calculation on the node right after the '
'simulation has finished.') 'simulation has finished.')
parser.add_argument('--postpro_node_merge', default=False,
action='store_true', dest='postpro_node_merge',
help='Merge all individual statistics and log file '
'analysis .csv files into one table/pd.DataFrame. '
'Requires that htc files have been created with '
'--prep --postpro_node.')
parser.add_argument('--gendlcs', default=False, action='store_true', parser.add_argument('--gendlcs', default=False, action='store_true',
help='Generate DLC exchange files based on master DLC ' help='Generate DLC exchange files based on master DLC '
'spreadsheet.') 'spreadsheet.')
......
0% Loading or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment