%matplotlib inline
import pandas as pd
import socket
host = socket.getfqdn()
from core import load, zoom, calc, save,plots,monitor
# Reload the core submodules so that edits made to ./core/*.py are picked up
# by the running kernel.
import importlib
importlib.reload(load)
importlib.reload(zoom)
importlib.reload(calc)
importlib.reload(save)
importlib.reload(plots)
importlib.reload(monitor)
<module 'core.monitor' from '/ccc/work/cont003/gen7420/odakatin/monitor-sedna/notebook/core/monitor.py'>
# 'month': = 'JOBID' almost month but not really,
# If you submit the job with job scheduler, above
# Below is the list of environment variables one can pass.
#%env local='2'
# local : if 'True', run a dask local cluster; otherwise, 'local' gives the
# number of workers to use.
# If 'local' is not given, it is automatically set to 'True'.
#%env ychunk='2'
#%env tchunk='2'
# These control the chunking. 'False' leaves the original netcdf file's chunks unmodified.
# ychunk=10 will group the original netcdf file chunks 10 by 10.
# tchunk=1 will chunk the time coordinate one by one.
#%env control=FWC_SSH
# name of control file to be used for computation/plots/save/
#%env file_exp=
# 'file_exp': the name of the 'experiment'.
# This corresponds to the intake catalog name, without the path and '.yaml'.
#%env year=
# For validation, this corresponds to the year in path/year/month.
# For monitoring, this corresponds to the 'date'; using * means process all files in the monitoring directory.
# By setting it to *0[0-9], *1[0-9] and *[2-3][0-9], the job can be split into three lots.
#%env month=
# for monitoring this corresponds to file path path-XIOS.{month}/
#
#%env save= proceed with saving? True or False. Default is True.
#%env plot= proceed with plotting? True or False. Default is True.
#%env calc= proceed with computation, or just load the computed result? True or False. Default is True.
#%env save=False
#%env lazy=False
%%time
# 'savefig': whether to save the output as HTML. Keep it True.
savefig=True
# load.set_control(host) returns the eight run settings unpacked below
# (presumably the dask client/cluster plus the control name, catalog, dates
# and output locations -- confirm against core/load.py).
client,cluster,control,catalog_url,month,year,daskreport,outputpath = load.set_control(host)
# Make sure the result and dask-report directories exist before anything is written.
!mkdir -p $outputpath
!mkdir -p $daskreport
# Last expression of the cell: display the client summary.
client
local True using host= irene6085.c-irene.mg1.tgcc.ccc.cea.fr starting dask cluster on local= True workers 16 10000000000 False rome local cluster starting This code is running on irene6085.c-irene.mg1.tgcc.ccc.cea.fr using SEDNA_DELTA_MONITOR file experiment, read from ../lib/SEDNA_DELTA_MONITOR.yaml on year= 2012 on month= 01 outputpath= ../results/SEDNA_DELTA_MONITOR/ daskreport= ../results/dask/6413859irene6085.c-irene.mg1.tgcc.ccc.cea.fr_SEDNA_DELTA_MONITOR_01M_IceConce/_lazyTrue CPU times: user 516 ms, sys: 113 ms, total: 629 ms Wall time: 19.2 s
Client-48ebf8c3-1346-11ed-a09c-080038b93e73
Connection method: Cluster object | Cluster type: distributed.LocalCluster |
Dashboard: http://127.0.0.1:8787/status |
717c3f80
Dashboard: http://127.0.0.1:8787/status | Workers: 16 |
Total threads: 128 | Total memory: 251.06 GiB |
Status: running | Using processes: True |
Scheduler-0c1f1e0b-1609-4c79-9270-c9352b493e8f
Comm: tcp://127.0.0.1:33753 | Workers: 16 |
Dashboard: http://127.0.0.1:8787/status | Total threads: 128 |
Started: Just now | Total memory: 251.06 GiB |
Comm: tcp://127.0.0.1:46846 | Total threads: 8 |
Dashboard: http://127.0.0.1:34628/status | Memory: 15.69 GiB |
Nanny: tcp://127.0.0.1:42261 | |
Local directory: /tmp/dask-worker-space/worker-td6ywixt |
Comm: tcp://127.0.0.1:40865 | Total threads: 8 |
Dashboard: http://127.0.0.1:40704/status | Memory: 15.69 GiB |
Nanny: tcp://127.0.0.1:35026 | |
Local directory: /tmp/dask-worker-space/worker-u7_4r92u |
Comm: tcp://127.0.0.1:37831 | Total threads: 8 |
Dashboard: http://127.0.0.1:44113/status | Memory: 15.69 GiB |
Nanny: tcp://127.0.0.1:46861 | |
Local directory: /tmp/dask-worker-space/worker-4nyffiei |
Comm: tcp://127.0.0.1:46021 | Total threads: 8 |
Dashboard: http://127.0.0.1:46059/status | Memory: 15.69 GiB |
Nanny: tcp://127.0.0.1:38718 | |
Local directory: /tmp/dask-worker-space/worker-nc6nzw7z |
Comm: tcp://127.0.0.1:45037 | Total threads: 8 |
Dashboard: http://127.0.0.1:37837/status | Memory: 15.69 GiB |
Nanny: tcp://127.0.0.1:45689 | |
Local directory: /tmp/dask-worker-space/worker-ctq_lyc5 |
Comm: tcp://127.0.0.1:33174 | Total threads: 8 |
Dashboard: http://127.0.0.1:35559/status | Memory: 15.69 GiB |
Nanny: tcp://127.0.0.1:43919 | |
Local directory: /tmp/dask-worker-space/worker-8gglop1_ |
Comm: tcp://127.0.0.1:34905 | Total threads: 8 |
Dashboard: http://127.0.0.1:36759/status | Memory: 15.69 GiB |
Nanny: tcp://127.0.0.1:38399 | |
Local directory: /tmp/dask-worker-space/worker-t66up4ht |
Comm: tcp://127.0.0.1:38223 | Total threads: 8 |
Dashboard: http://127.0.0.1:43678/status | Memory: 15.69 GiB |
Nanny: tcp://127.0.0.1:38246 | |
Local directory: /tmp/dask-worker-space/worker-iidkc31y |
Comm: tcp://127.0.0.1:46741 | Total threads: 8 |
Dashboard: http://127.0.0.1:45512/status | Memory: 15.69 GiB |
Nanny: tcp://127.0.0.1:46519 | |
Local directory: /tmp/dask-worker-space/worker-vb0af9so |
Comm: tcp://127.0.0.1:39481 | Total threads: 8 |
Dashboard: http://127.0.0.1:35514/status | Memory: 15.69 GiB |
Nanny: tcp://127.0.0.1:44945 | |
Local directory: /tmp/dask-worker-space/worker-ac6frhag |
Comm: tcp://127.0.0.1:34723 | Total threads: 8 |
Dashboard: http://127.0.0.1:33045/status | Memory: 15.69 GiB |
Nanny: tcp://127.0.0.1:44846 | |
Local directory: /tmp/dask-worker-space/worker-g3ijago0 |
Comm: tcp://127.0.0.1:42797 | Total threads: 8 |
Dashboard: http://127.0.0.1:35615/status | Memory: 15.69 GiB |
Nanny: tcp://127.0.0.1:41070 | |
Local directory: /tmp/dask-worker-space/worker-ottkprmc |
Comm: tcp://127.0.0.1:35894 | Total threads: 8 |
Dashboard: http://127.0.0.1:43296/status | Memory: 15.69 GiB |
Nanny: tcp://127.0.0.1:44812 | |
Local directory: /tmp/dask-worker-space/worker-jnqat1m1 |
Comm: tcp://127.0.0.1:39324 | Total threads: 8 |
Dashboard: http://127.0.0.1:41639/status | Memory: 15.69 GiB |
Nanny: tcp://127.0.0.1:32997 | |
Local directory: /tmp/dask-worker-space/worker-gzhyfajl |
Comm: tcp://127.0.0.1:37696 | Total threads: 8 |
Dashboard: http://127.0.0.1:45651/status | Memory: 15.69 GiB |
Nanny: tcp://127.0.0.1:36129 | |
Local directory: /tmp/dask-worker-space/worker-dp72nds0 |
Comm: tcp://127.0.0.1:36371 | Total threads: 8 |
Dashboard: http://127.0.0.1:36063/status | Memory: 15.69 GiB |
Nanny: tcp://127.0.0.1:38216 | |
Local directory: /tmp/dask-worker-space/worker-fncr1uv7 |
# Read the control file selected by `control`; the result is used below as a
# table with 'Value' and 'Inputs' columns (presumably a pandas DataFrame).
df=load.controlfile(control)
# Optional filter (currently disabled): take out the computations tagged 'later'.
#df=df[~df['Value'].str.contains('later')]
df
Value | Inputs | Equation | Zone | Plot | Colourmap | MinMax | Unit | Oldname | Unnamed: 10 | |
---|---|---|---|---|---|---|---|---|---|---|
IceConce | icemod.siconc | (data.siconc.where(data.siconc >0)).to_dataset... | ALL | maps | Blues | None | M-4 |
Each computation consists of
%%time
import os
calcswitch=os.environ.get('calc', 'True')
lazy=os.environ.get('lazy','True' )
loaddata=((df.Inputs != '').any())
print('calcswitch=',calcswitch,'df.Inputs != nothing',loaddata, 'lazy=',lazy)
data = load.datas(catalog_url,df.Inputs,month,year,daskreport,lazy=lazy) if ((calcswitch=='True' )*loaddata) else 0
data
calcswitch= True df.Inputs != nothing True lazy= True ../lib/SEDNA_DELTA_MONITOR.yaml using param_xios reading ../lib/SEDNA_DELTA_MONITOR.yaml using param_xios reading <bound method DataSourceBase.describe of sources: param_xios: args: combine: nested concat_dim: y urlpath: /ccc/work/cont003/gen7420/odakatin/CONFIGS/SEDNA/SEDNA-I/SEDNA_Domain_cfg_Tgt_20210423_tsh10m_L1/param_f32/x_*.nc xarray_kwargs: compat: override coords: minimal data_vars: minimal parallel: true description: SEDNA NEMO parameters from MPI output nav_lon lat fails driver: intake_xarray.netcdf.NetCDFSource metadata: catalog_dir: /ccc/work/cont003/gen7420/odakatin/monitor-sedna/notebook/../lib/ > {'name': 'param_xios', 'container': 'xarray', 'plugin': ['netcdf'], 'driver': ['netcdf'], 'description': 'SEDNA NEMO parameters from MPI output nav_lon lat fails', 'direct_access': 'forbid', 'user_parameters': [{'name': 'path', 'description': 'file coordinate', 'type': 'str', 'default': '/ccc/work/cont003/gen7420/odakatin/CONFIGS/SEDNA/MESH/SEDNA_mesh_mask_Tgt_20210423_tsh10m_L1/param'}], 'metadata': {}, 'args': {'urlpath': '/ccc/work/cont003/gen7420/odakatin/CONFIGS/SEDNA/SEDNA-I/SEDNA_Domain_cfg_Tgt_20210423_tsh10m_L1/param_f32/x_*.nc', 'combine': 'nested', 'concat_dim': 'y'}} 0 read icemod ['siconc'] using load_data_xios reading icemod using load_data_xios reading {'name': 'data_xios', 'container': 'xarray', 'plugin': ['netcdf'], 'driver': ['netcdf'], 'description': 'SEDNA NEMO outputs from different xios server', 'direct_access': 'forbid', 'user_parameters': [{'name': 'path', 'description': 'name of config', 'type': 'str', 'default': '/ccc/scratch/cont003/gen7420/talandel/SEDNA/SEDNA-DELTA-S/SPLIT/1d'}, {'name': 'fileexp', 'description': 'name of config', 'type': 'str', 'default': 'SEDNA-DELTA'}, {'name': 'month', 'description': 'running number 2 digit', 'type': 'str', 'default': '02'}, {'name': 'freq', 'description': '1d or 1m', 'type': 'str', 'default': '1d'}, {'name': 'year', 'description': 'last 
digits of yearmonthdate.', 'type': 'str', 'default': '2012'}, {'name': 'file', 'description': 'file name', 'type': 'str', 'default': 'icemod'}, {'name': 'eio', 'description': 'xios mpi number', 'type': 'str', 'default': '0[0-5][0-9][0-9]'}], 'metadata': {}, 'args': {'urlpath': '{{path}}/{{year}}/{{month}}/*{{file}}_*_{{eio}}.nc', 'combine': 'nested', 'concat_dim': 'time_counter,x,y'}} took 132.51184225082397 seconds 0 merging icemod ['siconc'] param nav_lat will be included in data param nav_lon will be included in data param mask2d will be included in data ychunk= 10 calldatas_y_rechunk sum_num (13, 13, 13, 13, 13, 13, 13, 13, 13, 13, 13, 13, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 
12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12) start rechunking with (130, 122, 120, 120, 120, 120, 120, 120, 120, 120, 120, 120, 120, 120, 120, 120, 120, 120, 120, 120, 120, 120, 120, 120, 120, 120, 120, 120, 120, 120, 120, 120, 120, 120, 120, 120, 120, 120, 120, 120, 120, 120, 120, 120, 120, 120, 120, 120, 120, 120, 120, 120, 120, 120, 48) end of y_rechunk CPU times: user 1min 24s, sys: 6.38 s, total: 1min 30s Wall time: 2min 35s
<xarray.Dataset> Dimensions: (t: 31, y: 6540, x: 6560) Coordinates: * t (t) object 2012-01-01 12:00:00 ... 2012-01-31 12:00:00 * y (y) int64 1 2 3 4 5 6 7 ... 6535 6536 6537 6538 6539 6540 * x (x) int64 1 2 3 4 5 6 7 ... 6555 6556 6557 6558 6559 6560 nav_lat (y, x) float32 dask.array<chunksize=(130, 6560), meta=np.ndarray> nav_lon (y, x) float32 dask.array<chunksize=(130, 6560), meta=np.ndarray> time_centered (t) object dask.array<chunksize=(31,), meta=np.ndarray> mask2d (y, x) bool dask.array<chunksize=(130, 6560), meta=np.ndarray> Data variables: siconc (t, y, x) float32 dask.array<chunksize=(31, 130, 6560), meta=np.ndarray> Attributes: (12/26) name: /ccc/scratch/cont003/ra5563/talandel/ONGOING-RUN... description: ice variables title: ice variables Conventions: CF-1.6 timeStamp: 2022-Jan-17 19:00:05 GMT uuid: 65f78891-6a37-4a91-8ad4-7c8b5dc0d456 ... ... start_date: 20090101 output_frequency: 1d CONFIG: SEDNA CASE: DELTA history: Tue Jan 18 17:20:08 2022: ncks -4 -L 1 SEDNA-DEL... NCO: netCDF Operators version 4.9.1 (Homepage = http:...
%%time
# Run monitor.auto over the control table `df` with the loaded `data`.
# NOTE(review): in the recorded output of this cell the save step fails with
# UnboundLocalError ('slices' referenced before assignment) raised inside
# core/save.py:to_mfnetcdf_map -- the fix belongs in that module, not here.
monitor.auto(df,data,savefig,daskreport,outputpath,file_exp='SEDNA'
)
#calc= True #save= True #plot= False monitor.optimize_dataset(data) Value='IceConce' Zone='ALL' Plot='maps' cmap='Blues' clabel=' ' clim= None outputpath='../results/SEDNA_DELTA_MONITOR/' nc_outputpath='../nc_results/SEDNA_DELTA_MONITOR/' filename='SEDNA_maps_ALL_IceConce' #3 Start computing dtaa= (data.siconc.where(data.siconc >0)).to_dataset(name='siconc').chunk({ 't': -1 }).unify_chunks().persist() monitor.optimize_dataset(dtaa)
<xarray.Dataset> Dimensions: (t: 31, y: 6540, x: 6560) Coordinates: * t (t) object 2012-01-01 12:00:00 ... 2012-01-31 12:00:00 * y (y) int64 1 2 3 4 5 6 7 ... 6535 6536 6537 6538 6539 6540 * x (x) int64 1 2 3 4 5 6 7 ... 6555 6556 6557 6558 6559 6560 nav_lat (y, x) float32 dask.array<chunksize=(130, 6560), meta=np.ndarray> nav_lon (y, x) float32 dask.array<chunksize=(130, 6560), meta=np.ndarray> time_centered (t) object dask.array<chunksize=(31,), meta=np.ndarray> mask2d (y, x) bool dask.array<chunksize=(130, 6560), meta=np.ndarray> Data variables: siconc (t, y, x) float32 dask.array<chunksize=(31, 130, 6560), meta=np.ndarray>
#4 Saving SEDNA_maps_ALL_IceConce dtaa=save.datas(data,plot=Plot,path=nc_outputpath,filename=filename) start saving data saving data in a file
--------------------------------------------------------------------------- UnboundLocalError Traceback (most recent call last) File <timed eval>:1, in <module> File /ccc/work/cont003/gen7420/odakatin/monitor-sedna/notebook/core/monitor.py:84, in auto(df, val, savefig, daskreport, outputpath, file_exp) 82 print('dtaa=save.datas(data,plot=Plot,path=nc_outputpath,filename=filename)' ) 83 with performance_report(filename=daskreport+"_save_"+step.Value+".html"): ---> 84 save.datas(data,plot=Plot,path=nc_outputpath,filename=filename) 85 # 5. Plot 86 if plotswitch=='True': File /ccc/work/cont003/gen7420/odakatin/monitor-sedna/notebook/core/save.py:24, in datas(data, plot, path, filename) 22 twoD(data,path,filename,nested=False) 23 else : ---> 24 twoD(data,path,filename) 25 return None File /ccc/work/cont003/gen7420/odakatin/monitor-sedna/notebook/core/save.py:57, in twoD(data, path, filename, nested) 55 print('saving data in a file') 56 filesave=path+filename ---> 57 return to_mfnetcdf_map(data,prefix=filesave, nested=nested) File /ccc/work/cont003/gen7420/odakatin/monitor-sedna/notebook/core/save.py:219, in to_mfnetcdf_map(ds, prefix, nested) 217 slices.append(slice(start, stop)) 218 start = stop --> 219 chunk_slices[dim] = slices 220 for i in chunk_slices['t']: 221 print(i) UnboundLocalError: local variable 'slices' referenced before assignment