Import the data from the current directory and write it to the default dump file
from dnnclim import data
import os
import pickle
# Process the climate data files found in the current directory ('.').
# Per the heading above, this call also writes the result to the default dump
# file (presumably 'dnnclim.dat', which is read back further down -- confirm
# against dnnclim.data.process_dir).
climdata = data.process_dir('.')
tempfiles : ['./tas_Amon_CESM1-CAM5_rcp26_r1i1p1_200601-210012.nc', './tas_Amon_CESM1-CAM5_rcp26_r2i1p1_200601-210012.nc', './tas_Amon_CESM1-CAM5_rcp26_r3i1p1_200601-210012.nc']
prfiles : ['./pr_Amon_CESM1-CAM5_rcp26_r1i1p1_200601-210012.nc', './pr_Amon_CESM1-CAM5_rcp26_r2i1p1_200601-210012.nc', './pr_Amon_CESM1-CAM5_rcp26_r3i1p1_200601-210012.nc']
topofiles : ['./sftlf_fx_CESM1-CAM5_historical_r0i0p0.nc', './orog_fx_CESM1-CAM5_historical_r0i0p0.nc']
Data checks passed.
dim fields = (95, 192, 288)
nscen = 3
dim allfields = (285, 192, 288, 2)
dim allgmeans = (285, 2)
total cases: 285
training cases: 142
[107 94 227 42 23 222 118 179 155 95 169 66 44 261 128 172 230 29
255 170 266 218 146 121 152 196 280 101 225 36 174 145 197 154 84 248
31 20 178 257 28 233 241 144 126 213 122 164 78 278 156 148 12 79
246 5 210 176 244 260 268 57 160 264 236 279 234 150 113 127 104 238
185 35 13 192 195 136 202 263 151 206 82 22 284 180 46 85 80 15
182 88 45 30 103 208 116 194 186 105 231 96 10 74 211 3 19 190
221 243 39 162 112 271 215 115 100 259 0 120 24 93 73 153 167 90
102 17 108 40 72 184 191 256 237 161 189 21 63 138 168 193]
dev cases: 71
[ 76 253 228 8 129 139 99 181 159 275 49 283 43 204 65 7 188 98
199 262 77 149 220 32 272 111 41 157 270 68 51 245 61 27 106 212
258 232 64 1 86 53 130 251 131 33 110 165 50 147 274 200 34 137
91 219 171 55 52 240 163 209 267 142 117 67 217 214 229 75 58]
test cases: 72
[254 70 48 235 265 38 89 9 281 198 239 62 54 216 125 47 175 173
242 158 25 282 223 249 119 141 132 97 59 207 6 247 69 11 143 2
135 201 18 71 140 134 109 114 269 14 226 224 183 26 276 166 16 203
123 133 4 277 56 273 177 250 124 87 205 81 187 252 60 92 37 83]
topo dim: (192, 288, 2)
# Print a shape summary for every entry in climdata.
# The 'topo' entry is indexed directly for its shape; every other entry is
# indexed by 'fld' and 'gmean' first.
for dset in climdata:
    print('dataset: {}'.format(dset))
    entry = climdata[dset]
    if dset != 'topo':
        print('\tfld: ', entry['fld'].shape)
        print('\tgmean: ', entry['gmean'].shape)
        continue
    print('\ttopo: ', entry.shape)
dataset: train
fld: (142, 192, 288, 2)
gmean: (142, 2)
dataset: dev
fld: (71, 192, 288, 2)
gmean: (71, 2)
dataset: test
fld: (72, 192, 288, 2)
gmean: (72, 2)
dataset: topo
topo: (192, 288, 2)
Verify the data written to the dump file
# Reload the dump file so its contents can be compared with the in-memory data.
# The context manager closes the file even if unpickling raises.
# NOTE(review): pickle can execute arbitrary code while loading; only read
# dump files that were produced by a trusted run of this project.
with open('dnnclim.dat', 'rb') as infile:
    climdata2 = pickle.load(infile)
dict_keys(['fld', 'gmean'])
# Round-trip check on the training fields: compare the in-memory value with
# the one reloaded from the dump file and reduce the comparison with .all().
# (Presumably both are NumPy arrays, so this is True only when every element
# matches -- confirm.)
fld_in_memory = climdata['train']['fld']
fld_reloaded = climdata2['train']['fld']
(fld_in_memory == fld_reloaded).all()