Skip to content
GitLab
Explore
Sign in
Primary navigation
Search or go to…
Project
D
DART-WRF-delete_byApril
Manage
Activity
Members
Labels
Plan
Issues
Issue boards
Milestones
Code
Merge requests
Repository
Branches
Commits
Tags
Repository graph
Compare revisions
Deploy
Model registry
Monitor
Service Desk
Analyze
Model experiments
Help
Help
Support
GitLab documentation
Compare GitLab plans
Community forum
Contribute to GitLab
Provide feedback
Terms and privacy
Keyboard shortcuts
?
Snippets
Groups
Projects
Show more breadcrumbs
DataAssimilation
DART-WRF-delete_byApril
Commits
8bbbdb55
Commit
8bbbdb55
authored
2 years ago
by
lkugler
Browse files
Options
Downloads
Plain Diff
Merge branch 'consistent_config' of
https://github.com/lkugler/DART-WRF
into consistent_config
parents
8618022d
5ac75d8f
No related branches found
No related tags found
No related merge requests found
Changes
3
Hide whitespace changes
Inline
Side-by-side
Showing
3 changed files
dartwrf/assim_synth_obs.py
+18
-19
18 additions, 19 deletions
dartwrf/assim_synth_obs.py
dartwrf/obs/create_obsseq_out.py
+11
-1
11 additions, 1 deletion
dartwrf/obs/create_obsseq_out.py
dartwrf/obs/obsseq.py
+87
-9
87 additions, 9 deletions
dartwrf/obs/obsseq.py
with
116 additions
and
29 deletions
dartwrf/assim_synth_obs.py
+
18
−
19
View file @
8bbbdb55
...
@@ -18,30 +18,24 @@ wrfout_format = 'wrfout_d01_%Y-%m-%d_%H:%M:%S'
...
@@ -18,30 +18,24 @@ wrfout_format = 'wrfout_d01_%Y-%m-%d_%H:%M:%S'
def
_prepare_DART_grid_template
():
def
_prepare_DART_grid_template
():
# DART needs a wrfinput file as a template for the grid
# DART needs a wrfinput file as a template for the grid
# No data will be read from this file, but the grid information must match exactly.
# No data will be read from this file, but the grid information must match exactly.
symlink
(
cluster
.
dartrundir
+
"
/prior_ens1/wrfout_d01
"
,
symlink
(
cluster
.
dart
_
rundir
+
"
/prior_ens1/wrfout_d01
"
,
cluster
.
dartrundir
+
"
/wrfinput_d01
"
)
cluster
.
dart
_
rundir
+
"
/wrfinput_d01
"
)
def
_copy_nature_to_dart
(
time
):
def
_copy_nature_to_dart
(
time
):
"""
Copies wrfout_d01 from nature run to DART directory
"""
Copies wrfout_d01 from nature run to DART directory
TODO: This is a bit of a hack, because it is not explicit about where to take the nature from.
"""
"""
# find the file in any init directory
glob_pattern
=
time
.
strftime
(
exp
.
nature_wrfout_pattern
)
# replace time in pattern
fformat
=
'
wrfout_d01_%Y-%m-%d_%H:%M:%S
'
print
(
'
searching for nature in pattern:
'
,
glob_pattern
)
f_nat
=
glob
.
glob
(
cluster
.
archive_base
+
'
/
'
+
exp
.
nature_expname
+
'
/*/1/
'
+
time
.
strftime
(
fformat
))[
0
]
f_nat
=
glob
.
glob
(
glob_pattern
)[
0
]
# find the nature wrfout-file
shutil
.
copy
(
f_nat
,
cluster
.
dart_rundir
+
"
/wrfout_d01
"
)
# DART may need a wrfinput file as well ?!
# check user input
symlink
(
cluster
.
dart_rundir
+
"
/wrfout_d01
"
,
if
not
'
wrfout
'
in
f_nat
.
split
(
'
/
'
)[
-
1
]:
cluster
.
dart_rundir
+
"
/wrfinput_d01
"
)
warnings
.
warn
(
f
+
"
does not contain
'
wrfout
'
in filename, are you sure this is a valid nature file?
"
)
print
(
"
linked
"
,
f_nat
,
"
to
"
,
cluster
.
dart_rundir
+
"
/wrfout_d01
"
)
f_wrfout_nature
=
time
.
strftime
(
exp
.
nature
+
'
/
'
+
wrfout_format
)
# copy nature wrfout to DART directory
assert
os
.
path
.
exists
(
f_
wrfout_
nature
)
shutil
.
copy
(
f_nat
,
cluster
.
dart_rundir
+
"
/
wrfout_
d01
"
)
print
(
"
linking nature to DART & georeferencing
"
)
# add coordinates if necessary
shutil
.
copy
(
f_wrfout_nature
,
cluster
.
dartrundir
+
"
/wrfout_d01
"
)
print
(
"
linked
"
,
f_wrfout_nature
,
"
to
"
,
cluster
.
dartrundir
+
"
/wrfout_d01
"
)
if
cluster
.
geo_em_for_WRF_ideal
:
if
cluster
.
geo_em_for_WRF_ideal
:
wrfout_add_geo
.
run
(
cluster
.
geo_em_for_WRF_ideal
,
cluster
.
dart_rundir
+
"
/wrfout_d01
"
)
wrfout_add_geo
.
run
(
cluster
.
geo_em_for_WRF_ideal
,
cluster
.
dart_rundir
+
"
/wrfout_d01
"
)
...
@@ -53,7 +47,7 @@ def prepare_nature_dart(time):
...
@@ -53,7 +47,7 @@ def prepare_nature_dart(time):
"""
"""
try
:
try
:
_copy_nature_to_dart
(
time
)
_copy_nature_to_dart
(
time
)
except
File
ExistsError
:
# if nature is not available due to any reason
except
(
File
NotFoundError
,
AttributeError
)
as
e
:
# if nature is not available due to any reason
print
(
'
-> has no nature, not copying nature
'
)
print
(
'
-> has no nature, not copying nature
'
)
...
@@ -369,8 +363,13 @@ def get_obsseq_out(time):
...
@@ -369,8 +363,13 @@ def get_obsseq_out(time):
if
exp
.
use_existing_obsseq
!=
False
:
if
exp
.
use_existing_obsseq
!=
False
:
# use an existing obs_seq.out file
# use an existing obs_seq.out file
f_obsseq
=
time
.
strftime
(
exp
.
use_existing_obsseq
)
f_obsseq
=
time
.
strftime
(
exp
.
use_existing_obsseq
)
copy
(
f_obsseq
,
cluster
.
dart_rundir
+
'
/obs_seq.out
'
)
copy
(
f_obsseq
,
cluster
.
dart_rundir
+
'
/obs_seq.out
'
)
# copy to run_DART folder
print
(
f_obsseq
,
'
copied to
'
,
cluster
.
dart_rundir
+
'
/obs_seq.out
'
)
print
(
f_obsseq
,
'
copied to
'
,
cluster
.
dart_rundir
+
'
/obs_seq.out
'
)
# copy to sim_archive
os
.
makedirs
(
cluster
.
archivedir
+
"
/obs_seq_out/
"
,
exist_ok
=
True
)
copy
(
f_obsseq
,
time
.
strftime
(
cluster
.
archivedir
+
'
/obs_seq_out/%Y-%m-%d_%H:%M_obs_seq.out
'
))
oso
=
obsseq
.
ObsSeq
(
cluster
.
dart_rundir
+
"
/obs_seq.out
"
)
# read the obs_seq.out file
oso
=
obsseq
.
ObsSeq
(
cluster
.
dart_rundir
+
"
/obs_seq.out
"
)
# read the obs_seq.out file
else
:
else
:
# do NOT use an existing obs_seq.out file
# do NOT use an existing obs_seq.out file
...
...
This diff is collapsed.
Click to expand it.
dartwrf/obs/create_obsseq_out.py
+
11
−
1
View file @
8bbbdb55
import
os
,
shutil
,
warnings
import
os
,
shutil
,
warnings
from
dartwrf.utils
import
try_remove
,
print
,
shell
from
dartwrf.utils
import
try_remove
,
print
,
shell
,
symlink
import
dartwrf.obs.create_obsseq_in
as
osi
import
dartwrf.obs.create_obsseq_in
as
osi
from
dartwrf.obs
import
obsseq
from
dartwrf.obs
import
obsseq
from
dartwrf.exp_config
import
exp
from
dartwrf.exp_config
import
exp
from
dartwrf.server_config
import
cluster
from
dartwrf.server_config
import
cluster
def
_prepare_DART_grid_template
():
# DART needs a wrfinput file as a template for the grid
# No data will be read from this file, but the grid information must match exactly.
symlink
(
cluster
.
dart_rundir
+
"
/wrfout_d01
"
,
cluster
.
dart_rundir
+
"
/wrfinput_d01
"
)
def
generate_obsseq_out
(
time
):
def
generate_obsseq_out
(
time
):
"""
Generate an obs_seq.out file from the current experiment
"""
Generate an obs_seq.out file from the current experiment
Expects an existing nature file in the cluster.dart_rundir
Args:
Args:
time (datetime): time of the observations
time (datetime): time of the observations
...
@@ -47,6 +55,8 @@ def generate_obsseq_out(time):
...
@@ -47,6 +55,8 @@ def generate_obsseq_out(time):
os
.
makedirs
(
dir_obsseq
,
exist_ok
=
True
)
os
.
makedirs
(
dir_obsseq
,
exist_ok
=
True
)
osi
.
create_obs_seq_in
(
time
,
exp
.
observations
)
osi
.
create_obs_seq_in
(
time
,
exp
.
observations
)
_prepare_DART_grid_template
()
run_perfect_model_obs
()
# generate observation, draws from gaussian
run_perfect_model_obs
()
# generate observation, draws from gaussian
print
(
"
2.1) obs preprocessing
"
)
print
(
"
2.1) obs preprocessing
"
)
...
...
This diff is collapsed.
Click to expand it.
dartwrf/obs/obsseq.py
+
87
−
9
View file @
8bbbdb55
...
@@ -36,6 +36,8 @@ import os, warnings
...
@@ -36,6 +36,8 @@ import os, warnings
import
numpy
as
np
import
numpy
as
np
import
pandas
as
pd
import
pandas
as
pd
missing_value
=
-
888888.0
def
_plot_box
(
m
,
lat
,
lon
,
label
=
""
,
**
kwargs
):
def
_plot_box
(
m
,
lat
,
lon
,
label
=
""
,
**
kwargs
):
""""
Draw bounding box
""""
Draw bounding box
...
@@ -141,6 +143,61 @@ class ObsRecord(pd.DataFrame):
...
@@ -141,6 +143,61 @@ class ObsRecord(pd.DataFrame):
assert
np
.
allclose
(
Hx
.
mean
(
axis
=
1
),
self
[
what
+
'
ensemble mean
'
])
assert
np
.
allclose
(
Hx
.
mean
(
axis
=
1
),
self
[
what
+
'
ensemble mean
'
])
return
Hx
.
values
return
Hx
.
values
def
get_model_grid_indices
(
self
,
wrf_file_with_grid
):
"""
Retrieve the grid indices closest to the observations
Note:
Only the horizontal grid is considered
Args:
wrf_file_with_grid (str): path to wrf file with grid information
Returns:
pd.DataFrame (n_obs, 2) columns: i, j
"""
from
scipy
import
spatial
import
xarray
as
xr
def
find_index_from_coords_tree
(
tree
,
len_latitudes
,
lat
=
45.
,
lon
=
0.
):
"""
Find Lat & Lon indices in array
to find the state space values nearest to the observation
Args:
len_latitudes (int) : usually xlat.shape[0]
actually this could also have to be len of longitudes (i dont know!)
but it works if len(xlon)==len(xlat)
Returns:
ilat, ilon (int)
"""
dd
,
ii
=
tree
.
query
([[
lat
,
lon
],])
ilat
=
int
(
ii
/
len_latitudes
)
ilon
=
int
(
ii
%
len_latitudes
)
return
ilat
,
ilon
# load coordinates of wrf grid
grid
=
xr
.
open_dataset
(
wrf_file_with_grid
)
xlat
=
grid
.
XLAT_M
.
values
.
squeeze
()
xlon
=
grid
.
XLONG_M
.
values
.
squeeze
()
# build search tree
tree
=
spatial
.
KDTree
(
np
.
c_
[
xlat
.
ravel
(),
xlon
.
ravel
()])
# get lat lon of observations
lon_lat
=
self
.
get_lon_lat
()
ilat_ilon
=
np
.
empty
((
len
(
lon_lat
),
2
),
np
.
int32
)
# find indices of observations in wrf grid
for
i
,
row
in
lon_lat
.
iterrows
():
ilat_ilon
[
i
,:]
=
find_index_from_coords_tree
(
tree
,
xlat
.
shape
[
0
],
row
.
lat
,
row
.
lon
)
return
pd
.
DataFrame
(
index
=
self
.
index
,
data
=
dict
(
wrf_i
=
ilat_ilon
[:,
0
],
wrf_j
=
ilat_ilon
[:,
1
]))
def
get_lon_lat
(
self
):
def
get_lon_lat
(
self
):
"""
Retrieve longitude and latitude of observations
"""
Retrieve longitude and latitude of observations
...
@@ -190,21 +247,26 @@ class ObsRecord(pd.DataFrame):
...
@@ -190,21 +247,26 @@ class ObsRecord(pd.DataFrame):
return
nlayers
return
nlayers
def
superob
(
self
,
window_km
):
def
superob
(
self
,
window_km
):
"""
Select subset, average, overwrite existing obs with average
"""
Create super-observations (averaged observations)
TODO: allow different obs types (KIND)
TODO: loc3d overwrite with mean
Metadata is copied from the first obs in a superob-box
Note:
Note:
This routine discards observations (round off)
This routine discards observations (round off)
e.g. 31 obs with 5 obs-window => obs #31 is not processed
e.g. 31 obs with 5 obs-window => obs #31 is not processed.
Metadata is copied from the first observation in a superob-box
The location (loc3d) of new observation is taken from the center observation
TODO: allow different obs types (KIND)
Args:
Args:
window_km (numeric): horizontal window edge length
window_km (numeric): horizontal window edge length
includes obs on edge
includes obs on edge
25x25 km with 5 km obs density
25x25 km with 5 km obs density
= average 5 x 5 observations
= average 5 x 5 observations
Returns:
ObsRecord
"""
"""
def
calc_deg_from_km
(
distance_km
,
center_lat
):
def
calc_deg_from_km
(
distance_km
,
center_lat
):
"""
Approximately calculate distance in degrees from meters
"""
Approximately calculate distance in degrees from meters
...
@@ -264,9 +326,17 @@ class ObsRecord(pd.DataFrame):
...
@@ -264,9 +326,17 @@ class ObsRecord(pd.DataFrame):
out
=
self
.
drop
(
self
.
index
)
# this df will be filled
out
=
self
.
drop
(
self
.
index
)
# this df will be filled
boxes
=
[]
boxes
=
[]
for
i
in
range
(
0
,
nx
+
1
-
win_obs
,
win_obs
):
for
i
in
range
(
0
,
nx
+
1
-
win_obs
,
win_obs
):
# i is the number of observations in x direction
# but in steps of "number of observations in superob window"
# i.e. i = 0, win_obs, 2*win_obs, 3*win_obs, ...
for
j
in
range
(
0
,
nx
+
1
-
win_obs
,
win_obs
):
for
j
in
range
(
0
,
nx
+
1
-
win_obs
,
win_obs
):
# same as i but in y direction
for
k
in
range
(
0
,
nlayers
):
for
k
in
range
(
0
,
nlayers
):
# k is the index of the vertical layer
if
debug
:
print
(
i
,
j
,
k
)
if
debug
:
print
(
i
,
j
,
k
)
# find indices of observations within superob window
# find indices of observations within superob window
...
@@ -301,7 +371,7 @@ class ObsRecord(pd.DataFrame):
...
@@ -301,7 +371,7 @@ class ObsRecord(pd.DataFrame):
# average spread and other values
# average spread and other values
for
key
in
obs_box
:
for
key
in
obs_box
:
if
key
in
[
'
loc3d
'
,
'
kind
'
,
'
metadata
'
,
'
time
'
]:
if
key
in
[
'
loc3d
'
,
'
kind
'
,
'
metadata
'
,
'
time
'
]:
pass
pass
# these parameters are not averaged
elif
'
spread
'
in
key
:
elif
'
spread
'
in
key
:
# stdev of mean of values = sqrt(mean of variances)
# stdev of mean of values = sqrt(mean of variances)
obs_mean
.
at
[
key
]
=
np
.
sqrt
((
obs_box
[
key
]
**
2
).
mean
())
obs_mean
.
at
[
key
]
=
np
.
sqrt
((
obs_box
[
key
]
**
2
).
mean
())
...
@@ -503,8 +573,16 @@ class ObsSeq(object):
...
@@ -503,8 +573,16 @@ class ObsSeq(object):
if
"
kind
"
in
line
:
# find obs kind
if
"
kind
"
in
line
:
# find obs kind
line_kind
=
i
+
1
line_kind
=
i
+
1
# read values like 'observations', 'truth', 'prior ensemble mean'
for
k
,
key
in
enumerate
(
self
.
keys_for_values
):
for
k
,
key
in
enumerate
(
self
.
keys_for_values
):
out
[
key
]
=
float
(
lines
[
1
+
k
].
strip
())
v
=
float
(
lines
[
1
+
k
].
strip
())
# value in obs_seq file
if
v
==
missing_value
:
# e.g. -888888.0
out
[
key
]
=
np
.
nan
else
:
out
[
key
]
=
v
x
,
y
,
z
,
z_coord
=
lines
[
line_loc
].
split
()
x
,
y
,
z
,
z_coord
=
lines
[
line_loc
].
split
()
out
[
"
loc3d
"
]
=
float
(
x
),
float
(
y
),
float
(
z
),
int
(
z_coord
)
out
[
"
loc3d
"
]
=
float
(
x
),
float
(
y
),
float
(
z
),
int
(
z_coord
)
...
...
This diff is collapsed.
Click to expand it.
Preview
0%
Loading
Try again
or
attach a new file
.
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Save comment
Cancel
Please
register
or
sign in
to comment