Skip to content

Commit

Permalink
BCReader module implemented, rebased
Browse files Browse the repository at this point in the history
  • Loading branch information
juliasloan25 committed Dec 12, 2022
1 parent b230014 commit c123e61
Show file tree
Hide file tree
Showing 15 changed files with 1,123 additions and 170 deletions.
11 changes: 11 additions & 0 deletions .buildkite/pipeline.yml
Original file line number Diff line number Diff line change
Expand Up @@ -77,6 +77,17 @@ steps:
slurm_nodes: 3
slurm_tasks_per_node: 1

- label: "MPI BCReader unit tests"
key: "bcreader_mpi_tests"
command: "mpiexec julia --color=yes --project=test/ test/mpi_tests/bcreader_mpi_tests.jl"
timeout_in_minutes: 20
env:
CLIMACORE_DISTRIBUTED: "MPI"
agents:
config: cpu
queue: central
slurm_nodes: 3
slurm_tasks_per_node: 1

- group: "Integration Tests"
steps:
Expand Down
2 changes: 1 addition & 1 deletion docs/make.jl
Original file line number Diff line number Diff line change
Expand Up @@ -57,7 +57,7 @@ experiment_pages = [
"AMIP" => map(s -> "generated/amip/$(s)", readdir(joinpath(@__DIR__, "src/generated/amip"))),
]
interface_pages =
["couplerstate.md", "timestepping.md", "regridder.md", "conservation.md", "utilities.md", "testhelper.md"]
["couplerstate.md", "timestepping.md", "regridder.md", "conservation.md", "utilities.md", "bcreader.md", "testhelper.md"]

pages = Any["Home" => "index.md", "Examples" => experiment_pages, "Coupler Interface" => interface_pages]

Expand Down
23 changes: 23 additions & 0 deletions docs/src/bcreader.md
Original file line number Diff line number Diff line change
@@ -0,0 +1,23 @@
# BCReader

This module coordinates reading of boundary conditions from NetCDF files,
as well as regridding calls and temporal interpolations from
monthly to daily intervals.

## BCReader API

```@docs
ClimaCoupler.BCReader.BCFileInfo
ClimaCoupler.BCReader.bcfile_info_init
ClimaCoupler.BCReader.update_midmonth_data!
ClimaCoupler.BCReader.next_date_in_file
ClimaCoupler.BCReader.interpolate_midmonth_to_daily
```


## BCReader Internal Functions

```@docs
ClimaCoupler.BCReader.no_scaling
ClimaCoupler.BCReader.interpol
```
309 changes: 309 additions & 0 deletions src/BCReader.jl
Original file line number Diff line number Diff line change
@@ -0,0 +1,309 @@
#=
BCReader
This module coordinates reading of boundary conditions from NetCDF files,
as well as regridding calls and temporal interpolations from
monthly to daily intervals.
=#
module BCReader

using ..Utilities, ..Regridder, ..CallbackManager
using ClimaCore: Fields
using ClimaComms
using Dates
using JLD2

export BCFileInfo, bcfile_info_init, update_midmonth_data!, next_date_in_file, interpolate_midmonth_to_daily


"""
BCFileInfo
Stores information specific to each boundary condition from a file and each variable.
# Inputs
FT::F # float type
bcfile_dir::b # directory of the BC file
comms_ctx::X # communication context used for MPI
hd_outfile_root::S # filename root for regridded data
varname::V # name of the variable
all_dates::D # vector of all dates contained in the original data file
segment_idx::Vector{Int} # index of the monthly data in the file
segment_idx0::Vector{Int} # `segment_idx` of the file data that is closest to date0
monthly_fields::C # tuple of the two monthly fields, that will be used for the daily interpolation
segment_length::Vector{Int} # length of each month segment (used in the daily interpolation)
scaling_function::O # function that scales, offsets or transforms the raw variable
interpolate_daily::Bool # switch to trigger daily interpolation
land_mask::M # mask with 1 = land, 0 = ocean / sea-ice
"""
struct BCFileInfo{F, B, X, S, V, D, C, O, M}
FT::F
bcfile_dir::B
comms_ctx::X
hd_outfile_root::S
varname::V
all_dates::D
segment_idx::Vector{Int}
segment_idx0::Vector{Int}
monthly_fields::C
segment_length::Vector{Int}
scaling_function::O
interpolate_daily::Bool
land_mask::M
end

"""
no_scaling(field, bcf_info)
Remap the values of a field onto the space of the
BCFileInfo's land_mask without scaling.
# Arguments
- `field`: [Fields.Field] contains the values to be remapped.
- `bcf_info`: [BCFileInfo] contains a land_mask to remap onto the space of.
"""
no_scaling(field::Fields.Field, bcf_info::BCFileInfo) = Utilities.swap_space!(field, axes(bcf_info.land_mask))

"""
bcfile_info_init(
FT,
datafile_rll,
varname,
boundary_space;
comms_ctx = ClimaComms.SingletonCommsContext(),
interpolate_daily = false,
segment_idx0 = nothing,
scaling_function = no_scaling,
land_mask = nothing,
date0 = nothing,
mono = true,
)
Regrids from lat-lon grid to cgll grid, saving the output in a new file,
and returns the info packaged in a single struct.
# Arguments
- `FT`: [DataType] Float type.
- `bcfile_dir`: [String] directory the BC file is stored in.
- `datafile_rll`: [String] file containing data to regrid.
- `varname`: [String] name of the variable to be regridded.
- `boundary_space`: [Spaces.AbstractSpace] the space to which we are mapping.
- `comms_ctx`: [ClimaComms.AbstractCommsContext] context used for this operation.
- `interpolate_daily`: [Bool] switch to trigger daily interpolation.
- `segment_idx0`: [Vector{Int}] index of the file data that is closest to date0.
- `scaling function`: [Function] scales, offsets or transforms `varname`.
- `land_mask`: [Fields.field] mask with 1 = land, 0 = ocean / sea-ice.
- `date0`: [Dates.DateTime] start date of the file data.
- `mono`: [Bool] flag for monotone remapping of `datafile_rll`.
# Returns
- BCFileInfo
"""
function bcfile_info_init(
FT,
bcfile_dir,
datafile_rll,
varname,
boundary_space;
comms_ctx = ClimaComms.SingletonCommsContext(),
interpolate_daily = false,
segment_idx0 = nothing,
scaling_function = no_scaling,
land_mask = nothing,
date0 = nothing,
mono = true,
)

# regrid all times and save to hdf5 files
hd_outfile_root = varname * "_cgll"
if ClimaComms.iamroot(comms_ctx)
Regridder.hdwrite_regridfile_rll_to_cgll(
FT,
bcfile_dir,
datafile_rll,
varname,
boundary_space;
hd_outfile_root = hd_outfile_root,
mono = mono,
)
end
ClimaComms.barrier(comms_ctx)
data_dates = JLD2.load(joinpath(bcfile_dir, hd_outfile_root * "_times.jld2"), "times")

# init time tracking info
current_fields = Fields.zeros(FT, boundary_space), Fields.zeros(FT, boundary_space)
segment_length = [Int(0)]

# unless the start file date is specified, find the closest one to the start date
segment_idx0 =
segment_idx0 != nothing ? segment_idx0 :
[
argmin(
abs.(
parse(FT, CallbackManager.datetime_to_strdate(date0)) .-
parse.(FT, CallbackManager.datetime_to_strdate.(data_dates[:]))
),
),
]

return BCFileInfo(
FT,
bcfile_dir,
comms_ctx,
hd_outfile_root,
varname,
data_dates,
deepcopy(segment_idx0),
segment_idx0,
current_fields,
segment_length,
scaling_function,
interpolate_daily,
land_mask,
)
end

# IO - monthly
"""
update_midmonth_data!(date, bcf_info)
Extracts boundary condition data from regridded (to model grid) NetCDF files.
The times for which data is extracted depends on the specifications in the
`bcf_info` struct).
# Arguments
- `date`: [Dates.DateTime] start date for data.
- `bcf_info`: [BCFileInfo] containing boundary condition data.
"""
function update_midmonth_data!(date, bcf_info::BCFileInfo)
# monthly count
(; FT, bcfile_dir, comms_ctx, hd_outfile_root, varname, all_dates, scaling_function) = bcf_info
midmonth_idx = bcf_info.segment_idx[1]
midmonth_idx0 = bcf_info.segment_idx0[1]

if (midmonth_idx == midmonth_idx0) && (Dates.days(date - all_dates[midmonth_idx]) < 0) # for init
midmonth_idx = bcf_info.segment_idx[1] -= Int(1)
midmonth_idx = midmonth_idx < Int(1) ? midmonth_idx + Int(1) : midmonth_idx
@warn "this time period is before BC data - using file from $(all_dates[midmonth_idx0])"
bcf_info.monthly_fields[1] .= scaling_function(
Regridder.read_from_hdf5(bcfile_dir, hd_outfile_root, all_dates[Int(midmonth_idx0)], varname, comms_ctx),
bcf_info,
)
bcf_info.monthly_fields[2] .= deepcopy(bcf_info.monthly_fields[1])
bcf_info.segment_length .= Int(0)

elseif Dates.days(date - all_dates[end - 1]) > 0 # for fini
@warn "this time period is after BC data - using file from $(all_dates[end - 1])"
bcf_info.monthly_fields[1] .= scaling_function(
Regridder.read_from_hdf5(
bcfile_dir,
hd_outfile_root,
all_dates[Int(length(all_dates))],
varname,
comms_ctx,
),
bcf_info,
)
bcf_info.monthly_fields[2] .= deepcopy(bcf_info.monthly_fields[1])
bcf_info.segment_length .= Int(0)

# throw error when there are closer initial indices for the bc file data that matches this date0
elseif Dates.days(date - all_dates[Int(midmonth_idx + 1)]) > 2
nearest_idx = argmin(
abs.(
parse(FT, CallbackManager.datetime_to_strdate(date)) .-
parse.(FT, CallbackManager.datetime_to_strdate.(all_dates[:]))
),
)
# TODO test this
bcf_info.segment_idx[1] = midmonth_idx = midmonth_idx0 = nearest_idx
@warn "init data does not correspond to start date. Initializing with `SIC_info.segment_idx[1] = midmonth_idx = midmonth_idx0 = $nearest_idx` for this start date"

# date crosses to the next month
elseif Dates.days(date - all_dates[Int(midmonth_idx)]) > 0
midmonth_idx = bcf_info.segment_idx[1] += Int(1)
@warn "On $date updating monthly data files: mid-month dates = [ $(all_dates[Int(midmonth_idx)]) , $(all_dates[Int(midmonth_idx+1)]) ]"
bcf_info.segment_length .= (all_dates[Int(midmonth_idx + 1)] - all_dates[Int(midmonth_idx)]).value
bcf_info.monthly_fields[1] .= scaling_function(
Regridder.read_from_hdf5(bcfile_dir, hd_outfile_root, all_dates[Int(midmonth_idx)], varname, comms_ctx),
bcf_info,
)
bcf_info.monthly_fields[2] .= scaling_function(
Regridder.read_from_hdf5(bcfile_dir, hd_outfile_root, all_dates[Int(midmonth_idx + 1)], varname, comms_ctx),
bcf_info,
)

else
throw(ErrorException("Check boundary file specification"))
end
end

"""
next_date_in_file(bcf_info)
Returns the next date stored in the file `bcfile_info` struct after the
current date index given by `segment_idx`.
Note: this function does not update `segment_idx`, so repeated calls will
return the same value unless `segment_idx` is modified elsewhere in between.
# Arguments
- `bcf_info`: [BCFileInfo] containing the date information.
# Returns
- Dates.DateTime
"""
next_date_in_file(bcf_info::BCFileInfo) = bcf_info.all_dates[bcf_info.segment_idx[1] + Int(1)]

# IO - daily
"""
interpolate_midmonth_to_daily(FT, date, bcf_info::BCFileInfo)
Interpolates linearly between two `Fields` in the `bcf_info` struct,
or returns the first Field if interpolation is switched off.
# Arguments
- `FT`: [DataType] Float type.
- `date`: [Dates.DateTime] start date for data.
- `bcf_info`: [BCFileInfo] contains fields to be interpolated.
# Returns
- Fields.field
"""
function interpolate_midmonth_to_daily(FT, date, bcf_info::BCFileInfo)
if bcf_info.interpolate_daily && bcf_info.segment_length[1] > FT(0)
(; segment_length, segment_idx, all_dates, monthly_fields) = bcf_info

return interpol.(
monthly_fields[1],
monthly_fields[2],
FT((date - all_dates[Int(segment_idx[1])]).value),
FT(segment_length[1]),
)
else
return bcf_info.monthly_fields[1]
end
end

"""
interpol(f1::FT, f2::FT, Δt_tt1::FT, Δt_t2t1::FT)
Performs linear interpolation of `f` at time `t` within
a segment `Δt_t2t1 = (t2 - t1)`, of fields `f1` and `f2`, with `t2 > t1`.
# Arguments
- `f1`: [FT] first value to be interpolated (`f(t1) = f1`).
- `f2`: [FT] second value to be interpolated.
- `Δt_tt1`: [FT] time between `t1` and some `t` (`Δt_tt1 = (t - t1)`).
- `Δt_t2t1`: [FT] time between `t1` and `t2`.
# Returns
- FT
"""
function interpol(f1::FT, f2::FT, Δt_tt1::FT, Δt_t2t1::FT) where {FT}
@assert Δt_t2t1 > FT(0) "t2 must be > t1, but `Δt_t2t1` = $Δt_t2t1"
interp_fraction = Δt_tt1 / Δt_t2t1
@assert abs(interp_fraction) <= FT(1) "time interpolation weights must be <= 1, but `interp_fraction` = $interp_fraction"
return f1 * interp_fraction + f2 * (FT(1) - interp_fraction)
end

end
Loading

0 comments on commit c123e61

Please sign in to comment.