Initialise parameter storage and output buffers for the block
| Type | Intent | Optional | Attributes | | Name | Description |
|---|---|---|---|---|---|---|
| class(orthogonal_nop_block_type), | intent(inout) | | | :: | this | Layer instance to initialise |
| integer, | intent(in), | | dimension(:) | :: | input_shape | Input shape used to infer num_inputs |
| integer, | intent(in), | optional | | :: | verbose | Verbosity level |
subroutine init_ono(this, input_shape, verbose)
  !! Initialise parameter storage and output buffers for the block
  !!
  !! Sets the layer shapes, allocates the three weight parameters (plus an
  !! optional bias), initialises them through the layer's kernel and bias
  !! initialisers, and resets the output buffers.
  implicit none

  ! Arguments
  class(orthogonal_nop_block_type), intent(inout) :: this
  !! Layer instance to initialise
  integer, dimension(:), intent(in) :: input_shape
  !! Input shape used to infer num_inputs
  integer, optional, intent(in) :: verbose
  !! Verbosity level

  ! Local variables
  integer :: num_inputs
  !! Effective fan-in size used for initialisation
  integer :: verbose_
  !! Effective verbosity level

  ! Assign the default here rather than in the declaration: an initialiser
  ! on a local implies SAVE, so a verbosity passed to one call would leak
  ! into later calls that omit the argument.
  ! NOTE(review): verbose_ is not read again in this routine.
  verbose_ = 0
  if(present(verbose)) verbose_ = verbose


  !---------------------------------------------------------------------------
  ! Set shapes
  !---------------------------------------------------------------------------
  ! input_shape is only applied when the layer has no shape stored yet
  if(.not.allocated(this%input_shape)) call this%set_shape(input_shape)
  this%num_inputs = this%input_shape(1)
  this%output_shape = [this%num_outputs]
  this%num_params = this%get_num_params()


  !---------------------------------------------------------------------------
  ! Allocate learnable parameters
  !
  !   params(1): R  spectral mixing        [num_basis  x num_basis]
  !   params(2): B  basis weights          [num_inputs x num_basis]
  !   params(3): W  bypass/output weights  [num_outputs x num_inputs]
  !   params(4): b  bias                   [num_outputs]  (optional)
  !---------------------------------------------------------------------------
  allocate(this%weight_shape(2,3))
  this%weight_shape(:,1) = [ this%num_basis, this%num_basis ]
  this%weight_shape(:,2) = [ this%num_inputs, this%num_basis ]
  this%weight_shape(:,3) = [ this%num_outputs, this%num_inputs ]

  if(this%use_bias)then
     this%bias_shape = [ this%num_outputs ]
     allocate(this%params(4))
  else
     allocate(this%params(3))
  end if

  ! Fan-in passed to the W and bias initialisers; one larger when a bias
  ! is used
  num_inputs = this%num_inputs
  if(this%use_bias) num_inputs = this%num_inputs + 1

  ! R: spectral mixing weights
  call this%params(1)%allocate([this%num_basis, this%num_basis, 1])
  call this%params(1)%set_requires_grad(.true.)
  this%params(1)%fix_pointer = .true.
  this%params(1)%is_sample_dependent = .false.
  this%params(1)%is_temporary = .false.

  ! B: basis weights (stored flat for Gram-Schmidt, but allocated shaped)
  call this%params(2)%allocate([this%num_inputs, this%num_basis, 1])
  call this%params(2)%set_requires_grad(.true.)
  this%params(2)%fix_pointer = .true.
  this%params(2)%is_sample_dependent = .false.
  this%params(2)%is_temporary = .false.

  ! W: bypass/output weights
  call this%params(3)%allocate([this%num_outputs, this%num_inputs, 1])
  call this%params(3)%set_requires_grad(.true.)
  this%params(3)%fix_pointer = .true.
  this%params(3)%is_sample_dependent = .false.
  this%params(3)%is_temporary = .false.

  ! b: bias (only present when use_bias is set)
  if(this%use_bias)then
     call this%params(4)%allocate([this%bias_shape, 1])
     call this%params(4)%set_requires_grad(.true.)
     this%params(4)%fix_pointer = .true.
     this%params(4)%is_sample_dependent = .false.
     this%params(4)%is_temporary = .false.
  end if


  !---------------------------------------------------------------------------
  ! Initialise learnable parameters
  !---------------------------------------------------------------------------
  call this%kernel_init%initialise( &
       this%params(1)%val(:,1), &
       fan_in = this%num_basis, fan_out = this%num_basis, &
       spacing = [ this%num_basis ] &
  )
  call this%kernel_init%initialise( &
       this%params(2)%val(:,1), &
       fan_in = this%num_inputs, fan_out = this%num_basis, &
       spacing = [ this%num_inputs ] &
  )
  call this%kernel_init%initialise( &
       this%params(3)%val(:,1), &
       fan_in = num_inputs, fan_out = this%num_outputs, &
       spacing = [ this%num_outputs ] &
  )
  if(this%use_bias)then
     call this%bias_init%initialise( &
          this%params(4)%val(:,1), &
          fan_in = num_inputs, fan_out = this%num_outputs &
     )
  end if


  !---------------------------------------------------------------------------
  ! Allocate output arrays
  !---------------------------------------------------------------------------
  ! Drop any existing output buffer before allocating a fresh 1x1 one
  if(allocated(this%output)) deallocate(this%output)
  allocate(this%output(1,1))
  if(this%z(1)%allocated) call this%z(1)%deallocate()

end subroutine init_ono