chain-kernels-ansi.h 2.48 KB
// chain/chain-kernels-ansi.h

// Copyright      2015  Johns Hopkins University (author: Daniel Povey)

// See ../../COPYING for clarification regarding multiple authors
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//  http://www.apache.org/licenses/LICENSE-2.0
//
// THIS CODE IS PROVIDED *AS IS* BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
// KIND, EITHER EXPRESS OR IMPLIED, INCLUDING WITHOUT LIMITATION ANY IMPLIED
// WARRANTIES OR CONDITIONS OF TITLE, FITNESS FOR A PARTICULAR PURPOSE,
// MERCHANTABLITY OR NON-INFRINGEMENT.
// See the Apache 2 License for the specific language governing permissions and
// limitations under the License.


#ifndef KALDI_CHAIN_CHAIN_KERNELS_ANSI_H_
#define KALDI_CHAIN_CHAIN_KERNELS_ANSI_H_
#include "chain/chain-datastruct.h"

#if HAVE_CUDA == 1
extern "C" {

  void cuda_chain_hmm_backward(dim3 Gr, dim3 Bl,
                               const Int32Pair *forward_transitions,
                               const DenominatorGraphTransition *transitions,
                               int32_cuda num_sequences,
                               int32_cuda num_hmm_states,
                               const BaseFloat *probs,
                               int32_cuda prob_stride,
                               const BaseFloat *this_alpha,
                               const BaseFloat *next_beta,
                               BaseFloat *this_beta,
                               BaseFloat *log_prob_deriv,
                               int32_cuda log_prob_deriv_stride);

  void cuda_chain_hmm_forward(dim3 Gr, dim3 Bl,
                              const Int32Pair *backward_transitions,
                              const DenominatorGraphTransition *transitions,
                              int32_cuda num_sequences,
                              int32_cuda num_hmm_states,
                              const BaseFloat *probs,
                              int32_cuda prob_stride,
                              const BaseFloat *prev_alpha,
                              BaseFloat *this_alpha);

  void cuda_penalize_out_of_range(dim3 Gr, dim3 Bl, BaseFloat limit,
                                  BaseFloat scale, const BaseFloat *in_data,
                                  MatrixDim dim, int out_stride,
                                  BaseFloat *out_deriv);


} // extern "C"

#endif  // HAVE_CUDA


#endif  // KALDI_CHAIN_CHAIN_KERNELS_ANSI_H_