mirror of
https://github.com/hpcaitech/ColossalAI.git
synced 2025-07-08 21:03:16 +00:00
[NFC] polish colossalai/kernel/cuda_native/csrc/kernels/include/cross_entropy_layer.h code style (#957)
This commit is contained in:
parent
0e922da874
commit
1dc1b6fa00
@ -8,8 +8,9 @@
|
|||||||
|
|
||||||
#include "cuda_util.h"
|
#include "cuda_util.h"
|
||||||
|
|
||||||
template <typename T> class CrossEntropyLayer {
|
template <typename T>
|
||||||
public:
|
class CrossEntropyLayer {
|
||||||
|
public:
|
||||||
CrossEntropyLayer(float epsilon, int padding_idx, int max_batch_tokens);
|
CrossEntropyLayer(float epsilon, int padding_idx, int max_batch_tokens);
|
||||||
|
|
||||||
virtual ~CrossEntropyLayer();
|
virtual ~CrossEntropyLayer();
|
||||||
@ -22,7 +23,7 @@ public:
|
|||||||
|
|
||||||
void set_cur_batch_shape(int batch_size, int seq_len, int vocab_size);
|
void set_cur_batch_shape(int batch_size, int seq_len, int vocab_size);
|
||||||
|
|
||||||
private:
|
private:
|
||||||
void allocate_mem_buffer() {
|
void allocate_mem_buffer() {
|
||||||
// allocate local gpu memory
|
// allocate local gpu memory
|
||||||
_loss_buffer = cuda_malloc<float>(_max_batch_tokens * 2);
|
_loss_buffer = cuda_malloc<float>(_max_batch_tokens * 2);
|
||||||
|
Loading…
Reference in New Issue
Block a user