ColossalAI/colossalai/kernel/cuda_native/csrc/kernels/include/softmax.h

#pragma once

#include <cuda.h>
#include <cuda_fp16.h>
#include <stdio.h>

#include <fstream>

#include "kernels.h"

using namespace std;

template <typename T>
class Softmax {
 public:
  struct Config {
    size_t nhead;
    Config(size_t nhead) : nhead(nhead) {}
  };

  Softmax(Config config) : config_(config) {}

  ~Softmax() {}

  // Applies (optionally causally masked) attention softmax in place on
  // `vals`, which holds the [batch_size, nhead, from_len, to_len]
  // attention scores.
  void Forward(T *vals, const T *attn_mask, int batch_size, int from_len,
               int to_len, cudaStream_t &stream, bool mask_future = true) {
    launch_attn_softmax<T>(vals, attn_mask, batch_size, config_.nhead,
                           from_len, to_len, mask_future, stream);
  }

  // Computes the softmax gradient in place on `out_grad`, using the saved
  // forward output `soft_out`; the grid is flattened to
  // batch_size * nhead * from_len rows of to_len elements each.
  void Backward(T *out_grad, const T *soft_out, int batch_size, int from_len,
                int to_len, cudaStream_t stream) {
    launch_attn_softmax_bw<T>(out_grad, soft_out,
                              batch_size * config_.nhead * from_len, to_len,
                              stream);
  }

  void reset_size(size_t nhead) { config_.nhead = nhead; }

 private:
  Config config_;
};
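
A minimal usage sketch follows. It assumes `scores` and `mask` are device pointers whose layout matches what the `launch_attn_softmax*` kernels declared in kernels.h expect (scores as [batch_size, nhead, from_len, to_len]); the helper function name and its parameters are illustrative, not part of the header.

```cpp
#include "softmax.h"

// Hypothetical helper: runs the in-place masked attention softmax on a
// buffer of raw attention scores already resident on the GPU.
void run_attn_softmax(float *scores, const float *mask, int batch_size,
                      int nhead, int from_len, int to_len,
                      cudaStream_t stream) {
  Softmax<float>::Config config(nhead);
  Softmax<float> softmax(config);

  // In-place softmax over the last (to_len) dimension of `scores`.
  // mask_future defaults to true, so future positions are masked out
  // (causal attention).
  softmax.Forward(scores, mask, batch_size, from_len, to_len, stream);
}
```

In the backward pass, `Backward` would be called analogously with the upstream gradient and the saved softmax output; because both kernels operate in place, no extra workspace allocation is needed, which is presumably why the wrapper holds no state beyond `config_`.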