|
__init__.py
|
Merge develop to main (#233)
|
2023-08-24 22:03:04 +08:00 |
|
embedding.py
|
merge upstream/develop into feature_add_moe
|
2023-09-11 16:20:08 +08:00 |
|
linear.py
|
feat(linear): optimize mlp by using jit (#321)
|
2023-09-19 14:57:43 +08:00 |
|
loss.py
|
initial commit
|
2023-07-06 12:55:23 +08:00 |
|
metrics.py
|
merge upstream/develop into feature_add_moe
|
2023-09-11 16:20:08 +08:00 |
|
moe.py
|
refactor code
|
2023-09-19 12:30:40 +08:00 |
|
multi_head_attention.py
|
Merge develop to main (#233)
|
2023-08-24 22:03:04 +08:00 |
|
norm.py
|
Merge develop to main (#233)
|
2023-08-24 22:03:04 +08:00 |
|
utils.py
|
merge Internlm/develop into feature_add_moe
|
2023-09-19 17:44:12 +08:00 |