__init__.py
|
Merge develop to main (#233)
|
2023-08-24 22:03:04 +08:00 |
embedding.py
|
merge upstream/develop into feature_add_moe
|
2023-09-11 16:20:08 +08:00 |
linear.py
|
feat(linear): optimize mlp by using jit (#321)
|
2023-09-19 14:57:43 +08:00 |
loss.py
|
initial commit
|
2023-07-06 12:55:23 +08:00 |
metrics.py
|
merge upstream/develop into feature_add_moe
|
2023-09-11 16:20:08 +08:00 |
modeling_internlm.py
|
refactor code
|
2023-09-21 11:51:17 +08:00 |
moe.py
|
refactor code
|
2023-09-22 11:47:05 +08:00 |
multi_head_attention.py
|
Merge develop to main (#233)
|
2023-08-24 22:03:04 +08:00 |
norm.py
|
Merge develop to main (#233)
|
2023-08-24 22:03:04 +08:00 |
utils.py
|
merge Internlm/develop into feature_add_moe
|
2023-09-19 17:44:12 +08:00 |