bert.py
|
[fp8] support hybrid parallel plugin (#5982)
|
2024-08-12 18:17:05 +08:00 |
bloom.py
|
[fp8] support hybrid parallel plugin (#5982)
|
2024-08-12 18:17:05 +08:00 |
chatglm2.py
|
merge
|
2024-08-17 09:34:18 +00:00 |
command.py
|
merge
|
2024-08-17 09:34:18 +00:00 |
deepseek.py
|
merge
|
2024-08-17 09:34:18 +00:00 |
gpt2.py
|
[fp8] support hybrid parallel plugin (#5982)
|
2024-08-12 18:17:05 +08:00 |
gptj.py
|
[fp8] support hybrid parallel plugin (#5982)
|
2024-08-12 18:17:05 +08:00 |
llama.py
|
merge
|
2024-08-17 09:34:18 +00:00 |
mistral.py
|
[FP8] rebase main (#5963)
|
2024-08-06 16:29:37 +08:00 |
mixtral.py
|
merge
|
2024-08-17 09:34:18 +00:00 |
opt.py
|
[FP8] rebase main (#5963)
|
2024-08-06 16:29:37 +08:00 |
qwen2.py
|
[fp8] support hybrid parallel plugin (#5982)
|
2024-08-12 18:17:05 +08:00 |
sam.py
|
[shardformer]delete xformers (#5859)
|
2024-06-28 11:20:04 +08:00 |