auto_policy.py
|
[FP8] rebase main (#5963)
|
2024-08-06 16:29:37 +08:00 |
base_policy.py
|
[Feature] Zigzag Ring attention (#5905)
|
2024-08-16 13:56:38 +08:00 |
bert.py
|
[fp8] support hybrid parallel plugin (#5982)
|
2024-08-12 18:17:05 +08:00 |
blip2.py
|
[fp8] support hybrid parallel plugin (#5982)
|
2024-08-12 18:17:05 +08:00 |
bloom.py
|
[fp8] support hybrid parallel plugin (#5982)
|
2024-08-12 18:17:05 +08:00 |
chatglm2.py
|
[fp8] support hybrid parallel plugin (#5982)
|
2024-08-12 18:17:05 +08:00 |
command.py
|
merge
|
2024-08-17 09:34:18 +00:00 |
deepseek.py
|
[Feature] Zigzag Ring attention (#5905)
|
2024-08-16 13:56:38 +08:00 |
falcon.py
|
[fp8] support hybrid parallel plugin (#5982)
|
2024-08-12 18:17:05 +08:00 |
gpt2.py
|
[fp8] support hybrid parallel plugin (#5982)
|
2024-08-12 18:17:05 +08:00 |
gptj.py
|
[fp8] support hybrid parallel plugin (#5982)
|
2024-08-12 18:17:05 +08:00 |
llama.py
|
merge
|
2024-08-17 09:34:18 +00:00 |
mistral.py
|
merge
|
2024-08-17 09:34:18 +00:00 |
mixtral.py
|
merge
|
2024-08-17 09:34:18 +00:00 |
opt.py
|
[fp8] support hybrid parallel plugin (#5982)
|
2024-08-12 18:17:05 +08:00 |
qwen2.py
|
merge
|
2024-08-17 09:34:18 +00:00 |
sam.py
|
[fp8] support hybrid parallel plugin (#5982)
|
2024-08-12 18:17:05 +08:00 |
t5.py
|
[fp8] support hybrid parallel plugin (#5982)
|
2024-08-12 18:17:05 +08:00 |
vit.py
|
[fp8] support hybrid parallel plugin (#5982)
|
2024-08-12 18:17:05 +08:00 |
whisper.py
|
[fp8] support hybrid parallel plugin (#5982)
|
2024-08-12 18:17:05 +08:00 |