mirror of https://github.com/hpcaitech/ColossalAI
[doc] add doc
parent
9dec66fad6
commit
633e95b301
|
@ -94,6 +94,7 @@ inference_config = InferenceConfig(
|
|||
max_batch_size=4,
|
||||
max_input_len=1024,
|
||||
max_output_len=512,
|
||||
use_cuda_graph=False, # Turn on if you want to use CUDA Graph to accelerate inference
|
||||
)
|
||||
|
||||
# Step 3: create an engine with model and config
|
||||
|
|
Loading…
Reference in New Issue