TensorRT-LLMs/_sources/llm-api/reference.rst.txt
2025-09-04 03:19:11 +00:00

310 lines
8.0 KiB
ReStructuredText

API Reference
-------------
.. autoclass:: tensorrt_llm.llmapi.LLM
   :members:
   :undoc-members:
   :show-inheritance:
   :special-members: __init__
   :member-order: groupwise
   :inherited-members:

.. autoclass:: tensorrt_llm.llmapi.MultimodalEncoder
   :members:
   :undoc-members:
   :show-inheritance:
   :special-members: __init__
   :member-order: groupwise
   :inherited-members:

.. autoclass:: tensorrt_llm.llmapi.CompletionOutput
   :members:
   :undoc-members:
   :show-inheritance:
   :special-members: __init__
   :member-order: groupwise
   :inherited-members:

.. autoclass:: tensorrt_llm.llmapi.RequestOutput
   :members:
   :undoc-members:
   :show-inheritance:
   :special-members: __init__
   :member-order: groupwise
   :inherited-members:

.. autoclass:: tensorrt_llm.llmapi.GuidedDecodingParams
   :members:
   :undoc-members:
   :show-inheritance:
   :special-members: __init__
   :member-order: groupwise
   :inherited-members:

.. autoclass:: tensorrt_llm.llmapi.SamplingParams
   :members:
   :undoc-members:
   :show-inheritance:
   :special-members: __init__
   :member-order: groupwise
   :inherited-members:

.. autoclass:: tensorrt_llm.llmapi.DisaggregatedParams
   :members:
   :undoc-members:
   :show-inheritance:
   :special-members: __init__
   :member-order: groupwise
   :inherited-members:

.. autoclass:: tensorrt_llm.llmapi.KvCacheConfig
   :members:
   :undoc-members:
   :show-inheritance:
   :special-members: __init__
   :member-order: groupwise
   :inherited-members:

.. autoclass:: tensorrt_llm.llmapi.KvCacheRetentionConfig
   :members:
   :undoc-members:
   :show-inheritance:
   :special-members: __init__
   :member-order: groupwise
   :inherited-members:

.. autoclass:: tensorrt_llm.llmapi.CudaGraphConfig
   :members:
   :undoc-members:
   :show-inheritance:
   :special-members: __init__
   :member-order: groupwise
   :inherited-members:

.. autoclass:: tensorrt_llm.llmapi.MoeConfig
   :members:
   :undoc-members:
   :show-inheritance:
   :special-members: __init__
   :member-order: groupwise
   :inherited-members:

.. autoclass:: tensorrt_llm.llmapi.LookaheadDecodingConfig
   :members:
   :undoc-members:
   :show-inheritance:
   :special-members: __init__
   :member-order: groupwise
   :inherited-members:

.. autoclass:: tensorrt_llm.llmapi.MedusaDecodingConfig
   :members:
   :undoc-members:
   :show-inheritance:
   :special-members: __init__
   :member-order: groupwise
   :inherited-members:

.. autoclass:: tensorrt_llm.llmapi.EagleDecodingConfig
   :members:
   :undoc-members:
   :show-inheritance:
   :special-members: __init__
   :member-order: groupwise
   :inherited-members:

.. autoclass:: tensorrt_llm.llmapi.MTPDecodingConfig
   :members:
   :undoc-members:
   :show-inheritance:
   :special-members: __init__
   :member-order: groupwise
   :inherited-members:

.. autoclass:: tensorrt_llm.llmapi.SchedulerConfig
   :members:
   :undoc-members:
   :show-inheritance:
   :special-members: __init__
   :member-order: groupwise
   :inherited-members:

.. autoclass:: tensorrt_llm.llmapi.CapacitySchedulerPolicy
   :members:
   :undoc-members:
   :show-inheritance:
   :special-members: __init__
   :member-order: groupwise
   :inherited-members:

.. autoclass:: tensorrt_llm.llmapi.BuildConfig
   :members:
   :undoc-members:
   :show-inheritance:
   :special-members: __init__
   :member-order: groupwise
   :inherited-members:

.. autoclass:: tensorrt_llm.llmapi.QuantConfig
   :members:
   :undoc-members:
   :show-inheritance:
   :special-members: __init__
   :member-order: groupwise
   :inherited-members:

.. autoclass:: tensorrt_llm.llmapi.QuantAlgo
   :members:
   :undoc-members:
   :show-inheritance:
   :special-members: __init__
   :member-order: groupwise
   :inherited-members:

.. autoclass:: tensorrt_llm.llmapi.CalibConfig
   :members:
   :undoc-members:
   :show-inheritance:
   :special-members: __init__
   :member-order: groupwise
   :inherited-members:

.. autoclass:: tensorrt_llm.llmapi.BuildCacheConfig
   :members:
   :undoc-members:
   :show-inheritance:
   :special-members: __init__
   :member-order: groupwise
   :inherited-members:

.. autoclass:: tensorrt_llm.llmapi.RequestError
   :members:
   :undoc-members:
   :show-inheritance:
   :special-members: __init__
   :member-order: groupwise
   :inherited-members:

.. autoclass:: tensorrt_llm.llmapi.MpiCommSession
   :members:
   :undoc-members:
   :show-inheritance:
   :special-members: __init__
   :member-order: groupwise
   :inherited-members:

.. autoclass:: tensorrt_llm.llmapi.ExtendedRuntimePerfKnobConfig
   :members:
   :undoc-members:
   :show-inheritance:
   :special-members: __init__
   :member-order: groupwise
   :inherited-members:

.. autoclass:: tensorrt_llm.llmapi.BatchingType
   :members:
   :undoc-members:
   :show-inheritance:
   :special-members: __init__
   :member-order: groupwise
   :inherited-members:

.. autoclass:: tensorrt_llm.llmapi.ContextChunkingPolicy
   :members:
   :undoc-members:
   :show-inheritance:
   :special-members: __init__
   :member-order: groupwise
   :inherited-members:

.. autoclass:: tensorrt_llm.llmapi.DynamicBatchConfig
   :members:
   :undoc-members:
   :show-inheritance:
   :special-members: __init__
   :member-order: groupwise
   :inherited-members:

.. autoclass:: tensorrt_llm.llmapi.CacheTransceiverConfig
   :members:
   :undoc-members:
   :show-inheritance:
   :special-members: __init__
   :member-order: groupwise
   :inherited-members:

.. autoclass:: tensorrt_llm.llmapi.NGramDecodingConfig
   :members:
   :undoc-members:
   :show-inheritance:
   :special-members: __init__
   :member-order: groupwise
   :inherited-members:

.. autoclass:: tensorrt_llm.llmapi.UserProvidedDecodingConfig
   :members:
   :undoc-members:
   :show-inheritance:
   :special-members: __init__
   :member-order: groupwise
   :inherited-members:

.. autoclass:: tensorrt_llm.llmapi.TorchCompileConfig
   :members:
   :undoc-members:
   :show-inheritance:
   :special-members: __init__
   :member-order: groupwise
   :inherited-members:

.. autoclass:: tensorrt_llm.llmapi.DraftTargetDecodingConfig
   :members:
   :undoc-members:
   :show-inheritance:
   :special-members: __init__
   :member-order: groupwise
   :inherited-members:

.. autoclass:: tensorrt_llm.llmapi.LlmArgs
   :members:
   :undoc-members:
   :show-inheritance:
   :special-members: __init__
   :member-order: groupwise
   :inherited-members:

.. autoclass:: tensorrt_llm.llmapi.TorchLlmArgs
   :members:
   :undoc-members:
   :show-inheritance:
   :special-members: __init__
   :member-order: groupwise
   :inherited-members:
   :exclude-members: model_extra,model_copy,model_validate_strings,model_dump_json,model_validate,copy,model_fields_set,construct,from_orm,json,model_construct,parse_raw,model_post_init,model_parametrized_name,schema,parse_obj,model_fields,model_validate_json,model_computed_fields,update_forward_refs,dict,model_json_schema,parse_file,model_dump,validate,schema_json,model_rebuild,model_config

.. autoclass:: tensorrt_llm.llmapi.TrtLlmArgs
   :members:
   :undoc-members:
   :show-inheritance:
   :special-members: __init__
   :member-order: groupwise
   :inherited-members:
   :exclude-members: model_extra,model_copy,model_validate_strings,model_dump_json,model_validate,copy,model_fields_set,construct,from_orm,json,model_construct,parse_raw,model_post_init,model_parametrized_name,schema,parse_obj,model_fields,model_validate_json,model_computed_fields,update_forward_refs,dict,model_json_schema,parse_file,model_dump,validate,schema_json,model_rebuild,model_config

.. autoclass:: tensorrt_llm.llmapi.AutoDecodingConfig
   :members:
   :undoc-members:
   :show-inheritance:
   :special-members: __init__
   :member-order: groupwise
   :inherited-members:

.. autoclass:: tensorrt_llm.llmapi.AttentionDpConfig
   :members:
   :undoc-members:
   :show-inheritance:
   :special-members: __init__
   :member-order: groupwise
   :inherited-members:
