..
   TensorRT-LLMs/_sources/llm-api/reference.rst.txt
   2025-06-18 05:57:03 +00:00

   159 lines
   4.3 KiB
   ReStructuredText

API Reference
-------------
.. autoclass:: tensorrt_llm.llmapi.LLM
   :members:
   :undoc-members:
   :special-members: __init__
   :show-inheritance:

.. autoclass:: tensorrt_llm.llmapi.CompletionOutput
   :members:
   :undoc-members:
   :special-members: __init__
   :show-inheritance:

.. autoclass:: tensorrt_llm.llmapi.RequestOutput
   :members:
   :undoc-members:
   :special-members: __init__
   :show-inheritance:

.. autoclass:: tensorrt_llm.llmapi.GuidedDecodingParams
   :members:
   :undoc-members:
   :special-members: __init__
   :show-inheritance:

.. autoclass:: tensorrt_llm.llmapi.SamplingParams
   :members:
   :undoc-members:
   :special-members: __init__
   :show-inheritance:

.. autoclass:: tensorrt_llm.llmapi.DisaggregatedParams
   :members:
   :undoc-members:
   :special-members: __init__
   :show-inheritance:

.. autoclass:: tensorrt_llm.llmapi.KvCacheConfig
   :members:
   :undoc-members:
   :special-members: __init__
   :show-inheritance:

.. autoclass:: tensorrt_llm.llmapi.KvCacheRetentionConfig
   :members:
   :undoc-members:
   :special-members: __init__
   :show-inheritance:

.. autoclass:: tensorrt_llm.llmapi.LookaheadDecodingConfig
   :members:
   :undoc-members:
   :special-members: __init__
   :show-inheritance:

.. autoclass:: tensorrt_llm.llmapi.MedusaDecodingConfig
   :members:
   :undoc-members:
   :special-members: __init__
   :show-inheritance:

.. autoclass:: tensorrt_llm.llmapi.EagleDecodingConfig
   :members:
   :undoc-members:
   :special-members: __init__
   :show-inheritance:

.. autoclass:: tensorrt_llm.llmapi.MTPDecodingConfig
   :members:
   :undoc-members:
   :special-members: __init__
   :show-inheritance:

.. autoclass:: tensorrt_llm.llmapi.SchedulerConfig
   :members:
   :undoc-members:
   :special-members: __init__
   :show-inheritance:

.. autoclass:: tensorrt_llm.llmapi.CapacitySchedulerPolicy
   :members:
   :undoc-members:
   :special-members: __init__
   :show-inheritance:

.. autoclass:: tensorrt_llm.llmapi.BuildConfig
   :members:
   :undoc-members:
   :special-members: __init__
   :show-inheritance:

.. autoclass:: tensorrt_llm.llmapi.QuantConfig
   :members:
   :undoc-members:
   :special-members: __init__
   :show-inheritance:

.. autoclass:: tensorrt_llm.llmapi.QuantAlgo
   :members:
   :undoc-members:
   :special-members: __init__
   :show-inheritance:

.. autoclass:: tensorrt_llm.llmapi.CalibConfig
   :members:
   :undoc-members:
   :special-members: __init__
   :show-inheritance:

.. autoclass:: tensorrt_llm.llmapi.BuildCacheConfig
   :members:
   :undoc-members:
   :special-members: __init__
   :show-inheritance:

.. autoclass:: tensorrt_llm.llmapi.RequestError
   :members:
   :undoc-members:
   :special-members: __init__
   :show-inheritance:

.. autoclass:: tensorrt_llm.llmapi.MpiCommSession
   :members:
   :undoc-members:
   :special-members: __init__
   :show-inheritance:

.. autoclass:: tensorrt_llm.llmapi.ExtendedRuntimePerfKnobConfig
   :members:
   :undoc-members:
   :special-members: __init__
   :show-inheritance:

.. autoclass:: tensorrt_llm.llmapi.BatchingType
   :members:
   :undoc-members:
   :special-members: __init__
   :show-inheritance:

.. autoclass:: tensorrt_llm.llmapi.ContextChunkingPolicy
   :members:
   :undoc-members:
   :special-members: __init__
   :show-inheritance:

.. autoclass:: tensorrt_llm.llmapi.DynamicBatchConfig
   :members:
   :undoc-members:
   :special-members: __init__
   :show-inheritance:

.. autoclass:: tensorrt_llm.llmapi.CacheTransceiverConfig
   :members:
   :undoc-members:
   :special-members: __init__
   :show-inheritance:

.. autoclass:: tensorrt_llm.llmapi.NGramDecodingConfig
   :members:
   :undoc-members:
   :special-members: __init__
   :show-inheritance:

.. autoclass:: tensorrt_llm.llmapi.TorchCompileConfig
   :members:
   :undoc-members:
   :special-members: __init__
   :show-inheritance:

.. autoclass:: tensorrt_llm.llmapi.LlmArgs
   :members:
   :undoc-members:
   :special-members: __init__
   :show-inheritance:

.. autoclass:: tensorrt_llm.llmapi.TorchLlmArgs
   :members:
   :undoc-members:
   :special-members: __init__
   :show-inheritance:

.. autoclass:: tensorrt_llm.llmapi.TrtLlmArgs
   :members:
   :undoc-members:
   :special-members: __init__
   :show-inheritance:
